diff --git "a/wandb/run-20220322_163235-2yj5gh94/files/wandb-summary.json" "b/wandb/run-20220322_163235-2yj5gh94/files/wandb-summary.json" --- "a/wandb/run-20220322_163235-2yj5gh94/files/wandb-summary.json" +++ "b/wandb/run-20220322_163235-2yj5gh94/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 0.0826, "train/learning_rate": 4.057803468208092e-05, "train/epoch": 4.48, "train/global_step": 2000, "_runtime": 24723, "_timestamp": 1647991478, "_step": 2003, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 4.0, 13.0, 22.0, 41.0, 79.0, 106.0, 142.0, 162.0, 160.0, 89.0, 83.0, 54.0, 20.0, 14.0, 11.0, 5.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8025725483894348, -0.7274086475372314, -0.6522447466850281, -0.5770808458328247, -0.5019170045852661, -0.42675307393074036, -0.3515892028808594, -0.276425302028656, -0.20126140117645264, -0.12609750032424927, -0.05093361437320709, 0.024230271577835083, 0.09939417243003845, 0.17455807328224182, 0.2497219443321228, 0.32488584518432617, 0.40004974603652954, 0.4752136468887329, 0.5503775477409363, 0.6255414485931396, 0.7007052898406982, 0.7758692502975464, 0.851033091545105, 0.9261969923973083, 1.0013608932495117, 1.0765247344970703, 1.1516886949539185, 1.226852536201477, 1.3020164966583252, 1.3771803379058838, 1.4523441791534424, 1.5275081396102905, 1.6026718616485596, 1.6778357028961182, 1.7529996633529663, 1.828163504600525, 1.903327465057373, 1.9784913063049316, 2.0536551475524902, 2.128818988800049, 2.2039830684661865, 2.279146909713745, 2.3543107509613037, 2.4294748306274414, 2.504638671875, 2.5798025131225586, 2.654966354370117, 2.730130195617676, 2.8052940368652344, 2.880457878112793, 2.9556217193603516, 3.0307857990264893, 3.105949640274048, 3.1811134815216064, 3.256277322769165, 3.3314414024353027, 3.4066052436828613, 3.48176908493042, 3.5569329261779785, 3.632097005844116, 3.707260847091675, 3.7824246883392334, 3.857588529586792, 3.9327526092529297, 4.007916450500488]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 6.0, 6.0, 2.0, 7.0, 9.0, 6.0, 12.0, 9.0, 15.0, 21.0, 22.0, 19.0, 39.0, 31.0, 25.0, 29.0, 29.0, 29.0, 33.0, 35.0, 42.0, 49.0, 36.0, 32.0, 41.0, 37.0, 42.0, 35.0, 40.0, 32.0, 29.0, 28.0, 33.0, 19.0, 20.0, 17.0, 14.0, 11.0, 15.0, 16.0, 7.0, 8.0, 5.0, 4.0, 3.0, 5.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7510346174240112, -0.7246689796447754, -0.6983032822608948, -0.6719376444816589, -0.6455720067024231, -0.6192063093185425, -0.5928406715393066, -0.5664750337600708, -0.540109395980835, -0.5137437582015991, -0.4873780906200409, -0.46101242303848267, -0.4346467852592468, -0.4082811176776886, -0.38191545009613037, -0.35554981231689453, -0.3291841149330139, -0.3028184473514557, -0.27645280957221985, -0.2500871419906616, -0.2237214893102646, -0.19735583662986755, -0.17099016904830933, -0.1446245163679123, -0.11825886368751526, -0.09189321100711823, -0.0655275508761406, -0.039161890745162964, -0.01279623806476593, 0.013569414615631104, 0.03993508219718933, 0.06630073487758636, 0.09266632795333862, 0.11903198063373566, 0.1453976333141327, 0.17176330089569092, 0.19812895357608795, 0.22449460625648499, 0.2508602738380432, 0.27722591161727905, 0.3035915791988373, 0.3299572467803955, 0.35632288455963135, 0.3826885521411896, 0.4090542197227478, 0.43541985750198364, 0.46178552508354187, 0.4881511926651001, 0.5145168304443359, 0.5408824682235718, 0.5672481656074524, 0.5936138033866882, 0.6199794411659241, 0.6463451385498047, 0.6727107763290405, 0.6990764141082764, 0.7254420518875122, 0.751807689666748, 0.7781733870506287, 0.8045390248298645, 0.8309046626091003, 0.857270359992981, 0.8836359977722168, 0.9100016355514526, 0.9363673329353333]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 4.0, 8.0, 7.0, 14.0, 22.0, 22.0, 35.0, 50.0, 84.0, 118.0, 153.0, 228.0, 342.0, 439.0, 640.0, 1066.0, 1685.0, 2732.0, 4964.0, 9050.0, 19075.0, 54512.0, 283579.0, 1615838.0, 1790557.0, 311903.0, 55765.0, 19585.0, 9211.0, 4885.0, 2881.0, 1664.0, 1007.0, 666.0, 439.0, 319.0, 214.0, 149.0, 97.0, 78.0, 66.0, 34.0, 38.0, 11.0, 9.0, 15.0, 12.0, 8.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.5546875, -2.4696044921875, -2.384521484375, -2.2994384765625, -2.21435546875, -2.1292724609375, -2.044189453125, -1.9591064453125, -1.8740234375, -1.7889404296875, -1.703857421875, -1.6187744140625, -1.53369140625, -1.4486083984375, -1.363525390625, -1.2784423828125, -1.193359375, -1.1082763671875, -1.023193359375, -0.9381103515625, -0.85302734375, -0.7679443359375, -0.682861328125, -0.5977783203125, -0.5126953125, -0.4276123046875, -0.342529296875, -0.2574462890625, -0.17236328125, -0.0872802734375, -0.002197265625, 0.0828857421875, 0.16796875, 0.2530517578125, 0.338134765625, 0.4232177734375, 0.50830078125, 0.5933837890625, 0.678466796875, 0.7635498046875, 0.8486328125, 0.9337158203125, 1.018798828125, 1.1038818359375, 1.18896484375, 1.2740478515625, 1.359130859375, 1.4442138671875, 1.529296875, 1.6143798828125, 1.699462890625, 1.7845458984375, 1.86962890625, 1.9547119140625, 2.039794921875, 2.1248779296875, 2.2099609375, 2.2950439453125, 2.380126953125, 2.4652099609375, 2.55029296875, 2.6353759765625, 2.720458984375, 2.8055419921875, 2.890625]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 4.0, 5.0, 3.0, 10.0, 6.0, 3.0, 10.0, 8.0, 15.0, 20.0, 13.0, 26.0, 28.0, 24.0, 28.0, 36.0, 28.0, 30.0, 31.0, 42.0, 37.0, 27.0, 53.0, 47.0, 50.0, 37.0, 37.0, 34.0, 30.0, 34.0, 35.0, 27.0, 29.0, 15.0, 19.0, 17.0, 19.0, 14.0, 16.0, 15.0, 11.0, 3.0, 7.0, 6.0, 7.0, 4.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.302734375, -1.253692626953125, -1.20465087890625, -1.155609130859375, -1.1065673828125, -1.057525634765625, -1.00848388671875, -0.959442138671875, -0.910400390625, -0.861358642578125, -0.81231689453125, -0.763275146484375, -0.7142333984375, -0.665191650390625, -0.61614990234375, -0.567108154296875, -0.51806640625, -0.469024658203125, -0.41998291015625, -0.370941162109375, -0.3218994140625, -0.272857666015625, -0.22381591796875, -0.174774169921875, -0.125732421875, -0.076690673828125, -0.02764892578125, 0.021392822265625, 0.0704345703125, 0.119476318359375, 0.16851806640625, 0.217559814453125, 0.2666015625, 0.315643310546875, 0.36468505859375, 0.413726806640625, 0.4627685546875, 0.511810302734375, 0.56085205078125, 0.609893798828125, 0.658935546875, 0.707977294921875, 0.75701904296875, 0.806060791015625, 0.8551025390625, 0.904144287109375, 0.95318603515625, 1.002227783203125, 1.05126953125, 1.100311279296875, 1.14935302734375, 1.198394775390625, 1.2474365234375, 1.296478271484375, 1.34552001953125, 1.394561767578125, 1.443603515625, 1.492645263671875, 1.54168701171875, 1.590728759765625, 1.6397705078125, 1.688812255859375, 1.73785400390625, 1.786895751953125, 1.8359375]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 6.0, 5.0, 7.0, 10.0, 22.0, 34.0, 62.0, 127.0, 248.0, 882.0, 52576.0, 4134989.0, 4480.0, 449.0, 144.0, 93.0, 59.0, 33.0, 14.0, 16.0, 7.0, 6.0, 7.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.5625, -17.92822265625, -17.2939453125, -16.65966796875, -16.025390625, -15.39111328125, -14.7568359375, -14.12255859375, -13.48828125, -12.85400390625, -12.2197265625, -11.58544921875, -10.951171875, -10.31689453125, -9.6826171875, -9.04833984375, -8.4140625, -7.77978515625, -7.1455078125, -6.51123046875, -5.876953125, -5.24267578125, -4.6083984375, -3.97412109375, -3.33984375, -2.70556640625, -2.0712890625, -1.43701171875, -0.802734375, -0.16845703125, 0.4658203125, 1.10009765625, 1.734375, 2.36865234375, 3.0029296875, 3.63720703125, 4.271484375, 4.90576171875, 5.5400390625, 6.17431640625, 6.80859375, 7.44287109375, 8.0771484375, 8.71142578125, 9.345703125, 9.97998046875, 10.6142578125, 11.24853515625, 11.8828125, 12.51708984375, 13.1513671875, 13.78564453125, 14.419921875, 15.05419921875, 15.6884765625, 16.32275390625, 16.95703125, 17.59130859375, 18.2255859375, 18.85986328125, 19.494140625, 20.12841796875, 20.7626953125, 21.39697265625, 22.03125]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 1.0, 2.0, 6.0, 5.0, 4.0, 4.0, 5.0, 9.0, 10.0, 16.0, 14.0, 23.0, 38.0, 40.0, 69.0, 102.0, 138.0, 201.0, 398.0, 682.0, 895.0, 523.0, 278.0, 172.0, 122.0, 77.0, 54.0, 31.0, 42.0, 30.0, 20.0, 9.0, 18.0, 10.0, 7.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.8330078125, -0.8063507080078125, -0.779693603515625, -0.7530364990234375, -0.72637939453125, -0.6997222900390625, -0.673065185546875, -0.6464080810546875, -0.6197509765625, -0.5930938720703125, -0.566436767578125, -0.5397796630859375, -0.51312255859375, -0.4864654541015625, -0.459808349609375, -0.4331512451171875, -0.406494140625, -0.3798370361328125, -0.353179931640625, -0.3265228271484375, -0.29986572265625, -0.2732086181640625, -0.246551513671875, -0.2198944091796875, -0.1932373046875, -0.1665802001953125, -0.139923095703125, -0.1132659912109375, -0.08660888671875, -0.0599517822265625, -0.033294677734375, -0.0066375732421875, 0.02001953125, 0.0466766357421875, 0.073333740234375, 0.0999908447265625, 0.12664794921875, 0.1533050537109375, 0.179962158203125, 0.2066192626953125, 0.2332763671875, 0.2599334716796875, 0.286590576171875, 0.3132476806640625, 0.33990478515625, 0.3665618896484375, 0.393218994140625, 0.4198760986328125, 0.446533203125, 0.4731903076171875, 0.499847412109375, 0.5265045166015625, 0.55316162109375, 0.5798187255859375, 0.606475830078125, 0.6331329345703125, 0.6597900390625, 0.6864471435546875, 0.713104248046875, 0.7397613525390625, 0.76641845703125, 0.7930755615234375, 0.819732666015625, 0.8463897705078125, 0.873046875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 8.0, 3.0, 9.0, 17.0, 18.0, 20.0, 28.0, 35.0, 37.0, 67.0, 67.0, 75.0, 71.0, 74.0, 72.0, 80.0, 73.0, 57.0, 44.0, 41.0, 20.0, 26.0, 11.0, 10.0, 16.0, 12.0, 6.0, 1.0, 2.0, 3.0, 3.0, 4.0], "bins": [-4.130331039428711, -4.039455890655518, -3.9485809803009033, -3.857706069946289, -3.7668309211730957, -3.6759560108184814, -3.585081100463867, -3.494205951690674, -3.4033308029174805, -3.312455892562866, -3.221580743789673, -3.1307058334350586, -3.0398306846618652, -2.948955774307251, -2.8580808639526367, -2.7672057151794434, -2.676330804824829, -2.585455894470215, -2.4945807456970215, -2.4037058353424072, -2.312830686569214, -2.2219557762145996, -2.1310806274414062, -2.040205717086792, -1.9493306875228882, -1.8584556579589844, -1.7675806283950806, -1.6767055988311768, -1.5858306884765625, -1.4949555397033691, -1.4040806293487549, -1.313205599784851, -1.2223306894302368, -1.131455659866333, -1.0405806303024292, -0.9497056603431702, -0.8588306307792664, -0.7679556012153625, -0.6770806312561035, -0.5862056016921997, -0.4953305721282959, -0.4044555425643921, -0.31358054280281067, -0.22270554304122925, -0.13183051347732544, -0.04095548391342163, 0.0499194860458374, 0.1407945156097412, 0.23166954517364502, 0.32254457473754883, 0.41341957449913025, 0.5042945742607117, 0.5951696038246155, 0.6860446333885193, 0.7769196033477783, 0.8677946329116821, 0.9586696624755859, 1.0495446920394897, 1.1404197216033936, 1.2312946319580078, 1.3221697807312012, 1.4130446910858154, 1.5039197206497192, 1.594794750213623, 1.6856697797775269]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 3.0, 5.0, 9.0, 8.0, 12.0, 10.0, 11.0, 19.0, 14.0, 21.0, 15.0, 25.0, 21.0, 29.0, 19.0, 33.0, 40.0, 30.0, 27.0, 22.0, 53.0, 38.0, 41.0, 42.0, 36.0, 34.0, 36.0, 41.0, 40.0, 31.0, 23.0, 18.0, 21.0, 25.0, 22.0, 25.0, 11.0, 14.0, 13.0, 9.0, 13.0, 12.0, 6.0, 2.0, 8.0, 3.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.5629359483718872, -1.5149544477462769, -1.4669729471206665, -1.4189914464950562, -1.3710099458694458, -1.3230284452438354, -1.2750468254089355, -1.2270653247833252, -1.1790838241577148, -1.1311023235321045, -1.0831208229064941, -1.0351393222808838, -0.9871578216552734, -0.9391763210296631, -0.891194760799408, -0.8432132601737976, -0.795231819152832, -0.7472503185272217, -0.6992688179016113, -0.651287317276001, -0.6033058166503906, -0.5553243160247803, -0.5073427557945251, -0.4593612551689148, -0.41137975454330444, -0.3633982539176941, -0.31541675329208374, -0.267435222864151, -0.21945372223854065, -0.1714722216129303, -0.12349069118499756, -0.07550919055938721, -0.027527809143066406, 0.020453698933124542, 0.06843520700931549, 0.11641672253608704, 0.1643982231616974, 0.21237972378730774, 0.2603612542152405, 0.30834275484085083, 0.3563242554664612, 0.40430575609207153, 0.4522872567176819, 0.500268816947937, 0.5482503175735474, 0.5962318181991577, 0.6442133188247681, 0.6921948194503784, 0.7401763200759888, 0.7881578207015991, 0.8361393213272095, 0.8841208219528198, 0.9321023225784302, 0.9800838232040405, 1.0280654430389404, 1.0760469436645508, 1.1240284442901611, 1.1720099449157715, 1.2199914455413818, 1.2679729461669922, 1.3159544467926025, 1.363935947418213, 1.4119174480438232, 1.4598989486694336, 1.507880449295044]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 8.0, 14.0, 16.0, 36.0, 41.0, 47.0, 91.0, 128.0, 224.0, 349.0, 581.0, 1068.0, 1925.0, 3585.0, 7095.0, 14076.0, 31094.0, 71103.0, 165959.0, 340417.0, 231928.0, 97775.0, 42187.0, 19380.0, 8990.0, 4675.0, 2417.0, 1385.0, 763.0, 444.0, 288.0, 148.0, 123.0, 54.0, 52.0, 22.0, 19.0, 10.0, 19.0, 7.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.06640625, -1.0356674194335938, -1.0049285888671875, -0.9741897583007812, -0.943450927734375, -0.9127120971679688, -0.8819732666015625, -0.8512344360351562, -0.82049560546875, -0.7897567749023438, -0.7590179443359375, -0.7282791137695312, -0.697540283203125, -0.6668014526367188, -0.6360626220703125, -0.6053237915039062, -0.5745849609375, -0.5438461303710938, -0.5131072998046875, -0.48236846923828125, -0.451629638671875, -0.42089080810546875, -0.3901519775390625, -0.35941314697265625, -0.32867431640625, -0.29793548583984375, -0.2671966552734375, -0.23645782470703125, -0.205718994140625, -0.17498016357421875, -0.1442413330078125, -0.11350250244140625, -0.082763671875, -0.05202484130859375, -0.0212860107421875, 0.00945281982421875, 0.040191650390625, 0.07093048095703125, 0.1016693115234375, 0.13240814208984375, 0.16314697265625, 0.19388580322265625, 0.2246246337890625, 0.25536346435546875, 0.286102294921875, 0.31684112548828125, 0.3475799560546875, 0.37831878662109375, 0.4090576171875, 0.43979644775390625, 0.4705352783203125, 0.5012741088867188, 0.532012939453125, 0.5627517700195312, 0.5934906005859375, 0.6242294311523438, 0.65496826171875, 0.6857070922851562, 0.7164459228515625, 0.7471847534179688, 0.777923583984375, 0.8086624145507812, 0.8394012451171875, 0.8701400756835938, 0.90087890625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 2.0, 5.0, 8.0, 6.0, 7.0, 9.0, 7.0, 6.0, 17.0, 18.0, 18.0, 20.0, 23.0, 26.0, 19.0, 31.0, 40.0, 29.0, 33.0, 35.0, 39.0, 37.0, 36.0, 39.0, 29.0, 39.0, 29.0, 39.0, 32.0, 36.0, 41.0, 32.0, 21.0, 30.0, 28.0, 16.0, 12.0, 18.0, 21.0, 12.0, 10.0, 6.0, 10.0, 9.0, 5.0, 6.0, 6.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.93603515625, -0.9057998657226562, -0.8755645751953125, -0.8453292846679688, -0.815093994140625, -0.7848587036132812, -0.7546234130859375, -0.7243881225585938, -0.69415283203125, -0.6639175415039062, -0.6336822509765625, -0.6034469604492188, -0.573211669921875, -0.5429763793945312, -0.5127410888671875, -0.48250579833984375, -0.4522705078125, -0.42203521728515625, -0.3917999267578125, -0.36156463623046875, -0.331329345703125, -0.30109405517578125, -0.2708587646484375, -0.24062347412109375, -0.21038818359375, -0.18015289306640625, -0.1499176025390625, -0.11968231201171875, -0.089447021484375, -0.05921173095703125, -0.0289764404296875, 0.00125885009765625, 0.031494140625, 0.06172943115234375, 0.0919647216796875, 0.12220001220703125, 0.152435302734375, 0.18267059326171875, 0.2129058837890625, 0.24314117431640625, 0.27337646484375, 0.30361175537109375, 0.3338470458984375, 0.36408233642578125, 0.394317626953125, 0.42455291748046875, 0.4547882080078125, 0.48502349853515625, 0.5152587890625, 0.5454940795898438, 0.5757293701171875, 0.6059646606445312, 0.636199951171875, 0.6664352416992188, 0.6966705322265625, 0.7269058227539062, 0.75714111328125, 0.7873764038085938, 0.8176116943359375, 0.8478469848632812, 0.878082275390625, 0.9083175659179688, 0.9385528564453125, 0.9687881469726562, 0.9990234375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 4.0, 7.0, 7.0, 9.0, 11.0, 7.0, 22.0, 30.0, 41.0, 64.0, 82.0, 179.0, 253.0, 451.0, 1018.0, 2250.0, 5957.0, 20363.0, 87267.0, 433932.0, 390810.0, 77887.0, 18317.0, 5506.0, 2033.0, 917.0, 463.0, 243.0, 141.0, 98.0, 66.0, 37.0, 29.0, 18.0, 13.0, 12.0, 2.0, 4.0, 2.0, 7.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0732421875, -1.0265045166015625, -0.979766845703125, -0.9330291748046875, -0.88629150390625, -0.8395538330078125, -0.792816162109375, -0.7460784912109375, -0.6993408203125, -0.6526031494140625, -0.605865478515625, -0.5591278076171875, -0.51239013671875, -0.4656524658203125, -0.418914794921875, -0.3721771240234375, -0.325439453125, -0.2787017822265625, -0.231964111328125, -0.1852264404296875, -0.13848876953125, -0.0917510986328125, -0.045013427734375, 0.0017242431640625, 0.0484619140625, 0.0951995849609375, 0.141937255859375, 0.1886749267578125, 0.23541259765625, 0.2821502685546875, 0.328887939453125, 0.3756256103515625, 0.42236328125, 0.4691009521484375, 0.515838623046875, 0.5625762939453125, 0.60931396484375, 0.6560516357421875, 0.702789306640625, 0.7495269775390625, 0.7962646484375, 0.8430023193359375, 0.889739990234375, 0.9364776611328125, 0.98321533203125, 1.0299530029296875, 1.076690673828125, 1.1234283447265625, 1.170166015625, 1.2169036865234375, 1.263641357421875, 1.3103790283203125, 1.35711669921875, 1.4038543701171875, 1.450592041015625, 1.4973297119140625, 1.5440673828125, 1.5908050537109375, 1.637542724609375, 1.6842803955078125, 1.73101806640625, 1.7777557373046875, 1.824493408203125, 1.8712310791015625, 1.91796875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 9.0, 9.0, 6.0, 11.0, 12.0, 15.0, 15.0, 28.0, 30.0, 31.0, 37.0, 44.0, 56.0, 51.0, 53.0, 53.0, 49.0, 54.0, 60.0, 48.0, 49.0, 49.0, 33.0, 32.0, 30.0, 35.0, 20.0, 17.0, 8.0, 17.0, 5.0, 7.0, 11.0, 4.0, 4.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.921875, -2.832244873046875, -2.74261474609375, -2.652984619140625, -2.5633544921875, -2.473724365234375, -2.38409423828125, -2.294464111328125, -2.204833984375, -2.115203857421875, -2.02557373046875, -1.935943603515625, -1.8463134765625, -1.756683349609375, -1.66705322265625, -1.577423095703125, -1.48779296875, -1.398162841796875, -1.30853271484375, -1.218902587890625, -1.1292724609375, -1.039642333984375, -0.95001220703125, -0.860382080078125, -0.770751953125, -0.681121826171875, -0.59149169921875, -0.501861572265625, -0.4122314453125, -0.322601318359375, -0.23297119140625, -0.143341064453125, -0.0537109375, 0.035919189453125, 0.12554931640625, 0.215179443359375, 0.3048095703125, 0.394439697265625, 0.48406982421875, 0.573699951171875, 0.663330078125, 0.752960205078125, 0.84259033203125, 0.932220458984375, 1.0218505859375, 1.111480712890625, 1.20111083984375, 1.290740966796875, 1.38037109375, 1.470001220703125, 1.55963134765625, 1.649261474609375, 1.7388916015625, 1.828521728515625, 1.91815185546875, 2.007781982421875, 2.097412109375, 2.187042236328125, 2.27667236328125, 2.366302490234375, 2.4559326171875, 2.545562744140625, 2.63519287109375, 2.724822998046875, 2.814453125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 1.0, 6.0, 8.0, 9.0, 13.0, 18.0, 35.0, 61.0, 73.0, 142.0, 164.0, 295.0, 425.0, 758.0, 1302.0, 2439.0, 4869.0, 10715.0, 27426.0, 84960.0, 315354.0, 416443.0, 120082.0, 36799.0, 13513.0, 5901.0, 2904.0, 1562.0, 888.0, 517.0, 306.0, 193.0, 126.0, 81.0, 53.0, 30.0, 20.0, 26.0, 8.0, 7.0, 7.0, 6.0, 3.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.28759765625, -0.27864837646484375, -0.2696990966796875, -0.26074981689453125, -0.251800537109375, -0.24285125732421875, -0.2339019775390625, -0.22495269775390625, -0.21600341796875, -0.20705413818359375, -0.1981048583984375, -0.18915557861328125, -0.180206298828125, -0.17125701904296875, -0.1623077392578125, -0.15335845947265625, -0.1444091796875, -0.13545989990234375, -0.1265106201171875, -0.11756134033203125, -0.108612060546875, -0.09966278076171875, -0.0907135009765625, -0.08176422119140625, -0.07281494140625, -0.06386566162109375, -0.0549163818359375, -0.04596710205078125, -0.037017822265625, -0.02806854248046875, -0.0191192626953125, -0.01016998291015625, -0.001220703125, 0.00772857666015625, 0.0166778564453125, 0.02562713623046875, 0.034576416015625, 0.04352569580078125, 0.0524749755859375, 0.06142425537109375, 0.07037353515625, 0.07932281494140625, 0.0882720947265625, 0.09722137451171875, 0.106170654296875, 0.11511993408203125, 0.1240692138671875, 0.13301849365234375, 0.1419677734375, 0.15091705322265625, 0.1598663330078125, 0.16881561279296875, 0.177764892578125, 0.18671417236328125, 0.1956634521484375, 0.20461273193359375, 0.21356201171875, 0.22251129150390625, 0.2314605712890625, 0.24040985107421875, 0.249359130859375, 0.25830841064453125, 0.2672576904296875, 0.27620697021484375, 0.28515625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 3.0, 4.0, 5.0, 12.0, 11.0, 25.0, 26.0, 55.0, 80.0, 134.0, 199.0, 201.0, 114.0, 64.0, 19.0, 23.0, 7.0, 7.0, 4.0, 8.0, 1.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00025081634521484375, -0.0002380460500717163, -0.00022527575492858887, -0.00021250545978546143, -0.00019973516464233398, -0.00018696486949920654, -0.0001741945743560791, -0.00016142427921295166, -0.00014865398406982422, -0.00013588368892669678, -0.00012311339378356934, -0.0001103430986404419, -9.757280349731445e-05, -8.480250835418701e-05, -7.203221321105957e-05, -5.926191806793213e-05, -4.649162292480469e-05, -3.3721327781677246e-05, -2.0951032638549805e-05, -8.180737495422363e-06, 4.589557647705078e-06, 1.735985279083252e-05, 3.013014793395996e-05, 4.29004430770874e-05, 5.5670738220214844e-05, 6.844103336334229e-05, 8.121132850646973e-05, 9.398162364959717e-05, 0.00010675191879272461, 0.00011952221393585205, 0.0001322925090789795, 0.00014506280422210693, 0.00015783309936523438, 0.00017060339450836182, 0.00018337368965148926, 0.0001961439847946167, 0.00020891427993774414, 0.00022168457508087158, 0.00023445487022399902, 0.00024722516536712646, 0.0002599954605102539, 0.00027276575565338135, 0.0002855360507965088, 0.00029830634593963623, 0.00031107664108276367, 0.0003238469362258911, 0.00033661723136901855, 0.000349387526512146, 0.00036215782165527344, 0.0003749281167984009, 0.0003876984119415283, 0.00040046870708465576, 0.0004132390022277832, 0.00042600929737091064, 0.0004387795925140381, 0.00045154988765716553, 0.00046432018280029297, 0.0004770904779434204, 0.0004898607730865479, 0.0005026310682296753, 0.0005154013633728027, 0.0005281716585159302, 0.0005409419536590576, 0.0005537122488021851, 0.0005664825439453125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 4.0, 5.0, 7.0, 6.0, 5.0, 8.0, 7.0, 23.0, 18.0, 30.0, 36.0, 58.0, 64.0, 126.0, 271.0, 536.0, 1704.0, 6423.0, 35717.0, 314414.0, 595009.0, 78184.0, 11608.0, 2663.0, 800.0, 331.0, 174.0, 105.0, 60.0, 37.0, 22.0, 27.0, 22.0, 14.0, 9.0, 3.0, 4.0, 4.0, 5.0, 6.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52099609375, -0.5037384033203125, -0.486480712890625, -0.4692230224609375, -0.45196533203125, -0.4347076416015625, -0.417449951171875, -0.4001922607421875, -0.3829345703125, -0.3656768798828125, -0.348419189453125, -0.3311614990234375, -0.31390380859375, -0.2966461181640625, -0.279388427734375, -0.2621307373046875, -0.244873046875, -0.2276153564453125, -0.210357666015625, -0.1930999755859375, -0.17584228515625, -0.1585845947265625, -0.141326904296875, -0.1240692138671875, -0.1068115234375, -0.0895538330078125, -0.072296142578125, -0.0550384521484375, -0.03778076171875, -0.0205230712890625, -0.003265380859375, 0.0139923095703125, 0.03125, 0.0485076904296875, 0.065765380859375, 0.0830230712890625, 0.10028076171875, 0.1175384521484375, 0.134796142578125, 0.1520538330078125, 0.1693115234375, 0.1865692138671875, 0.203826904296875, 0.2210845947265625, 0.23834228515625, 0.2555999755859375, 0.272857666015625, 0.2901153564453125, 0.307373046875, 0.3246307373046875, 0.341888427734375, 0.3591461181640625, 0.37640380859375, 0.3936614990234375, 0.410919189453125, 0.4281768798828125, 0.4454345703125, 0.4626922607421875, 0.479949951171875, 0.4972076416015625, 0.51446533203125, 0.5317230224609375, 0.548980712890625, 0.5662384033203125, 0.58349609375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 4.0, 1.0, 5.0, 6.0, 8.0, 4.0, 14.0, 9.0, 9.0, 25.0, 29.0, 32.0, 45.0, 43.0, 57.0, 62.0, 60.0, 66.0, 76.0, 74.0, 57.0, 42.0, 51.0, 51.0, 36.0, 30.0, 13.0, 20.0, 15.0, 12.0, 15.0, 9.0, 5.0, 5.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0858154296875, -0.08279228210449219, -0.07976913452148438, -0.07674598693847656, -0.07372283935546875, -0.07069969177246094, -0.06767654418945312, -0.06465339660644531, -0.0616302490234375, -0.05860710144042969, -0.055583953857421875, -0.05256080627441406, -0.04953765869140625, -0.04651451110839844, -0.043491363525390625, -0.04046821594238281, -0.037445068359375, -0.03442192077636719, -0.031398773193359375, -0.028375625610351562, -0.02535247802734375, -0.022329330444335938, -0.019306182861328125, -0.016283035278320312, -0.0132598876953125, -0.010236740112304688, -0.007213592529296875, -0.0041904449462890625, -0.00116729736328125, 0.0018558502197265625, 0.004878997802734375, 0.007902145385742188, 0.01092529296875, 0.013948440551757812, 0.016971588134765625, 0.019994735717773438, 0.02301788330078125, 0.026041030883789062, 0.029064178466796875, 0.03208732604980469, 0.0351104736328125, 0.03813362121582031, 0.041156768798828125, 0.04417991638183594, 0.04720306396484375, 0.05022621154785156, 0.053249359130859375, 0.05627250671386719, 0.059295654296875, 0.06231880187988281, 0.06534194946289062, 0.06836509704589844, 0.07138824462890625, 0.07441139221191406, 0.07743453979492188, 0.08045768737792969, 0.0834808349609375, 0.08650398254394531, 0.08952713012695312, 0.09255027770996094, 0.09557342529296875, 0.09859657287597656, 0.10161972045898438, 0.10464286804199219, 0.107666015625]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 11.0, 19.0, 20.0, 31.0, 49.0, 75.0, 94.0, 136.0, 141.0, 123.0, 90.0, 70.0, 55.0, 25.0, 27.0, 16.0, 9.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.6749579906463623, -3.5885374546051025, -3.5021166801452637, -3.415696144104004, -3.329275608062744, -3.2428550720214844, -3.1564342975616455, -3.0700137615203857, -2.983592987060547, -2.897172451019287, -2.8107516765594482, -2.7243311405181885, -2.6379106044769287, -2.55148983001709, -2.46506929397583, -2.3786487579345703, -2.2922282218933105, -2.205807685852051, -2.119386911392212, -2.032966375350952, -1.9465458393096924, -1.860125184059143, -1.7737045288085938, -1.687283992767334, -1.6008633375167847, -1.5144426822662354, -1.4280221462249756, -1.3416014909744263, -1.255180835723877, -1.1687602996826172, -1.0823396444320679, -0.9959190487861633, -0.9094983339309692, -0.8230777382850647, -0.7366571426391602, -0.6502364873886108, -0.5638158917427063, -0.47739529609680176, -0.39097464084625244, -0.3045540452003479, -0.21813344955444336, -0.13171283900737762, -0.04529222846031189, 0.04112839698791504, 0.12754899263381958, 0.21396958827972412, 0.30039024353027344, 0.386810839176178, 0.4732314348220825, 0.5596520304679871, 0.6460726261138916, 0.7324932813644409, 0.8189138770103455, 0.90533447265625, 0.9917551279067993, 1.0781757831573486, 1.1645963191986084, 1.2510169744491577, 1.3374375104904175, 1.4238581657409668, 1.5102787017822266, 1.5966993570327759, 1.6831200122833252, 1.769540548324585, 1.8559612035751343]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 7.0, 4.0, 12.0, 14.0, 9.0, 15.0, 14.0, 16.0, 23.0, 14.0, 23.0, 28.0, 30.0, 26.0, 30.0, 41.0, 40.0, 41.0, 43.0, 40.0, 51.0, 37.0, 43.0, 33.0, 38.0, 40.0, 25.0, 24.0, 25.0, 38.0, 25.0, 21.0, 32.0, 11.0, 17.0, 14.0, 8.0, 14.0, 7.0, 10.0, 6.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0068734884262085, -0.9750584363937378, -0.9432433843612671, -0.9114283323287964, -0.8796132802963257, -0.847798228263855, -0.815983235836029, -0.7841681838035583, -0.7523531317710876, -0.7205380797386169, -0.6887230277061462, -0.6569079756736755, -0.6250929832458496, -0.5932779312133789, -0.5614628791809082, -0.5296478271484375, -0.4978327751159668, -0.4660177230834961, -0.4342026710510254, -0.4023876488208771, -0.37057259678840637, -0.33875754475593567, -0.30694252252578735, -0.27512747049331665, -0.24331241846084595, -0.21149736642837524, -0.17968232929706573, -0.14786729216575623, -0.11605224013328552, -0.08423718810081482, -0.05242215096950531, -0.0206071138381958, 0.011208057403564453, 0.04302310198545456, 0.07483814656734467, 0.10665319114923477, 0.13846823573112488, 0.17028328776359558, 0.2020983248949051, 0.2339133620262146, 0.2657284140586853, 0.297543466091156, 0.3293585181236267, 0.361173540353775, 0.3929885923862457, 0.42480364441871643, 0.45661866664886475, 0.48843371868133545, 0.5202487707138062, 0.5520638227462769, 0.5838788747787476, 0.6156939268112183, 0.647508978843689, 0.6793240308761597, 0.7111390233039856, 0.7429540753364563, 0.774769127368927, 0.8065841794013977, 0.8383992314338684, 0.8702142834663391, 0.902029275894165, 0.9338443279266357, 0.9656593799591064, 0.9974744319915771, 1.0292894840240479]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 7.0, 5.0, 6.0, 10.0, 12.0, 18.0, 29.0, 36.0, 61.0, 61.0, 67.0, 143.0, 206.0, 354.0, 539.0, 1190.0, 2312.0, 5701.0, 18561.0, 116375.0, 747436.0, 125238.0, 19153.0, 5893.0, 2376.0, 1191.0, 585.0, 320.0, 227.0, 136.0, 75.0, 74.0, 38.0, 37.0, 24.0, 20.0, 13.0, 8.0, 7.0, 3.0, 5.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.69677734375, -0.6746673583984375, -0.652557373046875, -0.6304473876953125, -0.60833740234375, -0.5862274169921875, -0.564117431640625, -0.5420074462890625, -0.5198974609375, -0.4977874755859375, -0.475677490234375, -0.4535675048828125, -0.43145751953125, -0.4093475341796875, -0.387237548828125, -0.3651275634765625, -0.343017578125, -0.3209075927734375, -0.298797607421875, -0.2766876220703125, -0.25457763671875, -0.2324676513671875, -0.210357666015625, -0.1882476806640625, -0.1661376953125, -0.1440277099609375, -0.121917724609375, -0.0998077392578125, -0.07769775390625, -0.0555877685546875, -0.033477783203125, -0.0113677978515625, 0.0107421875, 0.0328521728515625, 0.054962158203125, 0.0770721435546875, 0.09918212890625, 0.1212921142578125, 0.143402099609375, 0.1655120849609375, 0.1876220703125, 0.2097320556640625, 0.231842041015625, 0.2539520263671875, 0.27606201171875, 0.2981719970703125, 0.320281982421875, 0.3423919677734375, 0.364501953125, 0.3866119384765625, 0.408721923828125, 0.4308319091796875, 0.45294189453125, 0.4750518798828125, 0.497161865234375, 0.5192718505859375, 0.5413818359375, 0.5634918212890625, 0.585601806640625, 0.6077117919921875, 0.62982177734375, 0.6519317626953125, 0.674041748046875, 0.6961517333984375, 0.71826171875]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 0.0, 3.0, 8.0, 2.0, 4.0, 7.0, 9.0, 8.0, 11.0, 9.0, 11.0, 15.0, 16.0, 20.0, 13.0, 24.0, 18.0, 27.0, 22.0, 26.0, 30.0, 36.0, 44.0, 39.0, 48.0, 32.0, 41.0, 40.0, 36.0, 31.0, 24.0, 41.0, 35.0, 26.0, 26.0, 26.0, 29.0, 21.0, 30.0, 27.0, 13.0, 12.0, 13.0, 12.0, 9.0, 10.0, 9.0, 2.0, 2.0, 4.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.37109375, -1.3244171142578125, -1.277740478515625, -1.2310638427734375, -1.18438720703125, -1.1377105712890625, -1.091033935546875, -1.0443572998046875, -0.9976806640625, -0.9510040283203125, -0.904327392578125, -0.8576507568359375, -0.81097412109375, -0.7642974853515625, -0.717620849609375, -0.6709442138671875, -0.624267578125, -0.5775909423828125, -0.530914306640625, -0.4842376708984375, -0.43756103515625, -0.3908843994140625, -0.344207763671875, -0.2975311279296875, -0.2508544921875, -0.2041778564453125, -0.157501220703125, -0.1108245849609375, -0.06414794921875, -0.0174713134765625, 0.029205322265625, 0.0758819580078125, 0.12255859375, 0.1692352294921875, 0.215911865234375, 0.2625885009765625, 0.30926513671875, 0.3559417724609375, 0.402618408203125, 0.4492950439453125, 0.4959716796875, 0.5426483154296875, 0.589324951171875, 0.6360015869140625, 0.68267822265625, 0.7293548583984375, 0.776031494140625, 0.8227081298828125, 0.869384765625, 0.9160614013671875, 0.962738037109375, 1.0094146728515625, 1.05609130859375, 1.1027679443359375, 1.149444580078125, 1.1961212158203125, 1.2427978515625, 1.2894744873046875, 1.336151123046875, 1.3828277587890625, 1.42950439453125, 1.4761810302734375, 1.522857666015625, 1.5695343017578125, 1.6162109375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 6.0, 2.0, 9.0, 5.0, 7.0, 7.0, 14.0, 14.0, 21.0, 17.0, 22.0, 40.0, 46.0, 58.0, 82.0, 99.0, 181.0, 253.0, 480.0, 1406.0, 5088.0, 33304.0, 838710.0, 152861.0, 11454.0, 2457.0, 815.0, 343.0, 191.0, 145.0, 96.0, 71.0, 54.0, 41.0, 31.0, 22.0, 13.0, 20.0, 19.0, 15.0, 4.0, 8.0, 5.0, 4.0, 7.0, 4.0, 4.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.025390625, -0.99090576171875, -0.9564208984375, -0.92193603515625, -0.887451171875, -0.85296630859375, -0.8184814453125, -0.78399658203125, -0.74951171875, -0.71502685546875, -0.6805419921875, -0.64605712890625, -0.611572265625, -0.57708740234375, -0.5426025390625, -0.50811767578125, -0.4736328125, -0.43914794921875, -0.4046630859375, -0.37017822265625, -0.335693359375, -0.30120849609375, -0.2667236328125, -0.23223876953125, -0.19775390625, -0.16326904296875, -0.1287841796875, -0.09429931640625, -0.059814453125, -0.02532958984375, 0.0091552734375, 0.04364013671875, 0.078125, 0.11260986328125, 0.1470947265625, 0.18157958984375, 0.216064453125, 0.25054931640625, 0.2850341796875, 0.31951904296875, 0.35400390625, 0.38848876953125, 0.4229736328125, 0.45745849609375, 0.491943359375, 0.52642822265625, 0.5609130859375, 0.59539794921875, 0.6298828125, 0.66436767578125, 0.6988525390625, 0.73333740234375, 0.767822265625, 0.80230712890625, 0.8367919921875, 0.87127685546875, 0.90576171875, 0.94024658203125, 0.9747314453125, 1.00921630859375, 1.043701171875, 1.07818603515625, 1.1126708984375, 1.14715576171875, 1.181640625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 3.0, 9.0, 5.0, 11.0, 6.0, 13.0, 17.0, 19.0, 19.0, 21.0, 24.0, 31.0, 27.0, 29.0, 37.0, 37.0, 33.0, 43.0, 45.0, 50.0, 43.0, 52.0, 32.0, 43.0, 47.0, 30.0, 44.0, 29.0, 32.0, 24.0, 22.0, 19.0, 17.0, 14.0, 22.0, 13.0, 7.0, 4.0, 5.0, 7.0, 4.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6015625, -1.548126220703125, -1.49468994140625, -1.441253662109375, -1.3878173828125, -1.334381103515625, -1.28094482421875, -1.227508544921875, -1.174072265625, -1.120635986328125, -1.06719970703125, -1.013763427734375, -0.9603271484375, -0.906890869140625, -0.85345458984375, -0.800018310546875, -0.74658203125, -0.693145751953125, -0.63970947265625, -0.586273193359375, -0.5328369140625, -0.479400634765625, -0.42596435546875, -0.372528076171875, -0.319091796875, -0.265655517578125, -0.21221923828125, -0.158782958984375, -0.1053466796875, -0.051910400390625, 0.00152587890625, 0.054962158203125, 0.1083984375, 0.161834716796875, 0.21527099609375, 0.268707275390625, 0.3221435546875, 0.375579833984375, 0.42901611328125, 0.482452392578125, 0.535888671875, 0.589324951171875, 0.64276123046875, 0.696197509765625, 0.7496337890625, 0.803070068359375, 0.85650634765625, 0.909942626953125, 0.96337890625, 1.016815185546875, 1.07025146484375, 1.123687744140625, 1.1771240234375, 1.230560302734375, 1.28399658203125, 1.337432861328125, 1.390869140625, 1.444305419921875, 1.49774169921875, 1.551177978515625, 1.6046142578125, 1.658050537109375, 1.71148681640625, 1.764923095703125, 1.818359375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 10.0, 16.0, 18.0, 26.0, 48.0, 54.0, 104.0, 137.0, 216.0, 346.0, 685.0, 1228.0, 2485.0, 5514.0, 16661.0, 98855.0, 831564.0, 67414.0, 13534.0, 4869.0, 2253.0, 1099.0, 546.0, 315.0, 191.0, 114.0, 97.0, 38.0, 46.0, 13.0, 12.0, 10.0, 3.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.204345703125, -0.19762802124023438, -0.19091033935546875, -0.18419265747070312, -0.1774749755859375, -0.17075729370117188, -0.16403961181640625, -0.15732192993164062, -0.150604248046875, -0.14388656616210938, -0.13716888427734375, -0.13045120239257812, -0.1237335205078125, -0.11701583862304688, -0.11029815673828125, -0.10358047485351562, -0.09686279296875, -0.09014511108398438, -0.08342742919921875, -0.07670974731445312, -0.0699920654296875, -0.06327438354492188, -0.05655670166015625, -0.049839019775390625, -0.043121337890625, -0.036403656005859375, -0.02968597412109375, -0.022968292236328125, -0.0162506103515625, -0.009532928466796875, -0.00281524658203125, 0.003902435302734375, 0.0106201171875, 0.017337799072265625, 0.02405548095703125, 0.030773162841796875, 0.0374908447265625, 0.044208526611328125, 0.05092620849609375, 0.057643890380859375, 0.064361572265625, 0.07107925415039062, 0.07779693603515625, 0.08451461791992188, 0.0912322998046875, 0.09794998168945312, 0.10466766357421875, 0.11138534545898438, 0.11810302734375, 0.12482070922851562, 0.13153839111328125, 0.13825607299804688, 0.1449737548828125, 0.15169143676757812, 0.15840911865234375, 0.16512680053710938, 0.171844482421875, 0.17856216430664062, 0.18527984619140625, 0.19199752807617188, 0.1987152099609375, 0.20543289184570312, 0.21215057373046875, 0.21886825561523438, 0.2255859375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 4.0, 6.0, 7.0, 19.0, 31.0, 51.0, 102.0, 299.0, 250.0, 85.0, 47.0, 24.0, 24.0, 9.0, 5.0, 8.0, 8.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.328655242919922e-05, -5.171447992324829e-05, -5.014240741729736e-05, -4.8570334911346436e-05, -4.699826240539551e-05, -4.542618989944458e-05, -4.385411739349365e-05, -4.2282044887542725e-05, -4.07099723815918e-05, -3.913789987564087e-05, -3.756582736968994e-05, -3.5993754863739014e-05, -3.4421682357788086e-05, -3.284960985183716e-05, -3.127753734588623e-05, -2.9705464839935303e-05, -2.8133392333984375e-05, -2.6561319828033447e-05, -2.498924732208252e-05, -2.3417174816131592e-05, -2.1845102310180664e-05, -2.0273029804229736e-05, -1.870095729827881e-05, -1.712888479232788e-05, -1.5556812286376953e-05, -1.3984739780426025e-05, -1.2412667274475098e-05, -1.084059476852417e-05, -9.268522262573242e-06, -7.696449756622314e-06, -6.124377250671387e-06, -4.552304744720459e-06, -2.9802322387695312e-06, -1.4081597328186035e-06, 1.6391277313232422e-07, 1.735985279083252e-06, 3.3080577850341797e-06, 4.880130290985107e-06, 6.452202796936035e-06, 8.024275302886963e-06, 9.59634780883789e-06, 1.1168420314788818e-05, 1.2740492820739746e-05, 1.4312565326690674e-05, 1.58846378326416e-05, 1.745671033859253e-05, 1.9028782844543457e-05, 2.0600855350494385e-05, 2.2172927856445312e-05, 2.374500036239624e-05, 2.5317072868347168e-05, 2.6889145374298096e-05, 2.8461217880249023e-05, 3.003329038619995e-05, 3.160536289215088e-05, 3.317743539810181e-05, 3.4749507904052734e-05, 3.632158041000366e-05, 3.789365291595459e-05, 3.946572542190552e-05, 4.1037797927856445e-05, 4.260987043380737e-05, 4.41819429397583e-05, 4.575401544570923e-05, 4.7326087951660156e-05]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 4.0, 6.0, 4.0, 4.0, 2.0, 9.0, 9.0, 11.0, 13.0, 22.0, 38.0, 60.0, 115.0, 230.0, 382.0, 767.0, 1562.0, 3779.0, 10344.0, 45660.0, 875325.0, 87116.0, 14294.0, 4791.0, 2021.0, 936.0, 483.0, 235.0, 121.0, 64.0, 49.0, 29.0, 21.0, 13.0, 10.0, 14.0, 10.0, 6.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2225341796875, -0.2134990692138672, -0.20446395874023438, -0.19542884826660156, -0.18639373779296875, -0.17735862731933594, -0.16832351684570312, -0.1592884063720703, -0.1502532958984375, -0.1412181854248047, -0.13218307495117188, -0.12314796447753906, -0.11411285400390625, -0.10507774353027344, -0.09604263305664062, -0.08700752258300781, -0.077972412109375, -0.06893730163574219, -0.059902191162109375, -0.05086708068847656, -0.04183197021484375, -0.03279685974121094, -0.023761749267578125, -0.014726638793945312, -0.0056915283203125, 0.0033435821533203125, 0.012378692626953125, 0.021413803100585938, 0.03044891357421875, 0.03948402404785156, 0.048519134521484375, 0.05755424499511719, 0.06658935546875, 0.07562446594238281, 0.08465957641601562, 0.09369468688964844, 0.10272979736328125, 0.11176490783691406, 0.12080001831054688, 0.1298351287841797, 0.1388702392578125, 0.1479053497314453, 0.15694046020507812, 0.16597557067871094, 0.17501068115234375, 0.18404579162597656, 0.19308090209960938, 0.2021160125732422, 0.211151123046875, 0.2201862335205078, 0.22922134399414062, 0.23825645446777344, 0.24729156494140625, 0.25632667541503906, 0.2653617858886719, 0.2743968963623047, 0.2834320068359375, 0.2924671173095703, 0.3015022277832031, 0.31053733825683594, 0.31957244873046875, 0.32860755920410156, 0.3376426696777344, 0.3466777801513672, 0.355712890625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 4.0, 7.0, 7.0, 2.0, 8.0, 11.0, 23.0, 55.0, 90.0, 231.0, 294.0, 101.0, 61.0, 27.0, 13.0, 7.0, 13.0, 3.0, 9.0, 7.0, 5.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.131591796875, -0.1277475357055664, -0.12390327453613281, -0.12005901336669922, -0.11621475219726562, -0.11237049102783203, -0.10852622985839844, -0.10468196868896484, -0.10083770751953125, -0.09699344635009766, -0.09314918518066406, -0.08930492401123047, -0.08546066284179688, -0.08161640167236328, -0.07777214050292969, -0.0739278793334961, -0.0700836181640625, -0.0662393569946289, -0.06239509582519531, -0.05855083465576172, -0.054706573486328125, -0.05086231231689453, -0.04701805114746094, -0.043173789978027344, -0.03932952880859375, -0.035485267639160156, -0.03164100646972656, -0.02779674530029297, -0.023952484130859375, -0.02010822296142578, -0.016263961791992188, -0.012419700622558594, -0.008575439453125, -0.004731178283691406, -0.0008869171142578125, 0.0029573440551757812, 0.006801605224609375, 0.010645866394042969, 0.014490127563476562, 0.018334388732910156, 0.02217864990234375, 0.026022911071777344, 0.029867172241210938, 0.03371143341064453, 0.037555694580078125, 0.04139995574951172, 0.04524421691894531, 0.049088478088378906, 0.0529327392578125, 0.056777000427246094, 0.06062126159667969, 0.06446552276611328, 0.06830978393554688, 0.07215404510498047, 0.07599830627441406, 0.07984256744384766, 0.08368682861328125, 0.08753108978271484, 0.09137535095214844, 0.09521961212158203, 0.09906387329101562, 0.10290813446044922, 0.10675239562988281, 0.1105966567993164, 0.11444091796875]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 7.0, 29.0, 81.0, 249.0, 354.0, 196.0, 72.0, 23.0, 6.0, 0.0, 2.0], "bins": [-21.121305465698242, -20.7532901763916, -20.385272979736328, -20.017257690429688, -19.649240493774414, -19.281225204467773, -18.9132080078125, -18.54519271850586, -18.17717742919922, -17.809162139892578, -17.441144943237305, -17.073129653930664, -16.70511245727539, -16.33709716796875, -15.969080924987793, -15.601064682006836, -15.233048439025879, -14.865032196044922, -14.497015953063965, -14.128999710083008, -13.760984420776367, -13.39296817779541, -13.024951934814453, -12.656935691833496, -12.288919448852539, -11.920903205871582, -11.552886962890625, -11.184871673583984, -10.816855430603027, -10.44883918762207, -10.080822944641113, -9.712806701660156, -9.344792366027832, -8.976776123046875, -8.608759880065918, -8.240743637084961, -7.87272834777832, -7.504712104797363, -7.136695861816406, -6.768679618835449, -6.400663375854492, -6.032647132873535, -5.664631366729736, -5.296615123748779, -4.9285993576049805, -4.560583114624023, -4.192566871643066, -3.8245508670806885, -3.4565351009368896, -3.0885190963745117, -2.7205028533935547, -2.3524868488311768, -1.9844708442687988, -1.616454839706421, -1.2484385967254639, -0.8804225921630859, -0.512406587600708, -0.1443905234336853, 0.2236255407333374, 0.5916416645050049, 0.9596576690673828, 1.3276736736297607, 1.6956899166107178, 2.0637059211730957, 2.4317219257354736]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 3.0, 5.0, 4.0, 7.0, 7.0, 5.0, 13.0, 11.0, 12.0, 18.0, 14.0, 13.0, 17.0, 12.0, 28.0, 32.0, 24.0, 23.0, 29.0, 35.0, 47.0, 40.0, 48.0, 47.0, 39.0, 25.0, 46.0, 31.0, 26.0, 41.0, 32.0, 35.0, 19.0, 33.0, 25.0, 36.0, 25.0, 10.0, 14.0, 10.0, 11.0, 10.0, 8.0, 8.0, 5.0, 10.0, 3.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.557124137878418, -2.479018449783325, -2.4009130001068115, -2.3228073120117188, -2.244701862335205, -2.1665961742401123, -2.0884907245635986, -2.010385036468506, -1.9322794675827026, -1.8541738986968994, -1.7760683298110962, -1.697962760925293, -1.6198570728302002, -1.5417516231536865, -1.4636459350585938, -1.3855403661727905, -1.3074347972869873, -1.229329228401184, -1.1512236595153809, -1.0731180906295776, -0.9950124621391296, -0.9169068932533264, -0.8388012647628784, -0.7606956958770752, -0.682590126991272, -0.6044845581054688, -0.5263789892196655, -0.44827336072921753, -0.3701677918434143, -0.2920622229576111, -0.21395662426948547, -0.13585102558135986, -0.05774545669555664, 0.020360127091407776, 0.09846571087837219, 0.1765712946653366, 0.254676878452301, 0.33278244733810425, 0.41088804602622986, 0.48899364471435547, 0.5670992136001587, 0.6452047824859619, 0.7233103513717651, 0.8014159798622131, 0.8795215487480164, 0.9576271176338196, 1.0357327461242676, 1.1138383150100708, 1.191943883895874, 1.2700494527816772, 1.3481550216674805, 1.4262605905532837, 1.504366159439087, 1.5824718475341797, 1.660577416419983, 1.7386829853057861, 1.8167885541915894, 1.8948941230773926, 1.9729996919631958, 2.051105260848999, 2.129210948944092, 2.2073163986206055, 2.2854220867156982, 2.363527774810791, 2.4416332244873047]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 4.0, 7.0, 9.0, 10.0, 8.0, 21.0, 11.0, 11.0, 18.0, 33.0, 46.0, 79.0, 126.0, 215.0, 480.0, 1200.0, 3106.0, 9469.0, 36608.0, 323420.0, 2917471.0, 816415.0, 63911.0, 14046.0, 4421.0, 1635.0, 632.0, 343.0, 157.0, 116.0, 65.0, 42.0, 27.0, 24.0, 14.0, 14.0, 23.0, 11.0, 7.0, 15.0, 6.0, 3.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.484375, -2.397705078125, -2.31103515625, -2.224365234375, -2.1376953125, -2.051025390625, -1.96435546875, -1.877685546875, -1.791015625, -1.704345703125, -1.61767578125, -1.531005859375, -1.4443359375, -1.357666015625, -1.27099609375, -1.184326171875, -1.09765625, -1.010986328125, -0.92431640625, -0.837646484375, -0.7509765625, -0.664306640625, -0.57763671875, -0.490966796875, -0.404296875, -0.317626953125, -0.23095703125, -0.144287109375, -0.0576171875, 0.029052734375, 0.11572265625, 0.202392578125, 0.2890625, 0.375732421875, 0.46240234375, 0.549072265625, 0.6357421875, 0.722412109375, 0.80908203125, 0.895751953125, 0.982421875, 1.069091796875, 1.15576171875, 1.242431640625, 1.3291015625, 1.415771484375, 1.50244140625, 1.589111328125, 1.67578125, 1.762451171875, 1.84912109375, 1.935791015625, 2.0224609375, 2.109130859375, 2.19580078125, 2.282470703125, 2.369140625, 2.455810546875, 2.54248046875, 2.629150390625, 2.7158203125, 2.802490234375, 2.88916015625, 2.975830078125, 3.0625]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 10.0, 10.0, 7.0, 14.0, 14.0, 14.0, 19.0, 26.0, 37.0, 40.0, 33.0, 63.0, 43.0, 59.0, 71.0, 57.0, 65.0, 50.0, 49.0, 59.0, 38.0, 40.0, 38.0, 24.0, 29.0, 17.0, 9.0, 24.0, 13.0, 15.0, 7.0, 7.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3505859375, -1.3051605224609375, -1.259735107421875, -1.2143096923828125, -1.16888427734375, -1.1234588623046875, -1.078033447265625, -1.0326080322265625, -0.9871826171875, -0.9417572021484375, -0.896331787109375, -0.8509063720703125, -0.80548095703125, -0.7600555419921875, -0.714630126953125, -0.6692047119140625, -0.623779296875, -0.5783538818359375, -0.532928466796875, -0.4875030517578125, -0.44207763671875, -0.3966522216796875, -0.351226806640625, -0.3058013916015625, -0.2603759765625, -0.2149505615234375, -0.169525146484375, -0.1240997314453125, -0.07867431640625, -0.0332489013671875, 0.012176513671875, 0.0576019287109375, 0.10302734375, 0.1484527587890625, 0.193878173828125, 0.2393035888671875, 0.28472900390625, 0.3301544189453125, 0.375579833984375, 0.4210052490234375, 0.4664306640625, 0.5118560791015625, 0.557281494140625, 0.6027069091796875, 0.64813232421875, 0.6935577392578125, 0.738983154296875, 0.7844085693359375, 0.829833984375, 0.8752593994140625, 0.920684814453125, 0.9661102294921875, 1.01153564453125, 1.0569610595703125, 1.102386474609375, 1.1478118896484375, 1.1932373046875, 1.2386627197265625, 1.284088134765625, 1.3295135498046875, 1.37493896484375, 1.4203643798828125, 1.465789794921875, 1.5112152099609375, 1.556640625]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 7.0, 6.0, 9.0, 9.0, 12.0, 24.0, 42.0, 47.0, 103.0, 251.0, 952.0, 13599.0, 4093245.0, 83412.0, 1865.0, 370.0, 148.0, 66.0, 36.0, 32.0, 21.0, 10.0, 8.0, 5.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.78125, -6.494873046875, -6.20849609375, -5.922119140625, -5.6357421875, -5.349365234375, -5.06298828125, -4.776611328125, -4.490234375, -4.203857421875, -3.91748046875, -3.631103515625, -3.3447265625, -3.058349609375, -2.77197265625, -2.485595703125, -2.19921875, -1.912841796875, -1.62646484375, -1.340087890625, -1.0537109375, -0.767333984375, -0.48095703125, -0.194580078125, 0.091796875, 0.378173828125, 0.66455078125, 0.950927734375, 1.2373046875, 1.523681640625, 1.81005859375, 2.096435546875, 2.3828125, 2.669189453125, 2.95556640625, 3.241943359375, 3.5283203125, 3.814697265625, 4.10107421875, 4.387451171875, 4.673828125, 4.960205078125, 5.24658203125, 5.532958984375, 5.8193359375, 6.105712890625, 6.39208984375, 6.678466796875, 6.96484375, 7.251220703125, 7.53759765625, 7.823974609375, 8.1103515625, 8.396728515625, 8.68310546875, 8.969482421875, 9.255859375, 9.542236328125, 9.82861328125, 10.114990234375, 10.4013671875, 10.687744140625, 10.97412109375, 11.260498046875, 11.546875]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 5.0, 7.0, 7.0, 6.0, 14.0, 16.0, 24.0, 37.0, 41.0, 67.0, 110.0, 224.0, 456.0, 825.0, 932.0, 572.0, 302.0, 171.0, 105.0, 48.0, 44.0, 27.0, 18.0, 7.0, 6.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7666015625, -0.7394561767578125, -0.712310791015625, -0.6851654052734375, -0.65802001953125, -0.6308746337890625, -0.603729248046875, -0.5765838623046875, -0.5494384765625, -0.5222930908203125, -0.495147705078125, -0.4680023193359375, -0.44085693359375, -0.4137115478515625, -0.386566162109375, -0.3594207763671875, -0.332275390625, -0.3051300048828125, -0.277984619140625, -0.2508392333984375, -0.22369384765625, -0.1965484619140625, -0.169403076171875, -0.1422576904296875, -0.1151123046875, -0.0879669189453125, -0.060821533203125, -0.0336761474609375, -0.00653076171875, 0.0206146240234375, 0.047760009765625, 0.0749053955078125, 0.10205078125, 0.1291961669921875, 0.156341552734375, 0.1834869384765625, 0.21063232421875, 0.2377777099609375, 0.264923095703125, 0.2920684814453125, 0.3192138671875, 0.3463592529296875, 0.373504638671875, 0.4006500244140625, 0.42779541015625, 0.4549407958984375, 0.482086181640625, 0.5092315673828125, 0.536376953125, 0.5635223388671875, 0.590667724609375, 0.6178131103515625, 0.64495849609375, 0.6721038818359375, 0.699249267578125, 0.7263946533203125, 0.7535400390625, 0.7806854248046875, 0.807830810546875, 0.8349761962890625, 0.86212158203125, 0.8892669677734375, 0.916412353515625, 0.9435577392578125, 0.970703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 6.0, 2.0, 8.0, 2.0, 10.0, 10.0, 16.0, 16.0, 16.0, 24.0, 28.0, 39.0, 60.0, 41.0, 55.0, 58.0, 72.0, 77.0, 71.0, 72.0, 59.0, 55.0, 27.0, 32.0, 32.0, 31.0, 17.0, 13.0, 10.0, 9.0, 14.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6548538208007812, -1.6035499572753906, -1.5522462129592896, -1.500942349433899, -1.4496384859085083, -1.3983347415924072, -1.3470308780670166, -1.295727014541626, -1.2444231510162354, -1.1931192874908447, -1.1418155431747437, -1.090511679649353, -1.0392078161239624, -0.9879040122032166, -0.9366002082824707, -0.8852963447570801, -0.833992600440979, -0.7826887965202332, -0.7313849329948425, -0.6800811290740967, -0.628777265548706, -0.5774734616279602, -0.5261696577072144, -0.4748658239841461, -0.4235619902610779, -0.37225815653800964, -0.3209543228149414, -0.26965051889419556, -0.21834668517112732, -0.16704285144805908, -0.11573904752731323, -0.064435213804245, -0.013131260871887207, 0.03817256540060043, 0.08947639167308807, 0.14078021049499512, 0.19208404421806335, 0.2433878779411316, 0.29469168186187744, 0.3459955155849457, 0.3972993493080139, 0.44860318303108215, 0.4999070167541504, 0.5512108206748962, 0.6025146245956421, 0.6538184881210327, 0.7051222920417786, 0.7564260959625244, 0.807729959487915, 0.8590337634086609, 0.9103376269340515, 0.9616414308547974, 1.012945294380188, 1.064249038696289, 1.1155529022216797, 1.1668567657470703, 1.218160629272461, 1.2694644927978516, 1.3207682371139526, 1.3720721006393433, 1.4233759641647339, 1.474679708480835, 1.5259835720062256, 1.5772874355316162, 1.6285911798477173]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 3.0, 8.0, 11.0, 7.0, 12.0, 11.0, 12.0, 20.0, 7.0, 13.0, 12.0, 19.0, 21.0, 25.0, 29.0, 29.0, 21.0, 31.0, 26.0, 24.0, 37.0, 38.0, 33.0, 37.0, 34.0, 37.0, 26.0, 33.0, 31.0, 24.0, 33.0, 40.0, 26.0, 23.0, 30.0, 31.0, 13.0, 20.0, 12.0, 12.0, 13.0, 20.0, 7.0, 14.0, 11.0, 7.0, 8.0, 4.0, 7.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-1.110924482345581, -1.0798918008804321, -1.0488591194152832, -1.0178263187408447, -0.9867936372756958, -0.9557609558105469, -0.9247282147407532, -0.8936954736709595, -0.8626627922058105, -0.8316301107406616, -0.8005973696708679, -0.7695646286010742, -0.7385319471359253, -0.7074992656707764, -0.6764665246009827, -0.645433783531189, -0.61440110206604, -0.5833684206008911, -0.5523356795310974, -0.5213029384613037, -0.4902702569961548, -0.45923754572868347, -0.42820483446121216, -0.39717212319374084, -0.36613941192626953, -0.3351067006587982, -0.3040739893913269, -0.2730412781238556, -0.24200856685638428, -0.21097585558891296, -0.17994314432144165, -0.14891043305397034, -0.1178777813911438, -0.08684507012367249, -0.05581235885620117, -0.02477964758872986, 0.006253063678741455, 0.03728577494621277, 0.06831848621368408, 0.0993511974811554, 0.1303839087486267, 0.16141662001609802, 0.19244933128356934, 0.22348204255104065, 0.25451475381851196, 0.2855474650859833, 0.3165801763534546, 0.3476128876209259, 0.3786455988883972, 0.40967831015586853, 0.44071102142333984, 0.47174373269081116, 0.5027764439582825, 0.5338091850280762, 0.5648418664932251, 0.595874547958374, 0.6269072890281677, 0.6579400300979614, 0.6889727115631104, 0.7200053930282593, 0.751038134098053, 0.7820708751678467, 0.8131035566329956, 0.8441362380981445, 0.8751689791679382]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 4.0, 7.0, 9.0, 9.0, 21.0, 22.0, 34.0, 52.0, 78.0, 109.0, 156.0, 297.0, 468.0, 803.0, 1548.0, 2981.0, 5959.0, 12604.0, 29600.0, 78618.0, 214882.0, 375773.0, 199851.0, 72979.0, 27890.0, 11957.0, 5571.0, 2784.0, 1448.0, 770.0, 468.0, 301.0, 180.0, 94.0, 77.0, 53.0, 30.0, 23.0, 16.0, 8.0, 6.0, 2.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.77197265625, -0.74957275390625, -0.7271728515625, -0.70477294921875, -0.682373046875, -0.65997314453125, -0.6375732421875, -0.61517333984375, -0.5927734375, -0.57037353515625, -0.5479736328125, -0.52557373046875, -0.503173828125, -0.48077392578125, -0.4583740234375, -0.43597412109375, -0.41357421875, -0.39117431640625, -0.3687744140625, -0.34637451171875, -0.323974609375, -0.30157470703125, -0.2791748046875, -0.25677490234375, -0.234375, -0.21197509765625, -0.1895751953125, -0.16717529296875, -0.144775390625, -0.12237548828125, -0.0999755859375, -0.07757568359375, -0.05517578125, -0.03277587890625, -0.0103759765625, 0.01202392578125, 0.034423828125, 0.05682373046875, 0.0792236328125, 0.10162353515625, 0.1240234375, 0.14642333984375, 0.1688232421875, 0.19122314453125, 0.213623046875, 0.23602294921875, 0.2584228515625, 0.28082275390625, 0.30322265625, 0.32562255859375, 0.3480224609375, 0.37042236328125, 0.392822265625, 0.41522216796875, 0.4376220703125, 0.46002197265625, 0.482421875, 0.50482177734375, 0.5272216796875, 0.54962158203125, 0.572021484375, 0.59442138671875, 0.6168212890625, 0.63922119140625, 0.66162109375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 7.0, 4.0, 9.0, 15.0, 20.0, 17.0, 22.0, 30.0, 33.0, 40.0, 54.0, 40.0, 49.0, 78.0, 52.0, 67.0, 56.0, 60.0, 51.0, 50.0, 44.0, 45.0, 34.0, 40.0, 15.0, 26.0, 19.0, 10.0, 10.0, 7.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80126953125, -0.7671127319335938, -0.7329559326171875, -0.6987991333007812, -0.664642333984375, -0.6304855346679688, -0.5963287353515625, -0.5621719360351562, -0.52801513671875, -0.49385833740234375, -0.4597015380859375, -0.42554473876953125, -0.391387939453125, -0.35723114013671875, -0.3230743408203125, -0.28891754150390625, -0.2547607421875, -0.22060394287109375, -0.1864471435546875, -0.15229034423828125, -0.118133544921875, -0.08397674560546875, -0.0498199462890625, -0.01566314697265625, 0.01849365234375, 0.05265045166015625, 0.0868072509765625, 0.12096405029296875, 0.155120849609375, 0.18927764892578125, 0.2234344482421875, 0.25759124755859375, 0.291748046875, 0.32590484619140625, 0.3600616455078125, 0.39421844482421875, 0.428375244140625, 0.46253204345703125, 0.4966888427734375, 0.5308456420898438, 0.56500244140625, 0.5991592407226562, 0.6333160400390625, 0.6674728393554688, 0.701629638671875, 0.7357864379882812, 0.7699432373046875, 0.8041000366210938, 0.8382568359375, 0.8724136352539062, 0.9065704345703125, 0.9407272338867188, 0.974884033203125, 1.0090408325195312, 1.0431976318359375, 1.0773544311523438, 1.11151123046875, 1.1456680297851562, 1.1798248291015625, 1.2139816284179688, 1.248138427734375, 1.2822952270507812, 1.3164520263671875, 1.3506088256835938, 1.384765625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 4.0, 2.0, 4.0, 8.0, 8.0, 8.0, 8.0, 16.0, 25.0, 31.0, 51.0, 75.0, 119.0, 194.0, 273.0, 454.0, 842.0, 1780.0, 4262.0, 12538.0, 43227.0, 182446.0, 495086.0, 229479.0, 53566.0, 14810.0, 5103.0, 1912.0, 864.0, 483.0, 282.0, 181.0, 112.0, 86.0, 58.0, 41.0, 20.0, 29.0, 15.0, 9.0, 8.0, 12.0, 7.0, 6.0, 7.0, 2.0, 2.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9013671875, -0.8737030029296875, -0.846038818359375, -0.8183746337890625, -0.79071044921875, -0.7630462646484375, -0.735382080078125, -0.7077178955078125, -0.6800537109375, -0.6523895263671875, -0.624725341796875, -0.5970611572265625, -0.56939697265625, -0.5417327880859375, -0.514068603515625, -0.4864044189453125, -0.458740234375, -0.4310760498046875, -0.403411865234375, -0.3757476806640625, -0.34808349609375, -0.3204193115234375, -0.292755126953125, -0.2650909423828125, -0.2374267578125, -0.2097625732421875, -0.182098388671875, -0.1544342041015625, -0.12677001953125, -0.0991058349609375, -0.071441650390625, -0.0437774658203125, -0.01611328125, 0.0115509033203125, 0.039215087890625, 0.0668792724609375, 0.09454345703125, 0.1222076416015625, 0.149871826171875, 0.1775360107421875, 0.2052001953125, 0.2328643798828125, 0.260528564453125, 0.2881927490234375, 0.31585693359375, 0.3435211181640625, 0.371185302734375, 0.3988494873046875, 0.426513671875, 0.4541778564453125, 0.481842041015625, 0.5095062255859375, 0.53717041015625, 0.5648345947265625, 0.592498779296875, 0.6201629638671875, 0.6478271484375, 0.6754913330078125, 0.703155517578125, 0.7308197021484375, 0.75848388671875, 0.7861480712890625, 0.813812255859375, 0.8414764404296875, 0.869140625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 7.0, 3.0, 8.0, 9.0, 11.0, 8.0, 21.0, 21.0, 13.0, 23.0, 29.0, 30.0, 36.0, 44.0, 43.0, 49.0, 44.0, 53.0, 44.0, 55.0, 32.0, 56.0, 35.0, 43.0, 24.0, 33.0, 26.0, 36.0, 26.0, 31.0, 25.0, 15.0, 17.0, 12.0, 12.0, 9.0, 8.0, 10.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3193359375, -1.2689056396484375, -1.218475341796875, -1.1680450439453125, -1.11761474609375, -1.0671844482421875, -1.016754150390625, -0.9663238525390625, -0.9158935546875, -0.8654632568359375, -0.815032958984375, -0.7646026611328125, -0.71417236328125, -0.6637420654296875, -0.613311767578125, -0.5628814697265625, -0.512451171875, -0.4620208740234375, -0.411590576171875, -0.3611602783203125, -0.31072998046875, -0.2602996826171875, -0.209869384765625, -0.1594390869140625, -0.1090087890625, -0.0585784912109375, -0.008148193359375, 0.0422821044921875, 0.09271240234375, 0.1431427001953125, 0.193572998046875, 0.2440032958984375, 0.29443359375, 0.3448638916015625, 0.395294189453125, 0.4457244873046875, 0.49615478515625, 0.5465850830078125, 0.597015380859375, 0.6474456787109375, 0.6978759765625, 0.7483062744140625, 0.798736572265625, 0.8491668701171875, 0.89959716796875, 0.9500274658203125, 1.000457763671875, 1.0508880615234375, 1.101318359375, 1.1517486572265625, 1.202178955078125, 1.2526092529296875, 1.30303955078125, 1.3534698486328125, 1.403900146484375, 1.4543304443359375, 1.5047607421875, 1.5551910400390625, 1.605621337890625, 1.6560516357421875, 1.70648193359375, 1.7569122314453125, 1.807342529296875, 1.8577728271484375, 1.908203125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 8.0, 4.0, 11.0, 12.0, 13.0, 23.0, 34.0, 43.0, 57.0, 124.0, 156.0, 252.0, 387.0, 693.0, 1177.0, 2035.0, 3811.0, 8796.0, 23350.0, 84207.0, 439947.0, 375055.0, 71243.0, 20853.0, 7797.0, 3685.0, 1912.0, 1099.0, 664.0, 369.0, 247.0, 172.0, 100.0, 62.0, 54.0, 35.0, 20.0, 18.0, 11.0, 5.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.289794921875, -0.28173255920410156, -0.2736701965332031, -0.2656078338623047, -0.25754547119140625, -0.2494831085205078, -0.24142074584960938, -0.23335838317871094, -0.2252960205078125, -0.21723365783691406, -0.20917129516601562, -0.2011089324951172, -0.19304656982421875, -0.1849842071533203, -0.17692184448242188, -0.16885948181152344, -0.160797119140625, -0.15273475646972656, -0.14467239379882812, -0.1366100311279297, -0.12854766845703125, -0.12048530578613281, -0.11242294311523438, -0.10436058044433594, -0.0962982177734375, -0.08823585510253906, -0.08017349243164062, -0.07211112976074219, -0.06404876708984375, -0.05598640441894531, -0.047924041748046875, -0.03986167907714844, -0.03179931640625, -0.023736953735351562, -0.015674591064453125, -0.0076122283935546875, 0.00045013427734375, 0.008512496948242188, 0.016574859619140625, 0.024637222290039062, 0.0326995849609375, 0.04076194763183594, 0.048824310302734375, 0.05688667297363281, 0.06494903564453125, 0.07301139831542969, 0.08107376098632812, 0.08913612365722656, 0.097198486328125, 0.10526084899902344, 0.11332321166992188, 0.12138557434082031, 0.12944793701171875, 0.1375102996826172, 0.14557266235351562, 0.15363502502441406, 0.1616973876953125, 0.16975975036621094, 0.17782211303710938, 0.1858844757080078, 0.19394683837890625, 0.2020092010498047, 0.21007156372070312, 0.21813392639160156, 0.2261962890625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 11.0, 7.0, 20.0, 19.0, 34.0, 42.0, 56.0, 100.0, 123.0, 139.0, 138.0, 94.0, 65.0, 46.0, 26.0, 28.0, 16.0, 8.0, 5.0, 3.0, 2.0, 4.0, 5.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00022292137145996094, -0.00021646171808242798, -0.00021000206470489502, -0.00020354241132736206, -0.0001970827579498291, -0.00019062310457229614, -0.00018416345119476318, -0.00017770379781723022, -0.00017124414443969727, -0.0001647844910621643, -0.00015832483768463135, -0.0001518651843070984, -0.00014540553092956543, -0.00013894587755203247, -0.0001324862241744995, -0.00012602657079696655, -0.0001195669174194336, -0.00011310726404190063, -0.00010664761066436768, -0.00010018795728683472, -9.372830390930176e-05, -8.72686505317688e-05, -8.080899715423584e-05, -7.434934377670288e-05, -6.788969039916992e-05, -6.143003702163696e-05, -5.4970383644104004e-05, -4.8510730266571045e-05, -4.2051076889038086e-05, -3.559142351150513e-05, -2.9131770133972168e-05, -2.267211675643921e-05, -1.621246337890625e-05, -9.752810001373291e-06, -3.293156623840332e-06, 3.166496753692627e-06, 9.626150131225586e-06, 1.6085803508758545e-05, 2.2545456886291504e-05, 2.9005110263824463e-05, 3.546476364135742e-05, 4.192441701889038e-05, 4.838407039642334e-05, 5.48437237739563e-05, 6.130337715148926e-05, 6.776303052902222e-05, 7.422268390655518e-05, 8.068233728408813e-05, 8.71419906616211e-05, 9.360164403915405e-05, 0.00010006129741668701, 0.00010652095079421997, 0.00011298060417175293, 0.00011944025754928589, 0.00012589991092681885, 0.0001323595643043518, 0.00013881921768188477, 0.00014527887105941772, 0.00015173852443695068, 0.00015819817781448364, 0.0001646578311920166, 0.00017111748456954956, 0.00017757713794708252, 0.00018403679132461548, 0.00019049644470214844]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 5.0, 13.0, 9.0, 5.0, 23.0, 27.0, 48.0, 102.0, 175.0, 323.0, 618.0, 1376.0, 3473.0, 11278.0, 56954.0, 554937.0, 366696.0, 38884.0, 8545.0, 2831.0, 1078.0, 520.0, 279.0, 156.0, 67.0, 40.0, 33.0, 22.0, 11.0, 8.0, 7.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.42138671875, -0.40996551513671875, -0.3985443115234375, -0.38712310791015625, -0.375701904296875, -0.36428070068359375, -0.3528594970703125, -0.34143829345703125, -0.33001708984375, -0.31859588623046875, -0.3071746826171875, -0.29575347900390625, -0.284332275390625, -0.27291107177734375, -0.2614898681640625, -0.25006866455078125, -0.2386474609375, -0.22722625732421875, -0.2158050537109375, -0.20438385009765625, -0.192962646484375, -0.18154144287109375, -0.1701202392578125, -0.15869903564453125, -0.14727783203125, -0.13585662841796875, -0.1244354248046875, -0.11301422119140625, -0.101593017578125, -0.09017181396484375, -0.0787506103515625, -0.06732940673828125, -0.055908203125, -0.04448699951171875, -0.0330657958984375, -0.02164459228515625, -0.010223388671875, 0.00119781494140625, 0.0126190185546875, 0.02404022216796875, 0.03546142578125, 0.04688262939453125, 0.0583038330078125, 0.06972503662109375, 0.081146240234375, 0.09256744384765625, 0.1039886474609375, 0.11540985107421875, 0.1268310546875, 0.13825225830078125, 0.1496734619140625, 0.16109466552734375, 0.172515869140625, 0.18393707275390625, 0.1953582763671875, 0.20677947998046875, 0.21820068359375, 0.22962188720703125, 0.2410430908203125, 0.25246429443359375, 0.263885498046875, 0.27530670166015625, 0.2867279052734375, 0.29814910888671875, 0.3095703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 3.0, 2.0, 7.0, 0.0, 3.0, 3.0, 8.0, 10.0, 17.0, 21.0, 23.0, 35.0, 47.0, 52.0, 55.0, 58.0, 70.0, 91.0, 98.0, 74.0, 79.0, 57.0, 45.0, 40.0, 27.0, 24.0, 8.0, 7.0, 9.0, 1.0, 4.0, 5.0, 4.0, 1.0, 5.0, 1.0, 1.0, 4.0, 2.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.057098388671875, -0.05505228042602539, -0.05300617218017578, -0.05096006393432617, -0.04891395568847656, -0.04686784744262695, -0.044821739196777344, -0.042775630950927734, -0.040729522705078125, -0.038683414459228516, -0.036637306213378906, -0.0345911979675293, -0.03254508972167969, -0.030498981475830078, -0.02845287322998047, -0.02640676498413086, -0.02436065673828125, -0.02231454849243164, -0.02026844024658203, -0.018222332000732422, -0.016176223754882812, -0.014130115509033203, -0.012084007263183594, -0.010037899017333984, -0.007991790771484375, -0.005945682525634766, -0.0038995742797851562, -0.0018534660339355469, 0.0001926422119140625, 0.002238750457763672, 0.004284858703613281, 0.006330966949462891, 0.0083770751953125, 0.01042318344116211, 0.012469291687011719, 0.014515399932861328, 0.016561508178710938, 0.018607616424560547, 0.020653724670410156, 0.022699832916259766, 0.024745941162109375, 0.026792049407958984, 0.028838157653808594, 0.030884265899658203, 0.03293037414550781, 0.03497648239135742, 0.03702259063720703, 0.03906869888305664, 0.04111480712890625, 0.04316091537475586, 0.04520702362060547, 0.04725313186645508, 0.04929924011230469, 0.0513453483581543, 0.053391456604003906, 0.055437564849853516, 0.057483673095703125, 0.059529781341552734, 0.061575889587402344, 0.06362199783325195, 0.06566810607910156, 0.06771421432495117, 0.06976032257080078, 0.07180643081665039, 0.0738525390625]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 4.0, 5.0, 11.0, 12.0, 20.0, 30.0, 44.0, 66.0, 72.0, 92.0, 117.0, 124.0, 112.0, 88.0, 68.0, 32.0, 31.0, 23.0, 16.0, 6.0, 8.0, 5.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.134186029434204, -1.085532546043396, -1.036879062652588, -0.9882256388664246, -0.9395721554756165, -0.8909186720848083, -0.842265248298645, -0.7936117649078369, -0.7449582815170288, -0.6963047981262207, -0.6476513147354126, -0.5989978909492493, -0.5503444075584412, -0.5016909241676331, -0.45303747057914734, -0.4043840169906616, -0.3557305335998535, -0.3070770502090454, -0.2584235966205597, -0.20977012813091278, -0.16111665964126587, -0.11246319115161896, -0.06380972266197205, -0.015156269073486328, 0.03349721431732178, 0.08215068280696869, 0.1308041512966156, 0.1794576197862625, 0.22811108827590942, 0.27676457166671753, 0.32541802525520325, 0.37407147884368896, 0.4227250814437866, 0.4713785648345947, 0.5200320482254028, 0.5686854720115662, 0.6173389554023743, 0.6659924387931824, 0.7146458625793457, 0.7632993459701538, 0.8119528293609619, 0.86060631275177, 0.9092597961425781, 0.9579132199287415, 1.0065667629241943, 1.055220127105713, 1.103873610496521, 1.152527093887329, 1.2011805772781372, 1.2498340606689453, 1.2984875440597534, 1.3471410274505615, 1.39579439163208, 1.4444478750228882, 1.4931013584136963, 1.5417548418045044, 1.5904083251953125, 1.6390618085861206, 1.6877152919769287, 1.7363687753677368, 1.785022258758545, 1.8336756229400635, 1.8823291063308716, 1.9309825897216797, 1.9796360731124878]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 6.0, 4.0, 11.0, 18.0, 20.0, 25.0, 34.0, 30.0, 48.0, 53.0, 47.0, 71.0, 75.0, 56.0, 80.0, 53.0, 68.0, 55.0, 70.0, 39.0, 37.0, 36.0, 26.0, 14.0, 20.0, 10.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7447429895401001, -0.7064555883407593, -0.6681681275367737, -0.6298807263374329, -0.5915932655334473, -0.5533058643341064, -0.5150184631347656, -0.47673100233078003, -0.4384435713291168, -0.4001561403274536, -0.3618687093257904, -0.3235812783241272, -0.2852938771247864, -0.24700643122196198, -0.20871901512145996, -0.17043158411979675, -0.13214415311813354, -0.09385672211647034, -0.055569298565387726, -0.017281875014305115, 0.021005555987358093, 0.0592929869890213, 0.09758040308952332, 0.13586783409118652, 0.17415526509284973, 0.21244269609451294, 0.25073012709617615, 0.28901755809783936, 0.3273049592971802, 0.36559242010116577, 0.4038798213005066, 0.4421672523021698, 0.480454683303833, 0.5187420845031738, 0.5570295453071594, 0.5953169465065002, 0.6336044073104858, 0.6718918085098267, 0.7101792097091675, 0.7484666705131531, 0.7867541313171387, 0.8250415325164795, 0.8633289933204651, 0.9016163945198059, 0.9399038553237915, 0.9781912565231323, 1.0164786577224731, 1.0547661781311035, 1.0930535793304443, 1.1313409805297852, 1.169628381729126, 1.2079159021377563, 1.2462033033370972, 1.284490704536438, 1.3227781057357788, 1.3610656261444092, 1.3993529081344604, 1.4376403093338013, 1.475927710533142, 1.5142152309417725, 1.5525026321411133, 1.590790033340454, 1.629077434539795, 1.6673648357391357, 1.7056523561477661]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 4.0, 3.0, 9.0, 12.0, 11.0, 14.0, 37.0, 43.0, 62.0, 90.0, 147.0, 233.0, 346.0, 600.0, 1009.0, 1828.0, 3260.0, 6548.0, 17044.0, 67973.0, 575906.0, 304825.0, 44025.0, 12819.0, 5258.0, 2702.0, 1457.0, 850.0, 525.0, 328.0, 191.0, 127.0, 98.0, 49.0, 47.0, 21.0, 18.0, 20.0, 7.0, 7.0, 9.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.697265625, -0.669219970703125, -0.64117431640625, -0.613128662109375, -0.5850830078125, -0.557037353515625, -0.52899169921875, -0.500946044921875, -0.472900390625, -0.444854736328125, -0.41680908203125, -0.388763427734375, -0.3607177734375, -0.332672119140625, -0.30462646484375, -0.276580810546875, -0.24853515625, -0.220489501953125, -0.19244384765625, -0.164398193359375, -0.1363525390625, -0.108306884765625, -0.08026123046875, -0.052215576171875, -0.024169921875, 0.003875732421875, 0.03192138671875, 0.059967041015625, 0.0880126953125, 0.116058349609375, 0.14410400390625, 0.172149658203125, 0.2001953125, 0.228240966796875, 0.25628662109375, 0.284332275390625, 0.3123779296875, 0.340423583984375, 0.36846923828125, 0.396514892578125, 0.424560546875, 0.452606201171875, 0.48065185546875, 0.508697509765625, 0.5367431640625, 0.564788818359375, 0.59283447265625, 0.620880126953125, 0.64892578125, 0.676971435546875, 0.70501708984375, 0.733062744140625, 0.7611083984375, 0.789154052734375, 0.81719970703125, 0.845245361328125, 0.873291015625, 0.901336669921875, 0.92938232421875, 0.957427978515625, 0.9854736328125, 1.013519287109375, 1.04156494140625, 1.069610595703125, 1.09765625]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 5.0, 7.0, 3.0, 9.0, 14.0, 29.0, 30.0, 34.0, 48.0, 55.0, 74.0, 87.0, 79.0, 93.0, 84.0, 69.0, 63.0, 69.0, 53.0, 34.0, 33.0, 17.0, 11.0, 7.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.427734375, -1.340240478515625, -1.25274658203125, -1.165252685546875, -1.0777587890625, -0.990264892578125, -0.90277099609375, -0.815277099609375, -0.727783203125, -0.640289306640625, -0.55279541015625, -0.465301513671875, -0.3778076171875, -0.290313720703125, -0.20281982421875, -0.115325927734375, -0.02783203125, 0.059661865234375, 0.14715576171875, 0.234649658203125, 0.3221435546875, 0.409637451171875, 0.49713134765625, 0.584625244140625, 0.672119140625, 0.759613037109375, 0.84710693359375, 0.934600830078125, 1.0220947265625, 1.109588623046875, 1.19708251953125, 1.284576416015625, 1.3720703125, 1.459564208984375, 1.54705810546875, 1.634552001953125, 1.7220458984375, 1.809539794921875, 1.89703369140625, 1.984527587890625, 2.072021484375, 2.159515380859375, 2.24700927734375, 2.334503173828125, 2.4219970703125, 2.509490966796875, 2.59698486328125, 2.684478759765625, 2.77197265625, 2.859466552734375, 2.94696044921875, 3.034454345703125, 3.1219482421875, 3.209442138671875, 3.29693603515625, 3.384429931640625, 3.471923828125, 3.559417724609375, 3.64691162109375, 3.734405517578125, 3.8218994140625, 3.909393310546875, 3.99688720703125, 4.084381103515625, 4.171875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 2.0, 6.0, 8.0, 6.0, 18.0, 14.0, 19.0, 19.0, 16.0, 28.0, 44.0, 38.0, 67.0, 83.0, 174.0, 791.0, 20019.0, 1019826.0, 6318.0, 497.0, 133.0, 88.0, 80.0, 41.0, 51.0, 24.0, 33.0, 16.0, 12.0, 13.0, 10.0, 19.0, 8.0, 5.0, 4.0, 2.0, 4.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.88671875, -3.74468994140625, -3.6026611328125, -3.46063232421875, -3.318603515625, -3.17657470703125, -3.0345458984375, -2.89251708984375, -2.75048828125, -2.60845947265625, -2.4664306640625, -2.32440185546875, -2.182373046875, -2.04034423828125, -1.8983154296875, -1.75628662109375, -1.6142578125, -1.47222900390625, -1.3302001953125, -1.18817138671875, -1.046142578125, -0.90411376953125, -0.7620849609375, -0.62005615234375, -0.47802734375, -0.33599853515625, -0.1939697265625, -0.05194091796875, 0.090087890625, 0.23211669921875, 0.3741455078125, 0.51617431640625, 0.658203125, 0.80023193359375, 0.9422607421875, 1.08428955078125, 1.226318359375, 1.36834716796875, 1.5103759765625, 1.65240478515625, 1.79443359375, 1.93646240234375, 2.0784912109375, 2.22052001953125, 2.362548828125, 2.50457763671875, 2.6466064453125, 2.78863525390625, 2.9306640625, 3.07269287109375, 3.2147216796875, 3.35675048828125, 3.498779296875, 3.64080810546875, 3.7828369140625, 3.92486572265625, 4.06689453125, 4.20892333984375, 4.3509521484375, 4.49298095703125, 4.635009765625, 4.77703857421875, 4.9190673828125, 5.06109619140625, 5.203125]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 7.0, 3.0, 9.0, 5.0, 12.0, 20.0, 13.0, 19.0, 15.0, 23.0, 39.0, 25.0, 39.0, 35.0, 47.0, 54.0, 60.0, 51.0, 63.0, 62.0, 47.0, 53.0, 60.0, 39.0, 36.0, 29.0, 34.0, 15.0, 13.0, 8.0, 17.0, 10.0, 11.0, 5.0, 5.0, 2.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.716796875, -1.65679931640625, -1.5968017578125, -1.53680419921875, -1.476806640625, -1.41680908203125, -1.3568115234375, -1.29681396484375, -1.23681640625, -1.17681884765625, -1.1168212890625, -1.05682373046875, -0.996826171875, -0.93682861328125, -0.8768310546875, -0.81683349609375, -0.7568359375, -0.69683837890625, -0.6368408203125, -0.57684326171875, -0.516845703125, -0.45684814453125, -0.3968505859375, -0.33685302734375, -0.27685546875, -0.21685791015625, -0.1568603515625, -0.09686279296875, -0.036865234375, 0.02313232421875, 0.0831298828125, 0.14312744140625, 0.203125, 0.26312255859375, 0.3231201171875, 0.38311767578125, 0.443115234375, 0.50311279296875, 0.5631103515625, 0.62310791015625, 0.68310546875, 0.74310302734375, 0.8031005859375, 0.86309814453125, 0.923095703125, 0.98309326171875, 1.0430908203125, 1.10308837890625, 1.1630859375, 1.22308349609375, 1.2830810546875, 1.34307861328125, 1.403076171875, 1.46307373046875, 1.5230712890625, 1.58306884765625, 1.64306640625, 1.70306396484375, 1.7630615234375, 1.82305908203125, 1.883056640625, 1.94305419921875, 2.0030517578125, 2.06304931640625, 2.123046875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 5.0, 8.0, 8.0, 11.0, 18.0, 28.0, 53.0, 133.0, 416.0, 2364.0, 41760.0, 991346.0, 10786.0, 1134.0, 271.0, 93.0, 33.0, 23.0, 18.0, 13.0, 14.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0], "bins": [-1.9453125, -1.8945465087890625, -1.843780517578125, -1.7930145263671875, -1.74224853515625, -1.6914825439453125, -1.640716552734375, -1.5899505615234375, -1.5391845703125, -1.4884185791015625, -1.437652587890625, -1.3868865966796875, -1.33612060546875, -1.2853546142578125, -1.234588623046875, -1.1838226318359375, -1.133056640625, -1.0822906494140625, -1.031524658203125, -0.9807586669921875, -0.92999267578125, -0.8792266845703125, -0.828460693359375, -0.7776947021484375, -0.7269287109375, -0.6761627197265625, -0.625396728515625, -0.5746307373046875, -0.52386474609375, -0.4730987548828125, -0.422332763671875, -0.3715667724609375, -0.32080078125, -0.2700347900390625, -0.219268798828125, -0.1685028076171875, -0.11773681640625, -0.0669708251953125, -0.016204833984375, 0.0345611572265625, 0.0853271484375, 0.1360931396484375, 0.186859130859375, 0.2376251220703125, 0.28839111328125, 0.3391571044921875, 0.389923095703125, 0.4406890869140625, 0.491455078125, 0.5422210693359375, 0.592987060546875, 0.6437530517578125, 0.69451904296875, 0.7452850341796875, 0.796051025390625, 0.8468170166015625, 0.8975830078125, 0.9483489990234375, 0.999114990234375, 1.0498809814453125, 1.10064697265625, 1.1514129638671875, 1.202178955078125, 1.2529449462890625, 1.3037109375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 6.0, 4.0, 5.0, 10.0, 8.0, 14.0, 22.0, 39.0, 55.0, 140.0, 321.0, 163.0, 76.0, 33.0, 29.0, 14.0, 13.0, 8.0, 8.0, 6.0, 4.0, 3.0, 3.0, 3.0, 3.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.728006362915039e-05, -5.474220961332321e-05, -5.220435559749603e-05, -4.9666501581668854e-05, -4.7128647565841675e-05, -4.4590793550014496e-05, -4.205293953418732e-05, -3.951508551836014e-05, -3.697723150253296e-05, -3.443937748670578e-05, -3.19015234708786e-05, -2.9363669455051422e-05, -2.6825815439224243e-05, -2.4287961423397064e-05, -2.1750107407569885e-05, -1.9212253391742706e-05, -1.6674399375915527e-05, -1.4136545360088348e-05, -1.159869134426117e-05, -9.06083732843399e-06, -6.5229833126068115e-06, -3.9851292967796326e-06, -1.4472752809524536e-06, 1.0905787348747253e-06, 3.6284327507019043e-06, 6.166286766529083e-06, 8.704140782356262e-06, 1.1241994798183441e-05, 1.377984881401062e-05, 1.63177028298378e-05, 1.8855556845664978e-05, 2.1393410861492157e-05, 2.3931264877319336e-05, 2.6469118893146515e-05, 2.9006972908973694e-05, 3.154482692480087e-05, 3.408268094062805e-05, 3.662053495645523e-05, 3.915838897228241e-05, 4.169624298810959e-05, 4.423409700393677e-05, 4.6771951019763947e-05, 4.9309805035591125e-05, 5.1847659051418304e-05, 5.4385513067245483e-05, 5.692336708307266e-05, 5.946122109889984e-05, 6.199907511472702e-05, 6.45369291305542e-05, 6.707478314638138e-05, 6.961263716220856e-05, 7.215049117803574e-05, 7.468834519386292e-05, 7.72261992096901e-05, 7.976405322551727e-05, 8.230190724134445e-05, 8.483976125717163e-05, 8.737761527299881e-05, 8.991546928882599e-05, 9.245332330465317e-05, 9.499117732048035e-05, 9.752903133630753e-05, 0.0001000668853521347, 0.00010260473936796188, 0.00010514259338378906]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 10.0, 11.0, 10.0, 20.0, 24.0, 46.0, 70.0, 166.0, 605.0, 3116.0, 32659.0, 970540.0, 36698.0, 3488.0, 650.0, 213.0, 92.0, 56.0, 28.0, 12.0, 17.0, 11.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94873046875, -0.9115524291992188, -0.8743743896484375, -0.8371963500976562, -0.800018310546875, -0.7628402709960938, -0.7256622314453125, -0.6884841918945312, -0.65130615234375, -0.6141281127929688, -0.5769500732421875, -0.5397720336914062, -0.502593994140625, -0.46541595458984375, -0.4282379150390625, -0.39105987548828125, -0.3538818359375, -0.31670379638671875, -0.2795257568359375, -0.24234771728515625, -0.205169677734375, -0.16799163818359375, -0.1308135986328125, -0.09363555908203125, -0.05645751953125, -0.01927947998046875, 0.0178985595703125, 0.05507659912109375, 0.092254638671875, 0.12943267822265625, 0.1666107177734375, 0.20378875732421875, 0.240966796875, 0.27814483642578125, 0.3153228759765625, 0.35250091552734375, 0.389678955078125, 0.42685699462890625, 0.4640350341796875, 0.5012130737304688, 0.53839111328125, 0.5755691528320312, 0.6127471923828125, 0.6499252319335938, 0.687103271484375, 0.7242813110351562, 0.7614593505859375, 0.7986373901367188, 0.8358154296875, 0.8729934692382812, 0.9101715087890625, 0.9473495483398438, 0.984527587890625, 1.0217056274414062, 1.0588836669921875, 1.0960617065429688, 1.13323974609375, 1.1704177856445312, 1.2075958251953125, 1.2447738647460938, 1.281951904296875, 1.3191299438476562, 1.3563079833984375, 1.3934860229492188, 1.4306640625]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 5.0, 7.0, 8.0, 10.0, 7.0, 21.0, 19.0, 33.0, 44.0, 85.0, 142.0, 264.0, 117.0, 66.0, 46.0, 27.0, 20.0, 16.0, 16.0, 6.0, 6.0, 7.0, 5.0, 2.0, 5.0, 2.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.2310791015625, -0.22473716735839844, -0.21839523315429688, -0.2120532989501953, -0.20571136474609375, -0.1993694305419922, -0.19302749633789062, -0.18668556213378906, -0.1803436279296875, -0.17400169372558594, -0.16765975952148438, -0.1613178253173828, -0.15497589111328125, -0.1486339569091797, -0.14229202270507812, -0.13595008850097656, -0.129608154296875, -0.12326622009277344, -0.11692428588867188, -0.11058235168457031, -0.10424041748046875, -0.09789848327636719, -0.09155654907226562, -0.08521461486816406, -0.0788726806640625, -0.07253074645996094, -0.06618881225585938, -0.05984687805175781, -0.05350494384765625, -0.04716300964355469, -0.040821075439453125, -0.03447914123535156, -0.02813720703125, -0.021795272827148438, -0.015453338623046875, -0.009111404418945312, -0.00276947021484375, 0.0035724639892578125, 0.009914398193359375, 0.016256332397460938, 0.0225982666015625, 0.028940200805664062, 0.035282135009765625, 0.04162406921386719, 0.04796600341796875, 0.05430793762207031, 0.060649871826171875, 0.06699180603027344, 0.073333740234375, 0.07967567443847656, 0.08601760864257812, 0.09235954284667969, 0.09870147705078125, 0.10504341125488281, 0.11138534545898438, 0.11772727966308594, 0.1240692138671875, 0.13041114807128906, 0.13675308227539062, 0.1430950164794922, 0.14943695068359375, 0.1557788848876953, 0.16212081909179688, 0.16846275329589844, 0.1748046875]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 48.0, 340.0, 529.0, 83.0, 12.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.88618803024292, -2.3323416709899902, -1.7784953117370605, -1.2246489524841309, -0.6708025932312012, -0.11695623397827148, 0.4368901252746582, 0.9907364845275879, 1.5445828437805176, 2.0984292030334473, 2.652275562286377, 3.2061219215393066, 3.7599682807922363, 4.313814640045166, 4.867660999298096, 5.421507358551025, 5.975353717803955, 6.529200077056885, 7.0830464363098145, 7.636892795562744, 8.190738677978516, 8.744585037231445, 9.298431396484375, 9.852277755737305, 10.406124114990234, 10.959970474243164, 11.513816833496094, 12.067663192749023, 12.621509552001953, 13.175355911254883, 13.729202270507812, 14.283048629760742, 14.836894989013672, 15.390741348266602, 15.944587707519531, 16.49843406677246, 17.05228042602539, 17.60612678527832, 18.15997314453125, 18.71381950378418, 19.26766586303711, 19.82151222229004, 20.37535858154297, 20.9292049407959, 21.483051300048828, 22.036897659301758, 22.590744018554688, 23.144590377807617, 23.698436737060547, 24.252283096313477, 24.806129455566406, 25.359975814819336, 25.913822174072266, 26.467668533325195, 27.021514892578125, 27.575361251831055, 28.129207611083984, 28.683053970336914, 29.236900329589844, 29.790746688842773, 30.344593048095703, 30.898439407348633, 31.452285766601562, 32.006134033203125, 32.55997848510742]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 11.0, 5.0, 6.0, 9.0, 21.0, 21.0, 35.0, 40.0, 57.0, 59.0, 51.0, 66.0, 62.0, 56.0, 70.0, 55.0, 74.0, 48.0, 50.0, 53.0, 41.0, 31.0, 24.0, 20.0, 12.0, 9.0, 7.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1350769996643066, -2.024895429611206, -1.9147138595581055, -1.8045322895050049, -1.6943506002426147, -1.5841690301895142, -1.4739874601364136, -1.3638057708740234, -1.2536242008209229, -1.1434426307678223, -1.0332610607147217, -0.9230794310569763, -0.812897801399231, -0.7027162313461304, -0.5925346612930298, -0.4823530316352844, -0.3721715211868286, -0.26198992133140564, -0.15180833637714386, -0.04162675142288208, 0.0685548484325409, 0.17873644828796387, 0.28891801834106445, 0.3990996479988098, 0.5092812180519104, 0.619462788105011, 0.7296444177627563, 0.8398259878158569, 0.9500075578689575, 1.0601892471313477, 1.1703708171844482, 1.2805523872375488, 1.3907339572906494, 1.50091552734375, 1.6110970973968506, 1.7212786674499512, 1.8314603567123413, 1.941641926765442, 2.051823616027832, 2.1620051860809326, 2.272186756134033, 2.382368326187134, 2.4925498962402344, 2.602731466293335, 2.7129130363464355, 2.8230948448181152, 2.9332761764526367, 3.0434579849243164, 3.153639316558838, 3.2638208866119385, 3.374002456665039, 3.4841840267181396, 3.5943655967712402, 3.70454740524292, 3.8147287368774414, 3.924910545349121, 4.035092353820801, 4.1452741622924805, 4.255455493927002, 4.365637302398682, 4.475818634033203, 4.586000442504883, 4.696181774139404, 4.806363582611084, 4.9165449142456055]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 3.0, 4.0, 12.0, 17.0, 17.0, 28.0, 42.0, 67.0, 72.0, 120.0, 207.0, 327.0, 498.0, 913.0, 1686.0, 3269.0, 7009.0, 17463.0, 61431.0, 462632.0, 2601840.0, 890741.0, 102447.0, 24788.0, 9423.0, 4167.0, 2178.0, 1109.0, 649.0, 363.0, 272.0, 141.0, 107.0, 70.0, 39.0, 30.0, 34.0, 19.0, 17.0, 12.0, 8.0, 5.0, 4.0, 4.0, 1.0, 2.0], "bins": [-2.08203125, -2.028167724609375, -1.97430419921875, -1.920440673828125, -1.8665771484375, -1.812713623046875, -1.75885009765625, -1.704986572265625, -1.651123046875, -1.597259521484375, -1.54339599609375, -1.489532470703125, -1.4356689453125, -1.381805419921875, -1.32794189453125, -1.274078369140625, -1.22021484375, -1.166351318359375, -1.11248779296875, -1.058624267578125, -1.0047607421875, -0.950897216796875, -0.89703369140625, -0.843170166015625, -0.789306640625, -0.735443115234375, -0.68157958984375, -0.627716064453125, -0.5738525390625, -0.519989013671875, -0.46612548828125, -0.412261962890625, -0.3583984375, -0.304534912109375, -0.25067138671875, -0.196807861328125, -0.1429443359375, -0.089080810546875, -0.03521728515625, 0.018646240234375, 0.072509765625, 0.126373291015625, 0.18023681640625, 0.234100341796875, 0.2879638671875, 0.341827392578125, 0.39569091796875, 0.449554443359375, 0.50341796875, 0.557281494140625, 0.61114501953125, 0.665008544921875, 0.7188720703125, 0.772735595703125, 0.82659912109375, 0.880462646484375, 0.934326171875, 0.988189697265625, 1.04205322265625, 1.095916748046875, 1.1497802734375, 1.203643798828125, 1.25750732421875, 1.311370849609375, 1.365234375]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 9.0, 6.0, 16.0, 17.0, 21.0, 14.0, 19.0, 27.0, 33.0, 38.0, 49.0, 56.0, 43.0, 50.0, 51.0, 59.0, 49.0, 37.0, 56.0, 57.0, 43.0, 47.0, 33.0, 20.0, 23.0, 37.0, 17.0, 21.0, 16.0, 10.0, 5.0, 10.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1025390625, -1.069793701171875, -1.03704833984375, -1.004302978515625, -0.9715576171875, -0.938812255859375, -0.90606689453125, -0.873321533203125, -0.840576171875, -0.807830810546875, -0.77508544921875, -0.742340087890625, -0.7095947265625, -0.676849365234375, -0.64410400390625, -0.611358642578125, -0.57861328125, -0.545867919921875, -0.51312255859375, -0.480377197265625, -0.4476318359375, -0.414886474609375, -0.38214111328125, -0.349395751953125, -0.316650390625, -0.283905029296875, -0.25115966796875, -0.218414306640625, -0.1856689453125, -0.152923583984375, -0.12017822265625, -0.087432861328125, -0.0546875, -0.021942138671875, 0.01080322265625, 0.043548583984375, 0.0762939453125, 0.109039306640625, 0.14178466796875, 0.174530029296875, 0.207275390625, 0.240020751953125, 0.27276611328125, 0.305511474609375, 0.3382568359375, 0.371002197265625, 0.40374755859375, 0.436492919921875, 0.46923828125, 0.501983642578125, 0.53472900390625, 0.567474365234375, 0.6002197265625, 0.632965087890625, 0.66571044921875, 0.698455810546875, 0.731201171875, 0.763946533203125, 0.79669189453125, 0.829437255859375, 0.8621826171875, 0.894927978515625, 0.92767333984375, 0.960418701171875, 0.9931640625]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 6.0, 8.0, 5.0, 5.0, 10.0, 18.0, 21.0, 34.0, 52.0, 66.0, 125.0, 206.0, 351.0, 716.0, 1653.0, 5264.0, 26523.0, 385369.0, 3640898.0, 113759.0, 13522.0, 3250.0, 1124.0, 518.0, 269.0, 175.0, 107.0, 51.0, 49.0, 43.0, 26.0, 15.0, 13.0, 3.0, 7.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.703125, -2.61395263671875, -2.5247802734375, -2.43560791015625, -2.346435546875, -2.25726318359375, -2.1680908203125, -2.07891845703125, -1.98974609375, -1.90057373046875, -1.8114013671875, -1.72222900390625, -1.633056640625, -1.54388427734375, -1.4547119140625, -1.36553955078125, -1.2763671875, -1.18719482421875, -1.0980224609375, -1.00885009765625, -0.919677734375, -0.83050537109375, -0.7413330078125, -0.65216064453125, -0.56298828125, -0.47381591796875, -0.3846435546875, -0.29547119140625, -0.206298828125, -0.11712646484375, -0.0279541015625, 0.06121826171875, 0.150390625, 0.23956298828125, 0.3287353515625, 0.41790771484375, 0.507080078125, 0.59625244140625, 0.6854248046875, 0.77459716796875, 0.86376953125, 0.95294189453125, 1.0421142578125, 1.13128662109375, 1.220458984375, 1.30963134765625, 1.3988037109375, 1.48797607421875, 1.5771484375, 1.66632080078125, 1.7554931640625, 1.84466552734375, 1.933837890625, 2.02301025390625, 2.1121826171875, 2.20135498046875, 2.29052734375, 2.37969970703125, 2.4688720703125, 2.55804443359375, 2.647216796875, 2.73638916015625, 2.8255615234375, 2.91473388671875, 3.00390625]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 4.0, 8.0, 8.0, 16.0, 12.0, 27.0, 35.0, 33.0, 75.0, 88.0, 133.0, 222.0, 440.0, 718.0, 863.0, 530.0, 293.0, 178.0, 116.0, 81.0, 54.0, 56.0, 29.0, 15.0, 12.0, 5.0, 4.0, 6.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.65576171875, -0.636016845703125, -0.61627197265625, -0.596527099609375, -0.5767822265625, -0.557037353515625, -0.53729248046875, -0.517547607421875, -0.497802734375, -0.478057861328125, -0.45831298828125, -0.438568115234375, -0.4188232421875, -0.399078369140625, -0.37933349609375, -0.359588623046875, -0.33984375, -0.320098876953125, -0.30035400390625, -0.280609130859375, -0.2608642578125, -0.241119384765625, -0.22137451171875, -0.201629638671875, -0.181884765625, -0.162139892578125, -0.14239501953125, -0.122650146484375, -0.1029052734375, -0.083160400390625, -0.06341552734375, -0.043670654296875, -0.02392578125, -0.004180908203125, 0.01556396484375, 0.035308837890625, 0.0550537109375, 0.074798583984375, 0.09454345703125, 0.114288330078125, 0.134033203125, 0.153778076171875, 0.17352294921875, 0.193267822265625, 0.2130126953125, 0.232757568359375, 0.25250244140625, 0.272247314453125, 0.2919921875, 0.311737060546875, 0.33148193359375, 0.351226806640625, 0.3709716796875, 0.390716552734375, 0.41046142578125, 0.430206298828125, 0.449951171875, 0.469696044921875, 0.48944091796875, 0.509185791015625, 0.5289306640625, 0.548675537109375, 0.56842041015625, 0.588165283203125, 0.60791015625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 2.0, 3.0, 6.0, 16.0, 24.0, 23.0, 26.0, 37.0, 61.0, 84.0, 90.0, 105.0, 102.0, 98.0, 83.0, 77.0, 55.0, 36.0, 22.0, 15.0, 10.0, 7.0, 9.0, 4.0, 2.0, 0.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3182934522628784, -1.2503814697265625, -1.1824694871902466, -1.1145575046539307, -1.0466454029083252, -0.9787334203720093, -0.9108214378356934, -0.8429094552993774, -0.7749974131584167, -0.7070854306221008, -0.6391733884811401, -0.5712614059448242, -0.5033494234085083, -0.4354373812675476, -0.3675253987312317, -0.2996133863925934, -0.23170137405395508, -0.16378936171531677, -0.09587736427783966, -0.02796536684036255, 0.03994664549827576, 0.10785865783691406, 0.17577064037322998, 0.2436826527118683, 0.3115946650505066, 0.3795066773891449, 0.4474186897277832, 0.5153306722640991, 0.583242654800415, 0.6511546969413757, 0.7190666794776917, 0.7869787216186523, 0.8548908233642578, 0.9228028059005737, 0.9907148480415344, 1.0586268901824951, 1.126538872718811, 1.194450855255127, 1.2623628377914429, 1.3302748203277588, 1.3981869220733643, 1.4660989046096802, 1.534010887145996, 1.6019229888916016, 1.6698349714279175, 1.7377469539642334, 1.8056589365005493, 1.8735709190368652, 1.9414829015731812, 2.009394884109497, 2.0773069858551025, 2.145218849182129, 2.2131309509277344, 2.28104305267334, 2.348954916000366, 2.4168670177459717, 2.484778881072998, 2.5526909828186035, 2.62060284614563, 2.6885149478912354, 2.7564268112182617, 2.824338912963867, 2.8922510147094727, 2.960162878036499, 3.0280749797821045]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 6.0, 7.0, 5.0, 8.0, 4.0, 16.0, 21.0, 18.0, 20.0, 17.0, 22.0, 27.0, 29.0, 31.0, 35.0, 43.0, 41.0, 23.0, 33.0, 38.0, 43.0, 45.0, 46.0, 45.0, 42.0, 43.0, 46.0, 37.0, 22.0, 26.0, 27.0, 21.0, 13.0, 20.0, 13.0, 20.0, 9.0, 12.0, 7.0, 5.0, 5.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.0496314764022827, -1.0173304080963135, -0.985029399394989, -0.9527283310890198, -0.9204273223876953, -0.8881262540817261, -0.8558251857757568, -0.8235241174697876, -0.7912231087684631, -0.7589220404624939, -0.7266210317611694, -0.6943199634552002, -0.662018895149231, -0.6297178864479065, -0.5974168181419373, -0.5651158094406128, -0.5328147411346436, -0.5005136728286743, -0.46821266412734985, -0.4359115958213806, -0.40361055731773376, -0.3713095188140869, -0.3390084505081177, -0.3067074120044708, -0.274406373500824, -0.24210533499717712, -0.20980428159236908, -0.17750322818756104, -0.14520218968391418, -0.11290115118026733, -0.08060009777545929, -0.048299044370651245, -0.015998125076293945, 0.016302920877933502, 0.04860396683216095, 0.0809050127863884, 0.11320605874061584, 0.1455070972442627, 0.17780815064907074, 0.21010920405387878, 0.24241024255752563, 0.2747112810611725, 0.30701231956481934, 0.3393133878707886, 0.3716144263744354, 0.4039154648780823, 0.4362165331840515, 0.46851757168769836, 0.5008186101913452, 0.5331196784973145, 0.5654206871986389, 0.5977217555046082, 0.6300227642059326, 0.6623238325119019, 0.6946249008178711, 0.7269259691238403, 0.7592269778251648, 0.791528046131134, 0.8238290548324585, 0.8561301231384277, 0.888431191444397, 0.9207322001457214, 0.9530332684516907, 0.9853342771530151, 1.0176353454589844]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 10.0, 7.0, 17.0, 13.0, 33.0, 42.0, 78.0, 129.0, 216.0, 360.0, 538.0, 1060.0, 1768.0, 3337.0, 6686.0, 13540.0, 30924.0, 82037.0, 275035.0, 421301.0, 129731.0, 44717.0, 18580.0, 8571.0, 4443.0, 2236.0, 1330.0, 753.0, 397.0, 261.0, 141.0, 92.0, 59.0, 36.0, 23.0, 19.0, 9.0, 7.0, 4.0, 5.0, 8.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.58837890625, -0.5682296752929688, -0.5480804443359375, -0.5279312133789062, -0.507781982421875, -0.48763275146484375, -0.4674835205078125, -0.44733428955078125, -0.42718505859375, -0.40703582763671875, -0.3868865966796875, -0.36673736572265625, -0.346588134765625, -0.32643890380859375, -0.3062896728515625, -0.28614044189453125, -0.2659912109375, -0.24584197998046875, -0.2256927490234375, -0.20554351806640625, -0.185394287109375, -0.16524505615234375, -0.1450958251953125, -0.12494659423828125, -0.10479736328125, -0.08464813232421875, -0.0644989013671875, -0.04434967041015625, -0.024200439453125, -0.00405120849609375, 0.0160980224609375, 0.03624725341796875, 0.056396484375, 0.07654571533203125, 0.0966949462890625, 0.11684417724609375, 0.136993408203125, 0.15714263916015625, 0.1772918701171875, 0.19744110107421875, 0.21759033203125, 0.23773956298828125, 0.2578887939453125, 0.27803802490234375, 0.298187255859375, 0.31833648681640625, 0.3384857177734375, 0.35863494873046875, 0.3787841796875, 0.39893341064453125, 0.4190826416015625, 0.43923187255859375, 0.459381103515625, 0.47953033447265625, 0.4996795654296875, 0.5198287963867188, 0.53997802734375, 0.5601272583007812, 0.5802764892578125, 0.6004257202148438, 0.620574951171875, 0.6407241821289062, 0.6608734130859375, 0.6810226440429688, 0.701171875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 4.0, 5.0, 13.0, 8.0, 16.0, 20.0, 22.0, 34.0, 34.0, 49.0, 52.0, 46.0, 51.0, 55.0, 57.0, 51.0, 67.0, 63.0, 73.0, 58.0, 45.0, 35.0, 35.0, 26.0, 17.0, 14.0, 18.0, 11.0, 9.0, 4.0, 7.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6708984375, -0.643524169921875, -0.61614990234375, -0.588775634765625, -0.5614013671875, -0.534027099609375, -0.50665283203125, -0.479278564453125, -0.451904296875, -0.424530029296875, -0.39715576171875, -0.369781494140625, -0.3424072265625, -0.315032958984375, -0.28765869140625, -0.260284423828125, -0.23291015625, -0.205535888671875, -0.17816162109375, -0.150787353515625, -0.1234130859375, -0.096038818359375, -0.06866455078125, -0.041290283203125, -0.013916015625, 0.013458251953125, 0.04083251953125, 0.068206787109375, 0.0955810546875, 0.122955322265625, 0.15032958984375, 0.177703857421875, 0.205078125, 0.232452392578125, 0.25982666015625, 0.287200927734375, 0.3145751953125, 0.341949462890625, 0.36932373046875, 0.396697998046875, 0.424072265625, 0.451446533203125, 0.47882080078125, 0.506195068359375, 0.5335693359375, 0.560943603515625, 0.58831787109375, 0.615692138671875, 0.64306640625, 0.670440673828125, 0.69781494140625, 0.725189208984375, 0.7525634765625, 0.779937744140625, 0.80731201171875, 0.834686279296875, 0.862060546875, 0.889434814453125, 0.91680908203125, 0.944183349609375, 0.9715576171875, 0.998931884765625, 1.02630615234375, 1.053680419921875, 1.0810546875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 1.0, 5.0, 5.0, 8.0, 16.0, 19.0, 12.0, 21.0, 22.0, 22.0, 35.0, 76.0, 83.0, 113.0, 171.0, 319.0, 558.0, 1151.0, 2504.0, 6093.0, 17086.0, 55322.0, 234944.0, 531443.0, 140880.0, 37043.0, 12070.0, 4466.0, 1971.0, 852.0, 441.0, 242.0, 152.0, 107.0, 90.0, 55.0, 43.0, 20.0, 20.0, 19.0, 14.0, 10.0, 9.0, 5.0, 9.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.7470703125, -0.725311279296875, -0.70355224609375, -0.681793212890625, -0.6600341796875, -0.638275146484375, -0.61651611328125, -0.594757080078125, -0.572998046875, -0.551239013671875, -0.52947998046875, -0.507720947265625, -0.4859619140625, -0.464202880859375, -0.44244384765625, -0.420684814453125, -0.39892578125, -0.377166748046875, -0.35540771484375, -0.333648681640625, -0.3118896484375, -0.290130615234375, -0.26837158203125, -0.246612548828125, -0.224853515625, -0.203094482421875, -0.18133544921875, -0.159576416015625, -0.1378173828125, -0.116058349609375, -0.09429931640625, -0.072540283203125, -0.05078125, -0.029022216796875, -0.00726318359375, 0.014495849609375, 0.0362548828125, 0.058013916015625, 0.07977294921875, 0.101531982421875, 0.123291015625, 0.145050048828125, 0.16680908203125, 0.188568115234375, 0.2103271484375, 0.232086181640625, 0.25384521484375, 0.275604248046875, 0.29736328125, 0.319122314453125, 0.34088134765625, 0.362640380859375, 0.3843994140625, 0.406158447265625, 0.42791748046875, 0.449676513671875, 0.471435546875, 0.493194580078125, 0.51495361328125, 0.536712646484375, 0.5584716796875, 0.580230712890625, 0.60198974609375, 0.623748779296875, 0.6455078125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 2.0, 8.0, 11.0, 20.0, 17.0, 16.0, 23.0, 18.0, 18.0, 34.0, 31.0, 47.0, 56.0, 60.0, 52.0, 56.0, 56.0, 46.0, 56.0, 40.0, 47.0, 41.0, 31.0, 39.0, 34.0, 31.0, 22.0, 19.0, 5.0, 19.0, 14.0, 11.0, 5.0, 3.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0], "bins": [-1.6572265625, -1.6152496337890625, -1.573272705078125, -1.5312957763671875, -1.48931884765625, -1.4473419189453125, -1.405364990234375, -1.3633880615234375, -1.3214111328125, -1.2794342041015625, -1.237457275390625, -1.1954803466796875, -1.15350341796875, -1.1115264892578125, -1.069549560546875, -1.0275726318359375, -0.985595703125, -0.9436187744140625, -0.901641845703125, -0.8596649169921875, -0.81768798828125, -0.7757110595703125, -0.733734130859375, -0.6917572021484375, -0.6497802734375, -0.6078033447265625, -0.565826416015625, -0.5238494873046875, -0.48187255859375, -0.4398956298828125, -0.397918701171875, -0.3559417724609375, -0.31396484375, -0.2719879150390625, -0.230010986328125, -0.1880340576171875, -0.14605712890625, -0.1040802001953125, -0.062103271484375, -0.0201263427734375, 0.0218505859375, 0.0638275146484375, 0.105804443359375, 0.1477813720703125, 0.18975830078125, 0.2317352294921875, 0.273712158203125, 0.3156890869140625, 0.357666015625, 0.3996429443359375, 0.441619873046875, 0.4835968017578125, 0.52557373046875, 0.5675506591796875, 0.609527587890625, 0.6515045166015625, 0.6934814453125, 0.7354583740234375, 0.777435302734375, 0.8194122314453125, 0.86138916015625, 0.9033660888671875, 0.945343017578125, 0.9873199462890625, 1.029296875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 6.0, 7.0, 15.0, 27.0, 35.0, 49.0, 77.0, 123.0, 174.0, 263.0, 519.0, 1024.0, 1830.0, 3536.0, 7130.0, 15384.0, 37065.0, 105709.0, 388704.0, 333899.0, 91908.0, 33033.0, 14083.0, 6609.0, 3271.0, 1762.0, 909.0, 535.0, 321.0, 202.0, 108.0, 85.0, 42.0, 37.0, 22.0, 16.0, 8.0, 11.0, 5.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.166015625, -0.16047096252441406, -0.15492630004882812, -0.1493816375732422, -0.14383697509765625, -0.1382923126220703, -0.13274765014648438, -0.12720298767089844, -0.1216583251953125, -0.11611366271972656, -0.11056900024414062, -0.10502433776855469, -0.09947967529296875, -0.09393501281738281, -0.08839035034179688, -0.08284568786621094, -0.077301025390625, -0.07175636291503906, -0.06621170043945312, -0.06066703796386719, -0.05512237548828125, -0.04957771301269531, -0.044033050537109375, -0.03848838806152344, -0.0329437255859375, -0.027399063110351562, -0.021854400634765625, -0.016309738159179688, -0.01076507568359375, -0.0052204132080078125, 0.000324249267578125, 0.0058689117431640625, 0.01141357421875, 0.016958236694335938, 0.022502899169921875, 0.028047561645507812, 0.03359222412109375, 0.03913688659667969, 0.044681549072265625, 0.05022621154785156, 0.0557708740234375, 0.06131553649902344, 0.06686019897460938, 0.07240486145019531, 0.07794952392578125, 0.08349418640136719, 0.08903884887695312, 0.09458351135253906, 0.100128173828125, 0.10567283630371094, 0.11121749877929688, 0.11676216125488281, 0.12230682373046875, 0.1278514862060547, 0.13339614868164062, 0.13894081115722656, 0.1444854736328125, 0.15003013610839844, 0.15557479858398438, 0.1611194610595703, 0.16666412353515625, 0.1722087860107422, 0.17775344848632812, 0.18329811096191406, 0.1888427734375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 4.0, 6.0, 9.0, 12.0, 12.0, 14.0, 24.0, 36.0, 45.0, 72.0, 103.0, 166.0, 159.0, 126.0, 58.0, 46.0, 37.0, 19.0, 20.0, 11.0, 5.0, 4.0, 3.0, 5.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022602081298828125, -0.00022023916244506836, -0.00021445751190185547, -0.00020867586135864258, -0.0002028942108154297, -0.0001971125602722168, -0.0001913309097290039, -0.00018554925918579102, -0.00017976760864257812, -0.00017398595809936523, -0.00016820430755615234, -0.00016242265701293945, -0.00015664100646972656, -0.00015085935592651367, -0.00014507770538330078, -0.0001392960548400879, -0.000133514404296875, -0.0001277327537536621, -0.00012195110321044922, -0.00011616945266723633, -0.00011038780212402344, -0.00010460615158081055, -9.882450103759766e-05, -9.304285049438477e-05, -8.726119995117188e-05, -8.147954940795898e-05, -7.56978988647461e-05, -6.99162483215332e-05, -6.413459777832031e-05, -5.835294723510742e-05, -5.257129669189453e-05, -4.678964614868164e-05, -4.100799560546875e-05, -3.522634506225586e-05, -2.944469451904297e-05, -2.3663043975830078e-05, -1.7881393432617188e-05, -1.2099742889404297e-05, -6.318092346191406e-06, -5.364418029785156e-07, 5.245208740234375e-06, 1.1026859283447266e-05, 1.6808509826660156e-05, 2.2590160369873047e-05, 2.8371810913085938e-05, 3.415346145629883e-05, 3.993511199951172e-05, 4.571676254272461e-05, 5.14984130859375e-05, 5.728006362915039e-05, 6.306171417236328e-05, 6.884336471557617e-05, 7.462501525878906e-05, 8.040666580200195e-05, 8.618831634521484e-05, 9.196996688842773e-05, 9.775161743164062e-05, 0.00010353326797485352, 0.0001093149185180664, 0.0001150965690612793, 0.00012087821960449219, 0.00012665987014770508, 0.00013244152069091797, 0.00013822317123413086, 0.00014400482177734375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 8.0, 5.0, 8.0, 19.0, 18.0, 25.0, 39.0, 69.0, 93.0, 151.0, 268.0, 481.0, 946.0, 2157.0, 5311.0, 16334.0, 65700.0, 376411.0, 469874.0, 80505.0, 19345.0, 6090.0, 2334.0, 1062.0, 536.0, 292.0, 178.0, 107.0, 67.0, 34.0, 28.0, 12.0, 9.0, 5.0, 7.0, 5.0, 7.0, 6.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.248291015625, -0.2407817840576172, -0.23327255249023438, -0.22576332092285156, -0.21825408935546875, -0.21074485778808594, -0.20323562622070312, -0.1957263946533203, -0.1882171630859375, -0.1807079315185547, -0.17319869995117188, -0.16568946838378906, -0.15818023681640625, -0.15067100524902344, -0.14316177368164062, -0.1356525421142578, -0.128143310546875, -0.12063407897949219, -0.11312484741210938, -0.10561561584472656, -0.09810638427734375, -0.09059715270996094, -0.08308792114257812, -0.07557868957519531, -0.0680694580078125, -0.06056022644042969, -0.053050994873046875, -0.04554176330566406, -0.03803253173828125, -0.030523300170898438, -0.023014068603515625, -0.015504837036132812, -0.00799560546875, -0.0004863739013671875, 0.007022857666015625, 0.014532089233398438, 0.02204132080078125, 0.029550552368164062, 0.037059783935546875, 0.04456901550292969, 0.0520782470703125, 0.05958747863769531, 0.06709671020507812, 0.07460594177246094, 0.08211517333984375, 0.08962440490722656, 0.09713363647460938, 0.10464286804199219, 0.112152099609375, 0.11966133117675781, 0.12717056274414062, 0.13467979431152344, 0.14218902587890625, 0.14969825744628906, 0.15720748901367188, 0.1647167205810547, 0.1722259521484375, 0.1797351837158203, 0.18724441528320312, 0.19475364685058594, 0.20226287841796875, 0.20977210998535156, 0.21728134155273438, 0.2247905731201172, 0.2322998046875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 6.0, 1.0, 2.0, 9.0, 8.0, 10.0, 5.0, 11.0, 16.0, 22.0, 34.0, 26.0, 28.0, 53.0, 68.0, 73.0, 98.0, 103.0, 88.0, 60.0, 59.0, 45.0, 36.0, 24.0, 28.0, 11.0, 18.0, 8.0, 13.0, 8.0, 9.0, 5.0, 3.0, 6.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0504150390625, -0.04898500442504883, -0.047554969787597656, -0.046124935150146484, -0.04469490051269531, -0.04326486587524414, -0.04183483123779297, -0.0404047966003418, -0.038974761962890625, -0.03754472732543945, -0.03611469268798828, -0.03468465805053711, -0.03325462341308594, -0.031824588775634766, -0.030394554138183594, -0.028964519500732422, -0.02753448486328125, -0.026104450225830078, -0.024674415588378906, -0.023244380950927734, -0.021814346313476562, -0.02038431167602539, -0.01895427703857422, -0.017524242401123047, -0.016094207763671875, -0.014664173126220703, -0.013234138488769531, -0.01180410385131836, -0.010374069213867188, -0.008944034576416016, -0.007513999938964844, -0.006083965301513672, -0.0046539306640625, -0.003223896026611328, -0.0017938613891601562, -0.0003638267517089844, 0.0010662078857421875, 0.0024962425231933594, 0.003926277160644531, 0.005356311798095703, 0.006786346435546875, 0.008216381072998047, 0.009646415710449219, 0.01107645034790039, 0.012506484985351562, 0.013936519622802734, 0.015366554260253906, 0.016796588897705078, 0.01822662353515625, 0.019656658172607422, 0.021086692810058594, 0.022516727447509766, 0.023946762084960938, 0.02537679672241211, 0.02680683135986328, 0.028236865997314453, 0.029666900634765625, 0.031096935272216797, 0.03252696990966797, 0.03395700454711914, 0.03538703918457031, 0.036817073822021484, 0.038247108459472656, 0.03967714309692383, 0.041107177734375]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 6.0, 14.0, 24.0, 37.0, 39.0, 99.0, 133.0, 162.0, 155.0, 146.0, 87.0, 36.0, 23.0, 15.0, 6.0, 5.0, 4.0, 5.0, 1.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.797158420085907, -0.7399975657463074, -0.6828367114067078, -0.6256759166717529, -0.5685150623321533, -0.5113542079925537, -0.4541933536529541, -0.3970325291156769, -0.33987167477607727, -0.28271082043647766, -0.22554999589920044, -0.16838914155960083, -0.11122830212116241, -0.054067462682724, 0.0030933916568756104, 0.06025421619415283, 0.11741507053375244, 0.17457590997219086, 0.23173674941062927, 0.2888976037502289, 0.3460584282875061, 0.4032192826271057, 0.4603801369667053, 0.5175409317016602, 0.5747017860412598, 0.6318626403808594, 0.689023494720459, 0.7461843490600586, 0.8033451437950134, 0.860505998134613, 0.9176668524742126, 0.9748276472091675, 1.031988501548767, 1.0891493558883667, 1.1463102102279663, 1.203471064567566, 1.2606319189071655, 1.3177926540374756, 1.3749535083770752, 1.4321143627166748, 1.4892752170562744, 1.546436071395874, 1.6035969257354736, 1.6607577800750732, 1.7179186344146729, 1.7750794887542725, 1.832240343093872, 1.8894010782241821, 1.9465620517730713, 2.003722906112671, 2.0608837604522705, 2.11804461479187, 2.1752054691314697, 2.2323663234710693, 2.289527177810669, 2.3466880321502686, 2.403848648071289, 2.4610095024108887, 2.5181703567504883, 2.575331211090088, 2.6324920654296875, 2.689652919769287, 2.7468137741088867, 2.8039746284484863, 2.861135482788086]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 6.0, 9.0, 22.0, 25.0, 37.0, 42.0, 56.0, 77.0, 78.0, 84.0, 87.0, 105.0, 94.0, 74.0, 56.0, 51.0, 41.0, 28.0, 11.0, 12.0, 7.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6645477414131165, -0.6246712803840637, -0.584794819355011, -0.5449183583259583, -0.5050418972969055, -0.4651654362678528, -0.42528897523880005, -0.3854125142097473, -0.3455360531806946, -0.30565959215164185, -0.2657831311225891, -0.22590667009353638, -0.18603020906448364, -0.1461537480354309, -0.10627728700637817, -0.06640082597732544, -0.026524364948272705, 0.01335209608078003, 0.053228557109832764, 0.0931050181388855, 0.13298147916793823, 0.17285794019699097, 0.2127344012260437, 0.25261086225509644, 0.29248732328414917, 0.3323637843132019, 0.37224024534225464, 0.4121167063713074, 0.4519931674003601, 0.49186962842941284, 0.5317460894584656, 0.5716225504875183, 0.6114989519119263, 0.651375412940979, 0.6912518739700317, 0.7311283349990845, 0.7710047960281372, 0.8108812570571899, 0.8507577180862427, 0.8906341791152954, 0.9305106401443481, 0.9703871011734009, 1.0102635622024536, 1.0501400232315063, 1.090016484260559, 1.1298929452896118, 1.1697694063186646, 1.2096458673477173, 1.24952232837677, 1.2893987894058228, 1.3292752504348755, 1.3691517114639282, 1.409028172492981, 1.4489046335220337, 1.4887810945510864, 1.5286575555801392, 1.568534016609192, 1.6084104776382446, 1.6482869386672974, 1.68816339969635, 1.7280398607254028, 1.7679163217544556, 1.8077927827835083, 1.847669243812561, 1.8875457048416138]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 5.0, 9.0, 33.0, 36.0, 50.0, 95.0, 125.0, 212.0, 320.0, 501.0, 857.0, 1509.0, 2631.0, 4965.0, 9928.0, 22923.0, 82828.0, 564716.0, 277208.0, 46972.0, 16103.0, 7344.0, 3891.0, 2169.0, 1179.0, 742.0, 476.0, 248.0, 160.0, 104.0, 63.0, 55.0, 21.0, 22.0, 15.0, 8.0, 8.0, 6.0, 4.0, 5.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77783203125, -0.7561111450195312, -0.7343902587890625, -0.7126693725585938, -0.690948486328125, -0.6692276000976562, -0.6475067138671875, -0.6257858276367188, -0.60406494140625, -0.5823440551757812, -0.5606231689453125, -0.5389022827148438, -0.517181396484375, -0.49546051025390625, -0.4737396240234375, -0.45201873779296875, -0.4302978515625, -0.40857696533203125, -0.3868560791015625, -0.36513519287109375, -0.343414306640625, -0.32169342041015625, -0.2999725341796875, -0.27825164794921875, -0.25653076171875, -0.23480987548828125, -0.2130889892578125, -0.19136810302734375, -0.169647216796875, -0.14792633056640625, -0.1262054443359375, -0.10448455810546875, -0.082763671875, -0.06104278564453125, -0.0393218994140625, -0.01760101318359375, 0.004119873046875, 0.02584075927734375, 0.0475616455078125, 0.06928253173828125, 0.09100341796875, 0.11272430419921875, 0.1344451904296875, 0.15616607666015625, 0.177886962890625, 0.19960784912109375, 0.2213287353515625, 0.24304962158203125, 0.2647705078125, 0.28649139404296875, 0.3082122802734375, 0.32993316650390625, 0.351654052734375, 0.37337493896484375, 0.3950958251953125, 0.41681671142578125, 0.43853759765625, 0.46025848388671875, 0.4819793701171875, 0.5037002563476562, 0.525421142578125, 0.5471420288085938, 0.5688629150390625, 0.5905838012695312, 0.6123046875]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 10.0, 5.0, 11.0, 23.0, 23.0, 43.0, 48.0, 58.0, 69.0, 65.0, 101.0, 88.0, 79.0, 93.0, 69.0, 50.0, 48.0, 36.0, 28.0, 19.0, 18.0, 10.0, 8.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.474609375, -1.399444580078125, -1.32427978515625, -1.249114990234375, -1.1739501953125, -1.098785400390625, -1.02362060546875, -0.948455810546875, -0.873291015625, -0.798126220703125, -0.72296142578125, -0.647796630859375, -0.5726318359375, -0.497467041015625, -0.42230224609375, -0.347137451171875, -0.27197265625, -0.196807861328125, -0.12164306640625, -0.046478271484375, 0.0286865234375, 0.103851318359375, 0.17901611328125, 0.254180908203125, 0.329345703125, 0.404510498046875, 0.47967529296875, 0.554840087890625, 0.6300048828125, 0.705169677734375, 0.78033447265625, 0.855499267578125, 0.9306640625, 1.005828857421875, 1.08099365234375, 1.156158447265625, 1.2313232421875, 1.306488037109375, 1.38165283203125, 1.456817626953125, 1.531982421875, 1.607147216796875, 1.68231201171875, 1.757476806640625, 1.8326416015625, 1.907806396484375, 1.98297119140625, 2.058135986328125, 2.13330078125, 2.208465576171875, 2.28363037109375, 2.358795166015625, 2.4339599609375, 2.509124755859375, 2.58428955078125, 2.659454345703125, 2.734619140625, 2.809783935546875, 2.88494873046875, 2.960113525390625, 3.0352783203125, 3.110443115234375, 3.18560791015625, 3.260772705078125, 3.3359375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 1.0, 6.0, 8.0, 13.0, 15.0, 17.0, 11.0, 17.0, 27.0, 19.0, 22.0, 24.0, 23.0, 34.0, 42.0, 54.0, 61.0, 101.0, 295.0, 2734.0, 992537.0, 51054.0, 863.0, 179.0, 72.0, 50.0, 39.0, 27.0, 28.0, 21.0, 20.0, 13.0, 16.0, 20.0, 17.0, 9.0, 6.0, 11.0, 6.0, 7.0, 8.0, 2.0, 5.0, 4.0, 6.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.32421875, -4.17913818359375, -4.0340576171875, -3.88897705078125, -3.743896484375, -3.59881591796875, -3.4537353515625, -3.30865478515625, -3.16357421875, -3.01849365234375, -2.8734130859375, -2.72833251953125, -2.583251953125, -2.43817138671875, -2.2930908203125, -2.14801025390625, -2.0029296875, -1.85784912109375, -1.7127685546875, -1.56768798828125, -1.422607421875, -1.27752685546875, -1.1324462890625, -0.98736572265625, -0.84228515625, -0.69720458984375, -0.5521240234375, -0.40704345703125, -0.261962890625, -0.11688232421875, 0.0281982421875, 0.17327880859375, 0.318359375, 0.46343994140625, 0.6085205078125, 0.75360107421875, 0.898681640625, 1.04376220703125, 1.1888427734375, 1.33392333984375, 1.47900390625, 1.62408447265625, 1.7691650390625, 1.91424560546875, 2.059326171875, 2.20440673828125, 2.3494873046875, 2.49456787109375, 2.6396484375, 2.78472900390625, 2.9298095703125, 3.07489013671875, 3.219970703125, 3.36505126953125, 3.5101318359375, 3.65521240234375, 3.80029296875, 3.94537353515625, 4.0904541015625, 4.23553466796875, 4.380615234375, 4.52569580078125, 4.6707763671875, 4.81585693359375, 4.9609375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 4.0, 12.0, 10.0, 10.0, 12.0, 17.0, 22.0, 19.0, 28.0, 25.0, 24.0, 19.0, 27.0, 29.0, 47.0, 43.0, 42.0, 30.0, 52.0, 42.0, 47.0, 35.0, 43.0, 38.0, 30.0, 33.0, 24.0, 33.0, 24.0, 23.0, 19.0, 24.0, 21.0, 15.0, 8.0, 8.0, 8.0, 12.0, 8.0, 8.0, 3.0, 7.0, 5.0, 8.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.1025390625, -1.066192626953125, -1.02984619140625, -0.993499755859375, -0.9571533203125, -0.920806884765625, -0.88446044921875, -0.848114013671875, -0.811767578125, -0.775421142578125, -0.73907470703125, -0.702728271484375, -0.6663818359375, -0.630035400390625, -0.59368896484375, -0.557342529296875, -0.52099609375, -0.484649658203125, -0.44830322265625, -0.411956787109375, -0.3756103515625, -0.339263916015625, -0.30291748046875, -0.266571044921875, -0.230224609375, -0.193878173828125, -0.15753173828125, -0.121185302734375, -0.0848388671875, -0.048492431640625, -0.01214599609375, 0.024200439453125, 0.060546875, 0.096893310546875, 0.13323974609375, 0.169586181640625, 0.2059326171875, 0.242279052734375, 0.27862548828125, 0.314971923828125, 0.351318359375, 0.387664794921875, 0.42401123046875, 0.460357666015625, 0.4967041015625, 0.533050537109375, 0.56939697265625, 0.605743408203125, 0.64208984375, 0.678436279296875, 0.71478271484375, 0.751129150390625, 0.7874755859375, 0.823822021484375, 0.86016845703125, 0.896514892578125, 0.932861328125, 0.969207763671875, 1.00555419921875, 1.041900634765625, 1.0782470703125, 1.114593505859375, 1.15093994140625, 1.187286376953125, 1.2236328125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 7.0, 10.0, 21.0, 28.0, 31.0, 81.0, 177.0, 415.0, 1279.0, 5759.0, 62228.0, 928172.0, 43763.0, 4748.0, 1114.0, 380.0, 137.0, 75.0, 43.0, 17.0, 22.0, 10.0, 8.0, 5.0, 2.0, 2.0, 2.0, 2.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.490478515625, -0.4712028503417969, -0.45192718505859375, -0.4326515197753906, -0.4133758544921875, -0.3941001892089844, -0.37482452392578125, -0.3555488586425781, -0.336273193359375, -0.3169975280761719, -0.29772186279296875, -0.2784461975097656, -0.2591705322265625, -0.23989486694335938, -0.22061920166015625, -0.20134353637695312, -0.18206787109375, -0.16279220581054688, -0.14351654052734375, -0.12424087524414062, -0.1049652099609375, -0.08568954467773438, -0.06641387939453125, -0.047138214111328125, -0.027862548828125, -0.008586883544921875, 0.01068878173828125, 0.029964447021484375, 0.0492401123046875, 0.06851577758789062, 0.08779144287109375, 0.10706710815429688, 0.1263427734375, 0.14561843872070312, 0.16489410400390625, 0.18416976928710938, 0.2034454345703125, 0.22272109985351562, 0.24199676513671875, 0.2612724304199219, 0.280548095703125, 0.2998237609863281, 0.31909942626953125, 0.3383750915527344, 0.3576507568359375, 0.3769264221191406, 0.39620208740234375, 0.4154777526855469, 0.43475341796875, 0.4540290832519531, 0.47330474853515625, 0.4925804138183594, 0.5118560791015625, 0.5311317443847656, 0.5504074096679688, 0.5696830749511719, 0.588958740234375, 0.6082344055175781, 0.6275100708007812, 0.6467857360839844, 0.6660614013671875, 0.6853370666503906, 0.7046127319335938, 0.7238883972167969, 0.7431640625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 6.0, 10.0, 14.0, 19.0, 28.0, 47.0, 57.0, 107.0, 197.0, 198.0, 123.0, 67.0, 46.0, 27.0, 20.0, 7.0, 5.0, 5.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.14984130859375e-05, -4.959758371114731e-05, -4.769675433635712e-05, -4.5795924961566925e-05, -4.3895095586776733e-05, -4.199426621198654e-05, -4.009343683719635e-05, -3.819260746240616e-05, -3.629177808761597e-05, -3.4390948712825775e-05, -3.2490119338035583e-05, -3.058928996324539e-05, -2.86884605884552e-05, -2.678763121366501e-05, -2.4886801838874817e-05, -2.2985972464084625e-05, -2.1085143089294434e-05, -1.9184313714504242e-05, -1.728348433971405e-05, -1.538265496492386e-05, -1.3481825590133667e-05, -1.1580996215343475e-05, -9.680166840553284e-06, -7.779337465763092e-06, -5.8785080909729e-06, -3.977678716182709e-06, -2.076849341392517e-06, -1.7601996660232544e-07, 1.7248094081878662e-06, 3.625638782978058e-06, 5.5264681577682495e-06, 7.427297532558441e-06, 9.328126907348633e-06, 1.1228956282138824e-05, 1.3129785656929016e-05, 1.5030615031719208e-05, 1.69314444065094e-05, 1.883227378129959e-05, 2.0733103156089783e-05, 2.2633932530879974e-05, 2.4534761905670166e-05, 2.6435591280460358e-05, 2.833642065525055e-05, 3.023725003004074e-05, 3.213807940483093e-05, 3.4038908779621124e-05, 3.5939738154411316e-05, 3.784056752920151e-05, 3.97413969039917e-05, 4.164222627878189e-05, 4.354305565357208e-05, 4.5443885028362274e-05, 4.7344714403152466e-05, 4.924554377794266e-05, 5.114637315273285e-05, 5.304720252752304e-05, 5.494803190231323e-05, 5.6848861277103424e-05, 5.8749690651893616e-05, 6.065052002668381e-05, 6.2551349401474e-05, 6.445217877626419e-05, 6.635300815105438e-05, 6.825383752584457e-05, 7.015466690063477e-05]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 4.0, 4.0, 1.0, 2.0, 6.0, 3.0, 10.0, 12.0, 16.0, 19.0, 32.0, 47.0, 71.0, 91.0, 140.0, 236.0, 388.0, 744.0, 1523.0, 3405.0, 8188.0, 23471.0, 92830.0, 647027.0, 208717.0, 40035.0, 12270.0, 4782.0, 2121.0, 1020.0, 501.0, 285.0, 180.0, 108.0, 77.0, 50.0, 39.0, 22.0, 21.0, 15.0, 12.0, 9.0, 5.0, 6.0, 4.0, 3.0, 4.0, 1.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2099609375, -0.20238494873046875, -0.1948089599609375, -0.18723297119140625, -0.179656982421875, -0.17208099365234375, -0.1645050048828125, -0.15692901611328125, -0.14935302734375, -0.14177703857421875, -0.1342010498046875, -0.12662506103515625, -0.119049072265625, -0.11147308349609375, -0.1038970947265625, -0.09632110595703125, -0.0887451171875, -0.08116912841796875, -0.0735931396484375, -0.06601715087890625, -0.058441162109375, -0.05086517333984375, -0.0432891845703125, -0.03571319580078125, -0.02813720703125, -0.02056121826171875, -0.0129852294921875, -0.00540924072265625, 0.002166748046875, 0.00974273681640625, 0.0173187255859375, 0.02489471435546875, 0.032470703125, 0.04004669189453125, 0.0476226806640625, 0.05519866943359375, 0.062774658203125, 0.07035064697265625, 0.0779266357421875, 0.08550262451171875, 0.09307861328125, 0.10065460205078125, 0.1082305908203125, 0.11580657958984375, 0.123382568359375, 0.13095855712890625, 0.1385345458984375, 0.14611053466796875, 0.1536865234375, 0.16126251220703125, 0.1688385009765625, 0.17641448974609375, 0.183990478515625, 0.19156646728515625, 0.1991424560546875, 0.20671844482421875, 0.21429443359375, 0.22187042236328125, 0.2294464111328125, 0.23702239990234375, 0.244598388671875, 0.25217437744140625, 0.2597503662109375, 0.26732635498046875, 0.27490234375]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 1.0, 6.0, 9.0, 9.0, 9.0, 17.0, 14.0, 13.0, 25.0, 29.0, 38.0, 55.0, 54.0, 88.0, 170.0, 108.0, 73.0, 59.0, 51.0, 35.0, 23.0, 22.0, 21.0, 13.0, 10.0, 7.0, 13.0, 8.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0986328125, -0.09519672393798828, -0.09176063537597656, -0.08832454681396484, -0.08488845825195312, -0.0814523696899414, -0.07801628112792969, -0.07458019256591797, -0.07114410400390625, -0.06770801544189453, -0.06427192687988281, -0.060835838317871094, -0.057399749755859375, -0.053963661193847656, -0.05052757263183594, -0.04709148406982422, -0.0436553955078125, -0.04021930694580078, -0.03678321838378906, -0.033347129821777344, -0.029911041259765625, -0.026474952697753906, -0.023038864135742188, -0.01960277557373047, -0.01616668701171875, -0.012730598449707031, -0.009294509887695312, -0.005858421325683594, -0.002422332763671875, 0.0010137557983398438, 0.0044498443603515625, 0.007885932922363281, 0.011322021484375, 0.014758110046386719, 0.018194198608398438, 0.021630287170410156, 0.025066375732421875, 0.028502464294433594, 0.03193855285644531, 0.03537464141845703, 0.03881072998046875, 0.04224681854248047, 0.04568290710449219, 0.049118995666503906, 0.052555084228515625, 0.055991172790527344, 0.05942726135253906, 0.06286334991455078, 0.0662994384765625, 0.06973552703857422, 0.07317161560058594, 0.07660770416259766, 0.08004379272460938, 0.0834798812866211, 0.08691596984863281, 0.09035205841064453, 0.09378814697265625, 0.09722423553466797, 0.10066032409667969, 0.1040964126586914, 0.10753250122070312, 0.11096858978271484, 0.11440467834472656, 0.11784076690673828, 0.12127685546875]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 5.0, 5.0, 8.0, 21.0, 20.0, 23.0, 49.0, 70.0, 92.0, 113.0, 145.0, 119.0, 117.0, 85.0, 44.0, 29.0, 17.0, 11.0, 9.0, 7.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.66201651096344, -1.5733721256256104, -1.4847277402877808, -1.3960833549499512, -1.3074389696121216, -1.218794584274292, -1.1301500797271729, -1.0415058135986328, -0.9528613686561584, -0.8642169833183289, -0.7755725979804993, -0.6869281530380249, -0.5982837677001953, -0.5096393823623657, -0.42099499702453613, -0.33235061168670654, -0.24370622634887695, -0.15506184101104736, -0.06641744077205658, 0.022226959466934204, 0.1108713448047638, 0.19951573014259338, 0.28816014528274536, 0.37680453062057495, 0.46544891595840454, 0.5540933012962341, 0.6427376866340637, 0.7313821315765381, 0.8200265169143677, 0.9086709022521973, 0.9973152875900269, 1.0859596729278564, 1.1746041774749756, 1.2632485628128052, 1.3518929481506348, 1.4405373334884644, 1.529181718826294, 1.6178261041641235, 1.7064704895019531, 1.7951149940490723, 1.8837592601776123, 1.972403645515442, 2.0610480308532715, 2.1496925354003906, 2.2383368015289307, 2.32698130607605, 2.41562557220459, 2.504270076751709, 2.592914581298828, 2.6815590858459473, 2.7702033519744873, 2.8588478565216064, 2.9474921226501465, 3.0361366271972656, 3.1247808933258057, 3.213425397872925, 3.302069664001465, 3.390714168548584, 3.479358434677124, 3.568002939224243, 3.656647205352783, 3.7452917098999023, 3.8339359760284424, 3.9225804805755615, 4.011224746704102]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 3.0, 8.0, 4.0, 13.0, 23.0, 20.0, 18.0, 24.0, 24.0, 25.0, 32.0, 56.0, 55.0, 46.0, 59.0, 45.0, 52.0, 62.0, 43.0, 60.0, 45.0, 40.0, 31.0, 34.0, 34.0, 33.0, 21.0, 18.0, 27.0, 18.0, 15.0, 7.0, 5.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5478681325912476, -1.4752188920974731, -1.4025695323944092, -1.3299202919006348, -1.2572710514068604, -1.1846216917037964, -1.111972451210022, -1.039323091506958, -0.9666738510131836, -0.8940245509147644, -0.8213752508163452, -0.7487260103225708, -0.6760767102241516, -0.6034274101257324, -0.530778169631958, -0.4581288695335388, -0.38547956943511963, -0.31283026933670044, -0.24018099904060364, -0.16753171384334564, -0.09488242864608765, -0.022233128547668457, 0.050416141748428345, 0.12306541204452515, 0.19571471214294434, 0.2683640122413635, 0.3410132825374603, 0.41366255283355713, 0.4863118529319763, 0.5589611530303955, 0.6316103935241699, 0.7042596936225891, 0.7769088745117188, 0.8495581746101379, 0.9222074747085571, 0.9948567152023315, 1.0675060749053955, 1.14015531539917, 1.2128045558929443, 1.2854537963867188, 1.3581031560897827, 1.4307523965835571, 1.503401756286621, 1.5760509967803955, 1.64870023727417, 1.7213495969772339, 1.7939988374710083, 1.8666481971740723, 1.9392974376678467, 2.011946678161621, 2.0845959186553955, 2.157245397567749, 2.2298946380615234, 2.302543878555298, 2.3751931190490723, 2.4478423595428467, 2.520491600036621, 2.5931408405303955, 2.66579008102417, 2.7384395599365234, 2.811088800430298, 2.8837380409240723, 2.9563872814178467, 3.029036521911621, 3.1016860008239746]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 7.0, 3.0, 7.0, 6.0, 16.0, 10.0, 20.0, 37.0, 36.0, 62.0, 79.0, 90.0, 140.0, 173.0, 285.0, 427.0, 615.0, 935.0, 1615.0, 2961.0, 5675.0, 13459.0, 42762.0, 240226.0, 1572765.0, 1920515.0, 305205.0, 54410.0, 16419.0, 6877.0, 3406.0, 1850.0, 1111.0, 663.0, 431.0, 277.0, 205.0, 136.0, 97.0, 72.0, 57.0, 43.0, 26.0, 16.0, 19.0, 12.0, 6.0, 8.0, 3.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2099609375, -1.1710205078125, -1.132080078125, -1.0931396484375, -1.05419921875, -1.0152587890625, -0.976318359375, -0.9373779296875, -0.8984375, -0.8594970703125, -0.820556640625, -0.7816162109375, -0.74267578125, -0.7037353515625, -0.664794921875, -0.6258544921875, -0.5869140625, -0.5479736328125, -0.509033203125, -0.4700927734375, -0.43115234375, -0.3922119140625, -0.353271484375, -0.3143310546875, -0.275390625, -0.2364501953125, -0.197509765625, -0.1585693359375, -0.11962890625, -0.0806884765625, -0.041748046875, -0.0028076171875, 0.0361328125, 0.0750732421875, 0.114013671875, 0.1529541015625, 0.19189453125, 0.2308349609375, 0.269775390625, 0.3087158203125, 0.34765625, 0.3865966796875, 0.425537109375, 0.4644775390625, 0.50341796875, 0.5423583984375, 0.581298828125, 0.6202392578125, 0.6591796875, 0.6981201171875, 0.737060546875, 0.7760009765625, 0.81494140625, 0.8538818359375, 0.892822265625, 0.9317626953125, 0.970703125, 1.0096435546875, 1.048583984375, 1.0875244140625, 1.12646484375, 1.1654052734375, 1.204345703125, 1.2432861328125, 1.2822265625]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 1.0, 4.0, 2.0, 2.0, 5.0, 6.0, 16.0, 7.0, 22.0, 21.0, 26.0, 34.0, 43.0, 48.0, 46.0, 51.0, 62.0, 58.0, 63.0, 56.0, 48.0, 49.0, 61.0, 47.0, 45.0, 40.0, 28.0, 22.0, 25.0, 16.0, 15.0, 6.0, 9.0, 9.0, 2.0, 4.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1435546875, -1.1107330322265625, -1.077911376953125, -1.0450897216796875, -1.01226806640625, -0.9794464111328125, -0.946624755859375, -0.9138031005859375, -0.8809814453125, -0.8481597900390625, -0.815338134765625, -0.7825164794921875, -0.74969482421875, -0.7168731689453125, -0.684051513671875, -0.6512298583984375, -0.618408203125, -0.5855865478515625, -0.552764892578125, -0.5199432373046875, -0.48712158203125, -0.4542999267578125, -0.421478271484375, -0.3886566162109375, -0.3558349609375, -0.3230133056640625, -0.290191650390625, -0.2573699951171875, -0.22454833984375, -0.1917266845703125, -0.158905029296875, -0.1260833740234375, -0.09326171875, -0.0604400634765625, -0.027618408203125, 0.0052032470703125, 0.03802490234375, 0.0708465576171875, 0.103668212890625, 0.1364898681640625, 0.1693115234375, 0.2021331787109375, 0.234954833984375, 0.2677764892578125, 0.30059814453125, 0.3334197998046875, 0.366241455078125, 0.3990631103515625, 0.431884765625, 0.4647064208984375, 0.497528076171875, 0.5303497314453125, 0.56317138671875, 0.5959930419921875, 0.628814697265625, 0.6616363525390625, 0.6944580078125, 0.7272796630859375, 0.760101318359375, 0.7929229736328125, 0.82574462890625, 0.8585662841796875, 0.891387939453125, 0.9242095947265625, 0.95703125]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 8.0, 3.0, 11.0, 16.0, 41.0, 37.0, 73.0, 148.0, 283.0, 690.0, 2514.0, 15559.0, 419342.0, 3695858.0, 52356.0, 5274.0, 1202.0, 405.0, 197.0, 85.0, 61.0, 35.0, 28.0, 17.0, 8.0, 15.0, 6.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.767578125, -2.678955078125, -2.59033203125, -2.501708984375, -2.4130859375, -2.324462890625, -2.23583984375, -2.147216796875, -2.05859375, -1.969970703125, -1.88134765625, -1.792724609375, -1.7041015625, -1.615478515625, -1.52685546875, -1.438232421875, -1.349609375, -1.260986328125, -1.17236328125, -1.083740234375, -0.9951171875, -0.906494140625, -0.81787109375, -0.729248046875, -0.640625, -0.552001953125, -0.46337890625, -0.374755859375, -0.2861328125, -0.197509765625, -0.10888671875, -0.020263671875, 0.068359375, 0.156982421875, 0.24560546875, 0.334228515625, 0.4228515625, 0.511474609375, 0.60009765625, 0.688720703125, 0.77734375, 0.865966796875, 0.95458984375, 1.043212890625, 1.1318359375, 1.220458984375, 1.30908203125, 1.397705078125, 1.486328125, 1.574951171875, 1.66357421875, 1.752197265625, 1.8408203125, 1.929443359375, 2.01806640625, 2.106689453125, 2.1953125, 2.283935546875, 2.37255859375, 2.461181640625, 2.5498046875, 2.638427734375, 2.72705078125, 2.815673828125, 2.904296875]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 5.0, 6.0, 8.0, 8.0, 17.0, 15.0, 14.0, 31.0, 59.0, 68.0, 103.0, 160.0, 239.0, 475.0, 708.0, 789.0, 537.0, 311.0, 165.0, 129.0, 66.0, 44.0, 28.0, 27.0, 19.0, 13.0, 16.0, 2.0, 4.0, 5.0, 2.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.437255859375, -0.4222831726074219, -0.40731048583984375, -0.3923377990722656, -0.3773651123046875, -0.3623924255371094, -0.34741973876953125, -0.3324470520019531, -0.317474365234375, -0.3025016784667969, -0.28752899169921875, -0.2725563049316406, -0.2575836181640625, -0.24261093139648438, -0.22763824462890625, -0.21266555786132812, -0.19769287109375, -0.18272018432617188, -0.16774749755859375, -0.15277481079101562, -0.1378021240234375, -0.12282943725585938, -0.10785675048828125, -0.09288406372070312, -0.077911376953125, -0.06293869018554688, -0.04796600341796875, -0.032993316650390625, -0.0180206298828125, -0.003047943115234375, 0.01192474365234375, 0.026897430419921875, 0.0418701171875, 0.056842803955078125, 0.07181549072265625, 0.08678817749023438, 0.1017608642578125, 0.11673355102539062, 0.13170623779296875, 0.14667892456054688, 0.161651611328125, 0.17662429809570312, 0.19159698486328125, 0.20656967163085938, 0.2215423583984375, 0.23651504516601562, 0.25148773193359375, 0.2664604187011719, 0.28143310546875, 0.2964057922363281, 0.31137847900390625, 0.3263511657714844, 0.3413238525390625, 0.3562965393066406, 0.37126922607421875, 0.3862419128417969, 0.401214599609375, 0.4161872863769531, 0.43115997314453125, 0.4461326599121094, 0.4611053466796875, 0.4760780334472656, 0.49105072021484375, 0.5060234069824219, 0.52099609375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [4.0, 2.0, 4.0, 2.0, 2.0, 4.0, 11.0, 18.0, 18.0, 30.0, 49.0, 80.0, 95.0, 131.0, 135.0, 136.0, 102.0, 56.0, 49.0, 33.0, 24.0, 9.0, 6.0, 6.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0353268384933472, -0.9643552899360657, -0.8933836817741394, -0.8224121332168579, -0.7514405250549316, -0.6804689764976501, -0.6094974279403687, -0.5385258197784424, -0.4675542712211609, -0.396582692861557, -0.3256111145019531, -0.25463956594467163, -0.18366798758506775, -0.11269640922546387, -0.04172486066818237, 0.02924671769142151, 0.10021829605102539, 0.17118987441062927, 0.24216143786907196, 0.31313300132751465, 0.38410457968711853, 0.4550761580467224, 0.5260477066040039, 0.5970193147659302, 0.6679908633232117, 0.7389624118804932, 0.8099340200424194, 0.8809055685997009, 0.9518771171569824, 1.0228487253189087, 1.093820333480835, 1.1647918224334717, 1.2357635498046875, 1.3067351579666138, 1.3777066469192505, 1.4486782550811768, 1.519649863243103, 1.5906214714050293, 1.661592960357666, 1.7325645685195923, 1.8035361766815186, 1.8745077848434448, 1.9454792737960815, 2.016450881958008, 2.0874223709106445, 2.1583940982818604, 2.229365587234497, 2.300337076187134, 2.3713088035583496, 2.4422802925109863, 2.513252019882202, 2.584223508834839, 2.6551949977874756, 2.7261667251586914, 2.797138214111328, 2.868109703063965, 2.9390811920166016, 3.0100526809692383, 3.081024408340454, 3.151995897293091, 3.2229673862457275, 3.2939391136169434, 3.36491060256958, 3.435882091522217, 3.5068538188934326]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 7.0, 10.0, 4.0, 10.0, 17.0, 19.0, 21.0, 24.0, 46.0, 33.0, 62.0, 33.0, 58.0, 43.0, 42.0, 62.0, 70.0, 50.0, 42.0, 56.0, 44.0, 39.0, 30.0, 40.0, 25.0, 27.0, 7.0, 17.0, 12.0, 14.0, 8.0, 4.0, 7.0, 8.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.235758662223816, -1.2023282051086426, -1.1688977479934692, -1.135467290878296, -1.102036714553833, -1.0686062574386597, -1.0351758003234863, -1.001745343208313, -0.9683148860931396, -0.9348844289779663, -0.901453971862793, -0.8680234551429749, -0.8345929980278015, -0.8011625409126282, -0.7677320241928101, -0.7343015670776367, -0.7008711099624634, -0.66744065284729, -0.6340101957321167, -0.6005796790122986, -0.5671492218971252, -0.5337187647819519, -0.5002882480621338, -0.46685779094696045, -0.4334273338317871, -0.39999687671661377, -0.36656638979911804, -0.3331359028816223, -0.299705445766449, -0.26627498865127563, -0.2328445017337799, -0.19941402971744537, -0.16598361730575562, -0.13255314528942108, -0.09912267327308655, -0.06569220125675201, -0.03226172924041748, 0.0011687427759170532, 0.03459921479225159, 0.06802968680858612, 0.10146015882492065, 0.1348906308412552, 0.16832110285758972, 0.20175157487392426, 0.2351820468902588, 0.26861250400543213, 0.30204299092292786, 0.3354734778404236, 0.3689039349555969, 0.40233439207077026, 0.435764878988266, 0.4691953659057617, 0.5026258230209351, 0.5360562801361084, 0.5694867372512817, 0.6029172539710999, 0.6363477110862732, 0.6697781682014465, 0.7032086849212646, 0.736639142036438, 0.7700695991516113, 0.8035000562667847, 0.836930513381958, 0.8703610301017761, 0.9037914872169495]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 3.0, 5.0, 11.0, 7.0, 10.0, 21.0, 11.0, 24.0, 52.0, 100.0, 250.0, 680.0, 2334.0, 10116.0, 79330.0, 880376.0, 62839.0, 9020.0, 2186.0, 687.0, 243.0, 102.0, 48.0, 28.0, 19.0, 10.0, 9.0, 9.0, 5.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.69140625, -1.643707275390625, -1.59600830078125, -1.548309326171875, -1.5006103515625, -1.452911376953125, -1.40521240234375, -1.357513427734375, -1.309814453125, -1.262115478515625, -1.21441650390625, -1.166717529296875, -1.1190185546875, -1.071319580078125, -1.02362060546875, -0.975921630859375, -0.92822265625, -0.880523681640625, -0.83282470703125, -0.785125732421875, -0.7374267578125, -0.689727783203125, -0.64202880859375, -0.594329833984375, -0.546630859375, -0.498931884765625, -0.45123291015625, -0.403533935546875, -0.3558349609375, -0.308135986328125, -0.26043701171875, -0.212738037109375, -0.1650390625, -0.117340087890625, -0.06964111328125, -0.021942138671875, 0.0257568359375, 0.073455810546875, 0.12115478515625, 0.168853759765625, 0.216552734375, 0.264251708984375, 0.31195068359375, 0.359649658203125, 0.4073486328125, 0.455047607421875, 0.50274658203125, 0.550445556640625, 0.59814453125, 0.645843505859375, 0.69354248046875, 0.741241455078125, 0.7889404296875, 0.836639404296875, 0.88433837890625, 0.932037353515625, 0.979736328125, 1.027435302734375, 1.07513427734375, 1.122833251953125, 1.1705322265625, 1.218231201171875, 1.26593017578125, 1.313629150390625, 1.361328125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 14.0, 10.0, 25.0, 54.0, 82.0, 109.0, 149.0, 174.0, 114.0, 113.0, 73.0, 35.0, 25.0, 14.0, 4.0, 7.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73486328125, -0.6840133666992188, -0.6331634521484375, -0.5823135375976562, -0.531463623046875, -0.48061370849609375, -0.4297637939453125, -0.37891387939453125, -0.32806396484375, -0.27721405029296875, -0.2263641357421875, -0.17551422119140625, -0.124664306640625, -0.07381439208984375, -0.0229644775390625, 0.02788543701171875, 0.0787353515625, 0.12958526611328125, 0.1804351806640625, 0.23128509521484375, 0.282135009765625, 0.33298492431640625, 0.3838348388671875, 0.43468475341796875, 0.48553466796875, 0.5363845825195312, 0.5872344970703125, 0.6380844116210938, 0.688934326171875, 0.7397842407226562, 0.7906341552734375, 0.8414840698242188, 0.892333984375, 0.9431838989257812, 0.9940338134765625, 1.0448837280273438, 1.095733642578125, 1.1465835571289062, 1.1974334716796875, 1.2482833862304688, 1.29913330078125, 1.3499832153320312, 1.4008331298828125, 1.4516830444335938, 1.502532958984375, 1.5533828735351562, 1.6042327880859375, 1.6550827026367188, 1.7059326171875, 1.7567825317382812, 1.8076324462890625, 1.8584823608398438, 1.909332275390625, 1.9601821899414062, 2.0110321044921875, 2.0618820190429688, 2.11273193359375, 2.1635818481445312, 2.2144317626953125, 2.2652816772460938, 2.316131591796875, 2.3669815063476562, 2.4178314208984375, 2.4686813354492188, 2.51953125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 7.0, 14.0, 9.0, 8.0, 14.0, 26.0, 34.0, 45.0, 85.0, 133.0, 269.0, 555.0, 1358.0, 4006.0, 15443.0, 87510.0, 645565.0, 249448.0, 32739.0, 7386.0, 2121.0, 836.0, 393.0, 201.0, 114.0, 76.0, 59.0, 31.0, 22.0, 19.0, 9.0, 8.0, 3.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.84375, -0.8235321044921875, -0.803314208984375, -0.7830963134765625, -0.76287841796875, -0.7426605224609375, -0.722442626953125, -0.7022247314453125, -0.6820068359375, -0.6617889404296875, -0.641571044921875, -0.6213531494140625, -0.60113525390625, -0.5809173583984375, -0.560699462890625, -0.5404815673828125, -0.520263671875, -0.5000457763671875, -0.479827880859375, -0.4596099853515625, -0.43939208984375, -0.4191741943359375, -0.398956298828125, -0.3787384033203125, -0.3585205078125, -0.3383026123046875, -0.318084716796875, -0.2978668212890625, -0.27764892578125, -0.2574310302734375, -0.237213134765625, -0.2169952392578125, -0.19677734375, -0.1765594482421875, -0.156341552734375, -0.1361236572265625, -0.11590576171875, -0.0956878662109375, -0.075469970703125, -0.0552520751953125, -0.0350341796875, -0.0148162841796875, 0.005401611328125, 0.0256195068359375, 0.04583740234375, 0.0660552978515625, 0.086273193359375, 0.1064910888671875, 0.126708984375, 0.1469268798828125, 0.167144775390625, 0.1873626708984375, 0.20758056640625, 0.2277984619140625, 0.248016357421875, 0.2682342529296875, 0.2884521484375, 0.3086700439453125, 0.328887939453125, 0.3491058349609375, 0.36932373046875, 0.3895416259765625, 0.409759521484375, 0.4299774169921875, 0.4501953125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 3.0, 3.0, 13.0, 18.0, 26.0, 42.0, 34.0, 35.0, 45.0, 51.0, 71.0, 66.0, 74.0, 84.0, 78.0, 71.0, 57.0, 55.0, 41.0, 27.0, 33.0, 29.0, 18.0, 6.0, 9.0, 6.0, 8.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.025390625, -1.9768829345703125, -1.928375244140625, -1.8798675537109375, -1.83135986328125, -1.7828521728515625, -1.734344482421875, -1.6858367919921875, -1.6373291015625, -1.5888214111328125, -1.540313720703125, -1.4918060302734375, -1.44329833984375, -1.3947906494140625, -1.346282958984375, -1.2977752685546875, -1.249267578125, -1.2007598876953125, -1.152252197265625, -1.1037445068359375, -1.05523681640625, -1.0067291259765625, -0.958221435546875, -0.9097137451171875, -0.8612060546875, -0.8126983642578125, -0.764190673828125, -0.7156829833984375, -0.66717529296875, -0.6186676025390625, -0.570159912109375, -0.5216522216796875, -0.47314453125, -0.4246368408203125, -0.376129150390625, -0.3276214599609375, -0.27911376953125, -0.2306060791015625, -0.182098388671875, -0.1335906982421875, -0.0850830078125, -0.0365753173828125, 0.011932373046875, 0.0604400634765625, 0.10894775390625, 0.1574554443359375, 0.205963134765625, 0.2544708251953125, 0.302978515625, 0.3514862060546875, 0.399993896484375, 0.4485015869140625, 0.49700927734375, 0.5455169677734375, 0.594024658203125, 0.6425323486328125, 0.6910400390625, 0.7395477294921875, 0.788055419921875, 0.8365631103515625, 0.88507080078125, 0.9335784912109375, 0.982086181640625, 1.0305938720703125, 1.0791015625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 5.0, 5.0, 4.0, 7.0, 7.0, 5.0, 6.0, 11.0, 12.0, 19.0, 30.0, 47.0, 60.0, 92.0, 190.0, 374.0, 711.0, 1439.0, 3159.0, 8069.0, 24650.0, 106645.0, 549638.0, 280676.0, 49532.0, 13751.0, 5013.0, 2235.0, 1000.0, 470.0, 270.0, 147.0, 94.0, 48.0, 27.0, 24.0, 14.0, 23.0, 16.0, 9.0, 6.0, 6.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1370849609375, -0.1327686309814453, -0.12845230102539062, -0.12413597106933594, -0.11981964111328125, -0.11550331115722656, -0.11118698120117188, -0.10687065124511719, -0.1025543212890625, -0.09823799133300781, -0.09392166137695312, -0.08960533142089844, -0.08528900146484375, -0.08097267150878906, -0.07665634155273438, -0.07234001159667969, -0.068023681640625, -0.06370735168457031, -0.059391021728515625, -0.05507469177246094, -0.05075836181640625, -0.04644203186035156, -0.042125701904296875, -0.03780937194824219, -0.0334930419921875, -0.029176712036132812, -0.024860382080078125, -0.020544052124023438, -0.01622772216796875, -0.011911392211914062, -0.007595062255859375, -0.0032787322998046875, 0.00103759765625, 0.0053539276123046875, 0.009670257568359375, 0.013986587524414062, 0.01830291748046875, 0.022619247436523438, 0.026935577392578125, 0.03125190734863281, 0.0355682373046875, 0.03988456726074219, 0.044200897216796875, 0.04851722717285156, 0.05283355712890625, 0.05714988708496094, 0.061466217041015625, 0.06578254699707031, 0.070098876953125, 0.07441520690917969, 0.07873153686523438, 0.08304786682128906, 0.08736419677734375, 0.09168052673339844, 0.09599685668945312, 0.10031318664550781, 0.1046295166015625, 0.10894584655761719, 0.11326217651367188, 0.11757850646972656, 0.12189483642578125, 0.12621116638183594, 0.13052749633789062, 0.1348438262939453, 0.13916015625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 8.0, 9.0, 18.0, 14.0, 27.0, 31.0, 55.0, 89.0, 112.0, 130.0, 131.0, 106.0, 79.0, 58.0, 50.0, 22.0, 20.0, 15.0, 7.0, 6.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.414817810058594e-05, -7.139705121517181e-05, -6.864592432975769e-05, -6.589479744434357e-05, -6.314367055892944e-05, -6.039254367351532e-05, -5.7641416788101196e-05, -5.489028990268707e-05, -5.213916301727295e-05, -4.9388036131858826e-05, -4.66369092464447e-05, -4.388578236103058e-05, -4.1134655475616455e-05, -3.838352859020233e-05, -3.563240170478821e-05, -3.2881274819374084e-05, -3.013014793395996e-05, -2.7379021048545837e-05, -2.4627894163131714e-05, -2.187676727771759e-05, -1.9125640392303467e-05, -1.6374513506889343e-05, -1.362338662147522e-05, -1.0872259736061096e-05, -8.121132850646973e-06, -5.370005965232849e-06, -2.6188790798187256e-06, 1.3224780559539795e-07, 2.8833746910095215e-06, 5.634501576423645e-06, 8.385628461837769e-06, 1.1136755347251892e-05, 1.3887882232666016e-05, 1.663900911808014e-05, 1.9390136003494263e-05, 2.2141262888908386e-05, 2.489238977432251e-05, 2.7643516659736633e-05, 3.0394643545150757e-05, 3.314577043056488e-05, 3.5896897315979004e-05, 3.864802420139313e-05, 4.139915108680725e-05, 4.4150277972221375e-05, 4.69014048576355e-05, 4.965253174304962e-05, 5.2403658628463745e-05, 5.515478551387787e-05, 5.790591239929199e-05, 6.0657039284706116e-05, 6.340816617012024e-05, 6.615929305553436e-05, 6.891041994094849e-05, 7.166154682636261e-05, 7.441267371177673e-05, 7.716380059719086e-05, 7.991492748260498e-05, 8.26660543680191e-05, 8.541718125343323e-05, 8.816830813884735e-05, 9.091943502426147e-05, 9.36705619096756e-05, 9.642168879508972e-05, 9.917281568050385e-05, 0.00010192394256591797]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 10.0, 13.0, 15.0, 19.0, 30.0, 52.0, 94.0, 150.0, 275.0, 490.0, 1090.0, 2646.0, 7006.0, 22290.0, 114716.0, 580552.0, 259032.0, 41905.0, 11124.0, 3944.0, 1575.0, 678.0, 356.0, 186.0, 113.0, 65.0, 42.0, 31.0, 13.0, 5.0, 12.0, 5.0, 5.0, 6.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1439208984375, -0.1392345428466797, -0.13454818725585938, -0.12986183166503906, -0.12517547607421875, -0.12048912048339844, -0.11580276489257812, -0.11111640930175781, -0.1064300537109375, -0.10174369812011719, -0.09705734252929688, -0.09237098693847656, -0.08768463134765625, -0.08299827575683594, -0.07831192016601562, -0.07362556457519531, -0.068939208984375, -0.06425285339355469, -0.059566497802734375, -0.05488014221191406, -0.05019378662109375, -0.04550743103027344, -0.040821075439453125, -0.03613471984863281, -0.0314483642578125, -0.026762008666992188, -0.022075653076171875, -0.017389297485351562, -0.01270294189453125, -0.008016586303710938, -0.003330230712890625, 0.0013561248779296875, 0.00604248046875, 0.010728836059570312, 0.015415191650390625, 0.020101547241210938, 0.02478790283203125, 0.029474258422851562, 0.034160614013671875, 0.03884696960449219, 0.0435333251953125, 0.04821968078613281, 0.052906036376953125, 0.05759239196777344, 0.06227874755859375, 0.06696510314941406, 0.07165145874023438, 0.07633781433105469, 0.081024169921875, 0.08571052551269531, 0.09039688110351562, 0.09508323669433594, 0.09976959228515625, 0.10445594787597656, 0.10914230346679688, 0.11382865905761719, 0.1185150146484375, 0.12320137023925781, 0.12788772583007812, 0.13257408142089844, 0.13726043701171875, 0.14194679260253906, 0.14663314819335938, 0.1513195037841797, 0.156005859375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 4.0, 6.0, 4.0, 9.0, 11.0, 12.0, 28.0, 27.0, 33.0, 53.0, 69.0, 85.0, 73.0, 93.0, 87.0, 72.0, 61.0, 50.0, 54.0, 30.0, 34.0, 28.0, 19.0, 7.0, 7.0, 5.0, 3.0, 10.0, 1.0, 3.0, 1.0, 5.0, 3.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.02655029296875, -0.02562856674194336, -0.02470684051513672, -0.023785114288330078, -0.022863388061523438, -0.021941661834716797, -0.021019935607910156, -0.020098209381103516, -0.019176483154296875, -0.018254756927490234, -0.017333030700683594, -0.016411304473876953, -0.015489578247070312, -0.014567852020263672, -0.013646125793457031, -0.01272439956665039, -0.01180267333984375, -0.01088094711303711, -0.009959220886230469, -0.009037494659423828, -0.008115768432617188, -0.007194042205810547, -0.006272315979003906, -0.005350589752197266, -0.004428863525390625, -0.0035071372985839844, -0.0025854110717773438, -0.0016636848449707031, -0.0007419586181640625, 0.00017976760864257812, 0.0011014938354492188, 0.0020232200622558594, 0.0029449462890625, 0.0038666725158691406, 0.004788398742675781, 0.005710124969482422, 0.0066318511962890625, 0.007553577423095703, 0.008475303649902344, 0.009397029876708984, 0.010318756103515625, 0.011240482330322266, 0.012162208557128906, 0.013083934783935547, 0.014005661010742188, 0.014927387237548828, 0.01584911346435547, 0.01677083969116211, 0.01769256591796875, 0.01861429214477539, 0.01953601837158203, 0.020457744598388672, 0.021379470825195312, 0.022301197052001953, 0.023222923278808594, 0.024144649505615234, 0.025066375732421875, 0.025988101959228516, 0.026909828186035156, 0.027831554412841797, 0.028753280639648438, 0.029675006866455078, 0.03059673309326172, 0.03151845932006836, 0.032440185546875]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 3.0, 5.0, 4.0, 12.0, 16.0, 28.0, 46.0, 72.0, 137.0, 206.0, 169.0, 134.0, 83.0, 47.0, 16.0, 7.0, 10.0, 8.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6545525193214417, -0.6040771007537842, -0.5536017417907715, -0.503126323223114, -0.45265090465545654, -0.4021754860877991, -0.351700097322464, -0.3012247085571289, -0.25074928998947144, -0.20027388632297516, -0.14979848265647888, -0.0993230789899826, -0.04884767532348633, 0.0016277432441711426, 0.052103132009506226, 0.10257852077484131, 0.15305393934249878, 0.20352934300899506, 0.25400474667549133, 0.3044801354408264, 0.3549555540084839, 0.40543097257614136, 0.45590636134147644, 0.5063817501068115, 0.556857168674469, 0.6073325872421265, 0.6578079462051392, 0.7082833647727966, 0.7587587833404541, 0.8092342019081116, 0.859709620475769, 0.9101849794387817, 0.960660457611084, 1.0111358165740967, 1.061611294746399, 1.1120866537094116, 1.1625621318817139, 1.2130374908447266, 1.2635128498077393, 1.313988208770752, 1.3644636869430542, 1.414939045906067, 1.4654145240783691, 1.5158898830413818, 1.5663652420043945, 1.6168407201766968, 1.6673160791397095, 1.7177915573120117, 1.7682669162750244, 1.818742275238037, 1.8692177534103394, 1.919693112373352, 1.9701685905456543, 2.020643949508667, 2.0711193084716797, 2.1215946674346924, 2.172070026397705, 2.2225453853607178, 2.2730207443237305, 2.3234963417053223, 2.373971700668335, 2.4244470596313477, 2.4749224185943604, 2.525397777557373, 2.575873374938965]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 11.0, 17.0, 31.0, 54.0, 92.0, 125.0, 130.0, 147.0, 119.0, 106.0, 65.0, 41.0, 29.0, 17.0, 12.0, 4.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7525411248207092, -0.7066251039505005, -0.6607090830802917, -0.614793062210083, -0.568877100944519, -0.5229610800743103, -0.47704505920410156, -0.4311290681362152, -0.38521304726600647, -0.33929702639579773, -0.2933810353279114, -0.24746501445770264, -0.2015490084886551, -0.15563300251960754, -0.1097169816493988, -0.06380099058151245, -0.01788496971130371, 0.028031039983034134, 0.07394704967737198, 0.11986306309700012, 0.16577906906604767, 0.21169507503509521, 0.25761109590530396, 0.3035270869731903, 0.34944310784339905, 0.3953591287136078, 0.44127511978149414, 0.4871911406517029, 0.5331071615219116, 0.5790231227874756, 0.6249392032623291, 0.6708551645278931, 0.7167712450027466, 0.7626872658729553, 0.8086032867431641, 0.854519248008728, 0.9004352688789368, 0.9463512897491455, 0.9922673106193542, 1.038183331489563, 1.084099292755127, 1.130015254020691, 1.1759313344955444, 1.2218472957611084, 1.267763376235962, 1.3136793375015259, 1.3595952987670898, 1.4055113792419434, 1.4514274597167969, 1.4973434209823608, 1.5432595014572144, 1.5891754627227783, 1.6350915431976318, 1.6810075044631958, 1.7269234657287598, 1.7728395462036133, 1.8187555074691772, 1.8646714687347412, 1.9105875492095947, 1.9565035104751587, 2.0024194717407227, 2.048335552215576, 2.0942516326904297, 2.140167474746704, 2.1860835552215576]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 3.0, 3.0, 8.0, 8.0, 12.0, 17.0, 44.0, 98.0, 148.0, 337.0, 798.0, 1916.0, 4919.0, 15207.0, 86139.0, 793889.0, 117410.0, 18334.0, 5544.0, 2091.0, 871.0, 380.0, 174.0, 89.0, 50.0, 31.0, 10.0, 9.0, 3.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-2.08203125, -2.0294036865234375, -1.976776123046875, -1.9241485595703125, -1.87152099609375, -1.8188934326171875, -1.766265869140625, -1.7136383056640625, -1.6610107421875, -1.6083831787109375, -1.555755615234375, -1.5031280517578125, -1.45050048828125, -1.3978729248046875, -1.345245361328125, -1.2926177978515625, -1.239990234375, -1.1873626708984375, -1.134735107421875, -1.0821075439453125, -1.02947998046875, -0.9768524169921875, -0.924224853515625, -0.8715972900390625, -0.8189697265625, -0.7663421630859375, -0.713714599609375, -0.6610870361328125, -0.60845947265625, -0.5558319091796875, -0.503204345703125, -0.4505767822265625, -0.39794921875, -0.3453216552734375, -0.292694091796875, -0.2400665283203125, -0.18743896484375, -0.1348114013671875, -0.082183837890625, -0.0295562744140625, 0.0230712890625, 0.0756988525390625, 0.128326416015625, 0.1809539794921875, 0.23358154296875, 0.2862091064453125, 0.338836669921875, 0.3914642333984375, 0.444091796875, 0.4967193603515625, 0.549346923828125, 0.6019744873046875, 0.65460205078125, 0.7072296142578125, 0.759857177734375, 0.8124847412109375, 0.8651123046875, 0.9177398681640625, 0.970367431640625, 1.0229949951171875, 1.07562255859375, 1.1282501220703125, 1.180877685546875, 1.2335052490234375, 1.2861328125]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 7.0, 21.0, 35.0, 43.0, 61.0, 84.0, 117.0, 115.0, 118.0, 116.0, 83.0, 73.0, 37.0, 30.0, 23.0, 15.0, 10.0, 9.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2607421875, -1.1877899169921875, -1.114837646484375, -1.0418853759765625, -0.96893310546875, -0.8959808349609375, -0.823028564453125, -0.7500762939453125, -0.6771240234375, -0.6041717529296875, -0.531219482421875, -0.4582672119140625, -0.38531494140625, -0.3123626708984375, -0.239410400390625, -0.1664581298828125, -0.093505859375, -0.0205535888671875, 0.052398681640625, 0.1253509521484375, 0.19830322265625, 0.2712554931640625, 0.344207763671875, 0.4171600341796875, 0.4901123046875, 0.5630645751953125, 0.636016845703125, 0.7089691162109375, 0.78192138671875, 0.8548736572265625, 0.927825927734375, 1.0007781982421875, 1.07373046875, 1.1466827392578125, 1.219635009765625, 1.2925872802734375, 1.36553955078125, 1.4384918212890625, 1.511444091796875, 1.5843963623046875, 1.6573486328125, 1.7303009033203125, 1.803253173828125, 1.8762054443359375, 1.94915771484375, 2.0221099853515625, 2.095062255859375, 2.1680145263671875, 2.240966796875, 2.3139190673828125, 2.386871337890625, 2.4598236083984375, 2.53277587890625, 2.6057281494140625, 2.678680419921875, 2.7516326904296875, 2.8245849609375, 2.8975372314453125, 2.970489501953125, 3.0434417724609375, 3.11639404296875, 3.1893463134765625, 3.262298583984375, 3.3352508544921875, 3.408203125]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 4.0, 3.0, 2.0, 5.0, 4.0, 9.0, 6.0, 16.0, 10.0, 15.0, 12.0, 19.0, 26.0, 32.0, 38.0, 61.0, 68.0, 85.0, 180.0, 321.0, 880.0, 4620.0, 72323.0, 934151.0, 31380.0, 2868.0, 620.0, 248.0, 146.0, 88.0, 56.0, 47.0, 34.0, 35.0, 27.0, 21.0, 20.0, 18.0, 16.0, 3.0, 9.0, 5.0, 10.0, 2.0, 4.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.9375, -2.85205078125, -2.7666015625, -2.68115234375, -2.595703125, -2.51025390625, -2.4248046875, -2.33935546875, -2.25390625, -2.16845703125, -2.0830078125, -1.99755859375, -1.912109375, -1.82666015625, -1.7412109375, -1.65576171875, -1.5703125, -1.48486328125, -1.3994140625, -1.31396484375, -1.228515625, -1.14306640625, -1.0576171875, -0.97216796875, -0.88671875, -0.80126953125, -0.7158203125, -0.63037109375, -0.544921875, -0.45947265625, -0.3740234375, -0.28857421875, -0.203125, -0.11767578125, -0.0322265625, 0.05322265625, 0.138671875, 0.22412109375, 0.3095703125, 0.39501953125, 0.48046875, 0.56591796875, 0.6513671875, 0.73681640625, 0.822265625, 0.90771484375, 0.9931640625, 1.07861328125, 1.1640625, 1.24951171875, 1.3349609375, 1.42041015625, 1.505859375, 1.59130859375, 1.6767578125, 1.76220703125, 1.84765625, 1.93310546875, 2.0185546875, 2.10400390625, 2.189453125, 2.27490234375, 2.3603515625, 2.44580078125, 2.53125]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 7.0, 8.0, 5.0, 5.0, 4.0, 6.0, 10.0, 10.0, 11.0, 25.0, 17.0, 23.0, 24.0, 31.0, 43.0, 35.0, 32.0, 43.0, 45.0, 57.0, 36.0, 34.0, 43.0, 51.0, 38.0, 46.0, 42.0, 41.0, 27.0, 34.0, 23.0, 29.0, 22.0, 21.0, 16.0, 14.0, 9.0, 6.0, 6.0, 8.0, 8.0, 6.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.0302734375, -1.0003662109375, -0.970458984375, -0.9405517578125, -0.91064453125, -0.8807373046875, -0.850830078125, -0.8209228515625, -0.791015625, -0.7611083984375, -0.731201171875, -0.7012939453125, -0.67138671875, -0.6414794921875, -0.611572265625, -0.5816650390625, -0.5517578125, -0.5218505859375, -0.491943359375, -0.4620361328125, -0.43212890625, -0.4022216796875, -0.372314453125, -0.3424072265625, -0.3125, -0.2825927734375, -0.252685546875, -0.2227783203125, -0.19287109375, -0.1629638671875, -0.133056640625, -0.1031494140625, -0.0732421875, -0.0433349609375, -0.013427734375, 0.0164794921875, 0.04638671875, 0.0762939453125, 0.106201171875, 0.1361083984375, 0.166015625, 0.1959228515625, 0.225830078125, 0.2557373046875, 0.28564453125, 0.3155517578125, 0.345458984375, 0.3753662109375, 0.4052734375, 0.4351806640625, 0.465087890625, 0.4949951171875, 0.52490234375, 0.5548095703125, 0.584716796875, 0.6146240234375, 0.64453125, 0.6744384765625, 0.704345703125, 0.7342529296875, 0.76416015625, 0.7940673828125, 0.823974609375, 0.8538818359375, 0.8837890625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 6.0, 10.0, 11.0, 13.0, 32.0, 38.0, 63.0, 124.0, 203.0, 420.0, 858.0, 2075.0, 6351.0, 24757.0, 199992.0, 731518.0, 63790.0, 12095.0, 3614.0, 1338.0, 580.0, 287.0, 168.0, 73.0, 57.0, 33.0, 15.0, 13.0, 9.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.472900390625, -0.4567375183105469, -0.44057464599609375, -0.4244117736816406, -0.4082489013671875, -0.3920860290527344, -0.37592315673828125, -0.3597602844238281, -0.343597412109375, -0.3274345397949219, -0.31127166748046875, -0.2951087951660156, -0.2789459228515625, -0.2627830505371094, -0.24662017822265625, -0.23045730590820312, -0.21429443359375, -0.19813156127929688, -0.18196868896484375, -0.16580581665039062, -0.1496429443359375, -0.13348007202148438, -0.11731719970703125, -0.10115432739257812, -0.084991455078125, -0.06882858276367188, -0.05266571044921875, -0.036502838134765625, -0.0203399658203125, -0.004177093505859375, 0.01198577880859375, 0.028148651123046875, 0.0443115234375, 0.060474395751953125, 0.07663726806640625, 0.09280014038085938, 0.1089630126953125, 0.12512588500976562, 0.14128875732421875, 0.15745162963867188, 0.173614501953125, 0.18977737426757812, 0.20594024658203125, 0.22210311889648438, 0.2382659912109375, 0.2544288635253906, 0.27059173583984375, 0.2867546081542969, 0.30291748046875, 0.3190803527832031, 0.33524322509765625, 0.3514060974121094, 0.3675689697265625, 0.3837318420410156, 0.39989471435546875, 0.4160575866699219, 0.432220458984375, 0.4483833312988281, 0.46454620361328125, 0.4807090759277344, 0.4968719482421875, 0.5130348205566406, 0.5291976928710938, 0.5453605651855469, 0.5615234375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 7.0, 1.0, 4.0, 2.0, 5.0, 8.0, 4.0, 10.0, 9.0, 7.0, 24.0, 29.0, 49.0, 49.0, 77.0, 80.0, 136.0, 153.0, 98.0, 76.0, 47.0, 28.0, 23.0, 17.0, 12.0, 14.0, 6.0, 3.0, 5.0, 4.0, 4.0, 2.0, 1.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.073713302612305e-05, -5.8708712458610535e-05, -5.668029189109802e-05, -5.465187132358551e-05, -5.2623450756073e-05, -5.0595030188560486e-05, -4.8566609621047974e-05, -4.653818905353546e-05, -4.450976848602295e-05, -4.248134791851044e-05, -4.0452927350997925e-05, -3.842450678348541e-05, -3.63960862159729e-05, -3.436766564846039e-05, -3.2339245080947876e-05, -3.0310824513435364e-05, -2.828240394592285e-05, -2.625398337841034e-05, -2.4225562810897827e-05, -2.2197142243385315e-05, -2.0168721675872803e-05, -1.814030110836029e-05, -1.611188054084778e-05, -1.4083459973335266e-05, -1.2055039405822754e-05, -1.0026618838310242e-05, -7.99819827079773e-06, -5.969777703285217e-06, -3.941357135772705e-06, -1.912936568260193e-06, 1.1548399925231934e-07, 2.1439045667648315e-06, 4.172325134277344e-06, 6.200745701789856e-06, 8.229166269302368e-06, 1.025758683681488e-05, 1.2286007404327393e-05, 1.4314427971839905e-05, 1.6342848539352417e-05, 1.837126910686493e-05, 2.039968967437744e-05, 2.2428110241889954e-05, 2.4456530809402466e-05, 2.6484951376914978e-05, 2.851337194442749e-05, 3.054179251194e-05, 3.2570213079452515e-05, 3.459863364696503e-05, 3.662705421447754e-05, 3.865547478199005e-05, 4.0683895349502563e-05, 4.2712315917015076e-05, 4.474073648452759e-05, 4.67691570520401e-05, 4.879757761955261e-05, 5.0825998187065125e-05, 5.285441875457764e-05, 5.488283932209015e-05, 5.691125988960266e-05, 5.893968045711517e-05, 6.0968101024627686e-05, 6.29965215921402e-05, 6.502494215965271e-05, 6.705336272716522e-05, 6.908178329467773e-05]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 11.0, 11.0, 9.0, 27.0, 32.0, 51.0, 73.0, 107.0, 167.0, 331.0, 721.0, 1590.0, 4572.0, 17522.0, 106061.0, 751930.0, 136196.0, 20440.0, 5265.0, 1821.0, 694.0, 368.0, 212.0, 102.0, 70.0, 45.0, 36.0, 24.0, 16.0, 10.0, 6.0, 7.0, 6.0, 5.0, 3.0, 1.0, 0.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.427978515625, -0.4134979248046875, -0.399017333984375, -0.3845367431640625, -0.37005615234375, -0.3555755615234375, -0.341094970703125, -0.3266143798828125, -0.3121337890625, -0.2976531982421875, -0.283172607421875, -0.2686920166015625, -0.25421142578125, -0.2397308349609375, -0.225250244140625, -0.2107696533203125, -0.1962890625, -0.1818084716796875, -0.167327880859375, -0.1528472900390625, -0.13836669921875, -0.1238861083984375, -0.109405517578125, -0.0949249267578125, -0.0804443359375, -0.0659637451171875, -0.051483154296875, -0.0370025634765625, -0.02252197265625, -0.0080413818359375, 0.006439208984375, 0.0209197998046875, 0.035400390625, 0.0498809814453125, 0.064361572265625, 0.0788421630859375, 0.09332275390625, 0.1078033447265625, 0.122283935546875, 0.1367645263671875, 0.1512451171875, 0.1657257080078125, 0.180206298828125, 0.1946868896484375, 0.20916748046875, 0.2236480712890625, 0.238128662109375, 0.2526092529296875, 0.26708984375, 0.2815704345703125, 0.296051025390625, 0.3105316162109375, 0.32501220703125, 0.3394927978515625, 0.353973388671875, 0.3684539794921875, 0.3829345703125, 0.3974151611328125, 0.411895751953125, 0.4263763427734375, 0.44085693359375, 0.4553375244140625, 0.469818115234375, 0.4842987060546875, 0.498779296875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 6.0, 4.0, 7.0, 3.0, 8.0, 13.0, 12.0, 14.0, 21.0, 21.0, 30.0, 30.0, 51.0, 36.0, 71.0, 77.0, 112.0, 120.0, 85.0, 64.0, 38.0, 37.0, 29.0, 20.0, 27.0, 11.0, 12.0, 6.0, 3.0, 7.0, 8.0, 3.0, 3.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.138916015625, -0.13480091094970703, -0.13068580627441406, -0.1265707015991211, -0.12245559692382812, -0.11834049224853516, -0.11422538757324219, -0.11011028289794922, -0.10599517822265625, -0.10188007354736328, -0.09776496887207031, -0.09364986419677734, -0.08953475952148438, -0.0854196548461914, -0.08130455017089844, -0.07718944549560547, -0.0730743408203125, -0.06895923614501953, -0.06484413146972656, -0.060729026794433594, -0.056613922119140625, -0.052498817443847656, -0.04838371276855469, -0.04426860809326172, -0.04015350341796875, -0.03603839874267578, -0.03192329406738281, -0.027808189392089844, -0.023693084716796875, -0.019577980041503906, -0.015462875366210938, -0.011347770690917969, -0.007232666015625, -0.0031175613403320312, 0.0009975433349609375, 0.005112648010253906, 0.009227752685546875, 0.013342857360839844, 0.017457962036132812, 0.02157306671142578, 0.02568817138671875, 0.02980327606201172, 0.03391838073730469, 0.038033485412597656, 0.042148590087890625, 0.046263694763183594, 0.05037879943847656, 0.05449390411376953, 0.0586090087890625, 0.06272411346435547, 0.06683921813964844, 0.0709543228149414, 0.07506942749023438, 0.07918453216552734, 0.08329963684082031, 0.08741474151611328, 0.09152984619140625, 0.09564495086669922, 0.09976005554199219, 0.10387516021728516, 0.10799026489257812, 0.1121053695678711, 0.11622047424316406, 0.12033557891845703, 0.12445068359375]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 6.0, 22.0, 101.0, 454.0, 363.0, 54.0, 13.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7026970386505127, -1.356335163116455, -1.009973168373108, -0.6636111736297607, -0.3172492980957031, 0.029112577438354492, 0.3754746913909912, 0.7218365669250488, 1.0681984424591064, 1.414560317993164, 1.7609223127365112, 2.1072843074798584, 2.453646183013916, 2.8000080585479736, 3.1463701725006104, 3.492732048034668, 3.8390939235687256, 4.185455799102783, 4.53181791305542, 4.878179550170898, 5.224541664123535, 5.570903778076172, 5.917265892028809, 6.263627529144287, 6.609989166259766, 6.956351280212402, 7.302712917327881, 7.649075031280518, 7.995436668395996, 8.341798782348633, 8.68816089630127, 9.034523010253906, 9.380884170532227, 9.727246284484863, 10.0736083984375, 10.41996955871582, 10.766331672668457, 11.112693786621094, 11.45905590057373, 11.805418014526367, 12.151779174804688, 12.498141288757324, 12.844503402709961, 13.190864562988281, 13.537226676940918, 13.883588790893555, 14.229950904846191, 14.576313018798828, 14.922675132751465, 15.269037246704102, 15.615399360656738, 15.961761474609375, 16.308122634887695, 16.654483795166016, 17.00084686279297, 17.34720802307129, 17.693571090698242, 18.039932250976562, 18.386295318603516, 18.732656478881836, 19.07901954650879, 19.42538070678711, 19.771743774414062, 20.118104934692383, 20.464466094970703]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 7.0, 10.0, 7.0, 12.0, 18.0, 23.0, 24.0, 34.0, 33.0, 60.0, 59.0, 62.0, 63.0, 63.0, 83.0, 69.0, 57.0, 65.0, 58.0, 45.0, 32.0, 29.0, 28.0, 18.0, 11.0, 17.0, 6.0, 7.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.812613844871521, -1.7350279092788696, -1.6574418544769287, -1.5798559188842773, -1.502269983291626, -1.424683928489685, -1.3470979928970337, -1.2695119380950928, -1.1919260025024414, -1.11434006690979, -1.0367540121078491, -0.9591680765151978, -0.8815820813179016, -0.8039960861206055, -0.7264101505279541, -0.648824155330658, -0.5712381601333618, -0.4936521649360657, -0.4160661995410919, -0.33848023414611816, -0.260894238948822, -0.18330824375152588, -0.10572227835655212, -0.02813631296157837, 0.04944968223571777, 0.12703566253185272, 0.20462164282798767, 0.2822076082229614, 0.35979360342025757, 0.4373795986175537, 0.5149655342102051, 0.5925515294075012, 0.6701374053955078, 0.747723400592804, 0.8253093957901001, 0.9028953313827515, 0.9804813265800476, 1.0580673217773438, 1.1356532573699951, 1.2132391929626465, 1.2908252477645874, 1.3684111833572388, 1.4459972381591797, 1.523583173751831, 1.6011691093444824, 1.6787551641464233, 1.7563410997390747, 1.8339271545410156, 1.911513090133667, 1.9890990257263184, 2.0666849613189697, 2.1442711353302, 2.2218570709228516, 2.299443006515503, 2.3770289421081543, 2.4546148777008057, 2.532200813293457, 2.6097867488861084, 2.6873726844787598, 2.7649588584899902, 2.8425447940826416, 2.920130729675293, 2.9977166652679443, 3.0753026008605957, 3.152888774871826]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 5.0, 4.0, 9.0, 16.0, 25.0, 30.0, 49.0, 97.0, 205.0, 397.0, 1160.0, 4712.0, 44125.0, 3222709.0, 897542.0, 18333.0, 3129.0, 979.0, 374.0, 168.0, 84.0, 50.0, 26.0, 21.0, 8.0, 8.0, 9.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.4609375, -3.366973876953125, -3.27301025390625, -3.179046630859375, -3.0850830078125, -2.991119384765625, -2.89715576171875, -2.803192138671875, -2.709228515625, -2.615264892578125, -2.52130126953125, -2.427337646484375, -2.3333740234375, -2.239410400390625, -2.14544677734375, -2.051483154296875, -1.95751953125, -1.863555908203125, -1.76959228515625, -1.675628662109375, -1.5816650390625, -1.487701416015625, -1.39373779296875, -1.299774169921875, -1.205810546875, -1.111846923828125, -1.01788330078125, -0.923919677734375, -0.8299560546875, -0.735992431640625, -0.64202880859375, -0.548065185546875, -0.4541015625, -0.360137939453125, -0.26617431640625, -0.172210693359375, -0.0782470703125, 0.015716552734375, 0.10968017578125, 0.203643798828125, 0.297607421875, 0.391571044921875, 0.48553466796875, 0.579498291015625, 0.6734619140625, 0.767425537109375, 0.86138916015625, 0.955352783203125, 1.04931640625, 1.143280029296875, 1.23724365234375, 1.331207275390625, 1.4251708984375, 1.519134521484375, 1.61309814453125, 1.707061767578125, 1.801025390625, 1.894989013671875, 1.98895263671875, 2.082916259765625, 2.1768798828125, 2.270843505859375, 2.36480712890625, 2.458770751953125, 2.552734375]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 8.0, 5.0, 18.0, 11.0, 32.0, 25.0, 27.0, 45.0, 44.0, 76.0, 71.0, 69.0, 68.0, 62.0, 76.0, 69.0, 62.0, 54.0, 38.0, 34.0, 26.0, 19.0, 18.0, 10.0, 10.0, 8.0, 5.0, 2.0, 3.0, 0.0, 0.0, 3.0, 5.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.3486328125, -1.3150558471679688, -1.2814788818359375, -1.2479019165039062, -1.214324951171875, -1.1807479858398438, -1.1471710205078125, -1.1135940551757812, -1.08001708984375, -1.0464401245117188, -1.0128631591796875, -0.9792861938476562, -0.945709228515625, -0.9121322631835938, -0.8785552978515625, -0.8449783325195312, -0.8114013671875, -0.7778244018554688, -0.7442474365234375, -0.7106704711914062, -0.677093505859375, -0.6435165405273438, -0.6099395751953125, -0.5763626098632812, -0.54278564453125, -0.5092086791992188, -0.4756317138671875, -0.44205474853515625, -0.408477783203125, -0.37490081787109375, -0.3413238525390625, -0.30774688720703125, -0.274169921875, -0.24059295654296875, -0.2070159912109375, -0.17343902587890625, -0.139862060546875, -0.10628509521484375, -0.0727081298828125, -0.03913116455078125, -0.00555419921875, 0.02802276611328125, 0.0615997314453125, 0.09517669677734375, 0.128753662109375, 0.16233062744140625, 0.1959075927734375, 0.22948455810546875, 0.2630615234375, 0.29663848876953125, 0.3302154541015625, 0.36379241943359375, 0.397369384765625, 0.43094635009765625, 0.4645233154296875, 0.49810028076171875, 0.53167724609375, 0.5652542114257812, 0.5988311767578125, 0.6324081420898438, 0.665985107421875, 0.6995620727539062, 0.7331390380859375, 0.7667160034179688, 0.80029296875]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 5.0, 6.0, 6.0, 10.0, 10.0, 7.0, 18.0, 25.0, 35.0, 36.0, 57.0, 74.0, 122.0, 235.0, 501.0, 1374.0, 5856.0, 54700.0, 3414845.0, 689196.0, 22207.0, 3107.0, 951.0, 327.0, 210.0, 95.0, 75.0, 38.0, 38.0, 22.0, 12.0, 14.0, 21.0, 7.0, 13.0, 10.0, 2.0, 4.0, 4.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 3.0], "bins": [-2.357421875, -2.2934112548828125, -2.229400634765625, -2.1653900146484375, -2.10137939453125, -2.0373687744140625, -1.973358154296875, -1.9093475341796875, -1.8453369140625, -1.7813262939453125, -1.717315673828125, -1.6533050537109375, -1.58929443359375, -1.5252838134765625, -1.461273193359375, -1.3972625732421875, -1.333251953125, -1.2692413330078125, -1.205230712890625, -1.1412200927734375, -1.07720947265625, -1.0131988525390625, -0.949188232421875, -0.8851776123046875, -0.8211669921875, -0.7571563720703125, -0.693145751953125, -0.6291351318359375, -0.56512451171875, -0.5011138916015625, -0.437103271484375, -0.3730926513671875, -0.30908203125, -0.2450714111328125, -0.181060791015625, -0.1170501708984375, -0.05303955078125, 0.0109710693359375, 0.074981689453125, 0.1389923095703125, 0.2030029296875, 0.2670135498046875, 0.331024169921875, 0.3950347900390625, 0.45904541015625, 0.5230560302734375, 0.587066650390625, 0.6510772705078125, 0.715087890625, 0.7790985107421875, 0.843109130859375, 0.9071197509765625, 0.97113037109375, 1.0351409912109375, 1.099151611328125, 1.1631622314453125, 1.2271728515625, 1.2911834716796875, 1.355194091796875, 1.4192047119140625, 1.48321533203125, 1.5472259521484375, 1.611236572265625, 1.6752471923828125, 1.7392578125]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 6.0, 8.0, 8.0, 10.0, 17.0, 16.0, 21.0, 36.0, 54.0, 66.0, 105.0, 148.0, 216.0, 397.0, 553.0, 670.0, 559.0, 373.0, 248.0, 164.0, 117.0, 85.0, 59.0, 33.0, 29.0, 18.0, 18.0, 8.0, 7.0, 8.0, 4.0, 2.0, 6.0, 5.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23486328125, -0.22488784790039062, -0.21491241455078125, -0.20493698120117188, -0.1949615478515625, -0.18498611450195312, -0.17501068115234375, -0.16503524780273438, -0.155059814453125, -0.14508438110351562, -0.13510894775390625, -0.12513351440429688, -0.1151580810546875, -0.10518264770507812, -0.09520721435546875, -0.08523178100585938, -0.07525634765625, -0.06528091430664062, -0.05530548095703125, -0.045330047607421875, -0.0353546142578125, -0.025379180908203125, -0.01540374755859375, -0.005428314208984375, 0.004547119140625, 0.014522552490234375, 0.02449798583984375, 0.034473419189453125, 0.0444488525390625, 0.054424285888671875, 0.06439971923828125, 0.07437515258789062, 0.0843505859375, 0.09432601928710938, 0.10430145263671875, 0.11427688598632812, 0.1242523193359375, 0.13422775268554688, 0.14420318603515625, 0.15417861938476562, 0.164154052734375, 0.17412948608398438, 0.18410491943359375, 0.19408035278320312, 0.2040557861328125, 0.21403121948242188, 0.22400665283203125, 0.23398208618164062, 0.24395751953125, 0.2539329528808594, 0.26390838623046875, 0.2738838195800781, 0.2838592529296875, 0.2938346862792969, 0.30381011962890625, 0.3137855529785156, 0.323760986328125, 0.3337364196777344, 0.34371185302734375, 0.3536872863769531, 0.3636627197265625, 0.3736381530761719, 0.38361358642578125, 0.3935890197753906, 0.403564453125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 5.0, 5.0, 6.0, 8.0, 10.0, 21.0, 32.0, 47.0, 58.0, 91.0, 113.0, 145.0, 113.0, 92.0, 77.0, 59.0, 39.0, 35.0, 15.0, 8.0, 5.0, 11.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0261210203170776, -0.97418612241745, -0.9222512245178223, -0.8703163862228394, -0.8183814883232117, -0.766446590423584, -0.7145117521286011, -0.6625768542289734, -0.6106419563293457, -0.558707058429718, -0.5067721605300903, -0.4548373222351074, -0.40290242433547974, -0.35096752643585205, -0.29903265833854675, -0.24709779024124146, -0.19516289234161377, -0.14322800934314728, -0.09129312634468079, -0.039358243346214294, 0.012576639652252197, 0.06451153755187988, 0.11644640564918518, 0.16838127374649048, 0.22031617164611816, 0.27225106954574585, 0.32418593764305115, 0.37612080574035645, 0.42805570363998413, 0.4799906015396118, 0.5319254398345947, 0.5838603377342224, 0.6357951164245605, 0.6877300143241882, 0.7396649122238159, 0.7915997505187988, 0.8435346484184265, 0.8954695463180542, 0.9474043846130371, 0.9993392825126648, 1.0512741804122925, 1.1032090187072754, 1.1551439762115479, 1.2070788145065308, 1.2590136528015137, 1.3109486103057861, 1.362883448600769, 1.414818286895752, 1.4667532444000244, 1.5186880826950073, 1.5706230401992798, 1.6225578784942627, 1.6744928359985352, 1.726427674293518, 1.778362512588501, 1.8302974700927734, 1.8822323083877563, 1.9341671466827393, 1.9861021041870117, 2.038037061691284, 2.0899717807769775, 2.14190673828125, 2.1938416957855225, 2.245776414871216, 2.2977113723754883]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 6.0, 6.0, 12.0, 9.0, 12.0, 20.0, 21.0, 27.0, 26.0, 32.0, 40.0, 58.0, 49.0, 53.0, 57.0, 62.0, 46.0, 55.0, 52.0, 49.0, 47.0, 42.0, 32.0, 33.0, 23.0, 26.0, 15.0, 21.0, 21.0, 9.0, 13.0, 8.0, 6.0, 5.0, 3.0, 2.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.990574061870575, -0.9623443484306335, -0.9341146945953369, -0.9058849811553955, -0.8776552677154541, -0.8494255542755127, -0.8211958408355713, -0.7929661870002747, -0.7647364735603333, -0.7365067601203918, -0.7082771062850952, -0.6800473928451538, -0.6518176794052124, -0.623587965965271, -0.5953582525253296, -0.567128598690033, -0.5388988852500916, -0.5106691718101501, -0.48243948817253113, -0.4542098045349121, -0.4259800910949707, -0.3977503776550293, -0.3695206940174103, -0.34129101037979126, -0.31306129693984985, -0.28483158349990845, -0.25660189986228943, -0.22837220132350922, -0.200142502784729, -0.1719128042459488, -0.14368310570716858, -0.11545340716838837, -0.08722364902496338, -0.058993950486183167, -0.030764251947402954, -0.0025345534086227417, 0.02569514513015747, 0.05392484366893768, 0.0821545422077179, 0.11038424074649811, 0.13861393928527832, 0.16684363782405853, 0.19507333636283875, 0.22330303490161896, 0.25153273344039917, 0.2797624468803406, 0.3079921305179596, 0.3362218141555786, 0.36445152759552, 0.3926812410354614, 0.42091092467308044, 0.44914060831069946, 0.47737032175064087, 0.5056000351905823, 0.5338296890258789, 0.5620594024658203, 0.5902891159057617, 0.6185188293457031, 0.6467485427856445, 0.6749781966209412, 0.7032079100608826, 0.731437623500824, 0.7596672773361206, 0.787896990776062, 0.8161267042160034]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 1.0, 4.0, 3.0, 1.0, 10.0, 15.0, 11.0, 21.0, 24.0, 28.0, 32.0, 55.0, 99.0, 246.0, 682.0, 3123.0, 18770.0, 241007.0, 719379.0, 55718.0, 7125.0, 1483.0, 334.0, 144.0, 71.0, 49.0, 20.0, 17.0, 14.0, 14.0, 12.0, 7.0, 5.0, 7.0, 6.0, 5.0, 6.0, 1.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.525390625, -0.5080184936523438, -0.4906463623046875, -0.47327423095703125, -0.455902099609375, -0.43852996826171875, -0.4211578369140625, -0.40378570556640625, -0.38641357421875, -0.36904144287109375, -0.3516693115234375, -0.33429718017578125, -0.316925048828125, -0.29955291748046875, -0.2821807861328125, -0.26480865478515625, -0.2474365234375, -0.23006439208984375, -0.2126922607421875, -0.19532012939453125, -0.177947998046875, -0.16057586669921875, -0.1432037353515625, -0.12583160400390625, -0.10845947265625, -0.09108734130859375, -0.0737152099609375, -0.05634307861328125, -0.038970947265625, -0.02159881591796875, -0.0042266845703125, 0.01314544677734375, 0.030517578125, 0.04788970947265625, 0.0652618408203125, 0.08263397216796875, 0.100006103515625, 0.11737823486328125, 0.1347503662109375, 0.15212249755859375, 0.16949462890625, 0.18686676025390625, 0.2042388916015625, 0.22161102294921875, 0.238983154296875, 0.25635528564453125, 0.2737274169921875, 0.29109954833984375, 0.3084716796875, 0.32584381103515625, 0.3432159423828125, 0.36058807373046875, 0.377960205078125, 0.39533233642578125, 0.4127044677734375, 0.43007659912109375, 0.44744873046875, 0.46482086181640625, 0.4821929931640625, 0.49956512451171875, 0.516937255859375, 0.5343093872070312, 0.5516815185546875, 0.5690536499023438, 0.58642578125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 11.0, 20.0, 28.0, 37.0, 58.0, 87.0, 104.0, 106.0, 115.0, 103.0, 95.0, 77.0, 49.0, 29.0, 38.0, 18.0, 11.0, 9.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.720703125, -0.683624267578125, -0.64654541015625, -0.609466552734375, -0.5723876953125, -0.535308837890625, -0.49822998046875, -0.461151123046875, -0.424072265625, -0.386993408203125, -0.34991455078125, -0.312835693359375, -0.2757568359375, -0.238677978515625, -0.20159912109375, -0.164520263671875, -0.12744140625, -0.090362548828125, -0.05328369140625, -0.016204833984375, 0.0208740234375, 0.057952880859375, 0.09503173828125, 0.132110595703125, 0.169189453125, 0.206268310546875, 0.24334716796875, 0.280426025390625, 0.3175048828125, 0.354583740234375, 0.39166259765625, 0.428741455078125, 0.4658203125, 0.502899169921875, 0.53997802734375, 0.577056884765625, 0.6141357421875, 0.651214599609375, 0.68829345703125, 0.725372314453125, 0.762451171875, 0.799530029296875, 0.83660888671875, 0.873687744140625, 0.9107666015625, 0.947845458984375, 0.98492431640625, 1.022003173828125, 1.05908203125, 1.096160888671875, 1.13323974609375, 1.170318603515625, 1.2073974609375, 1.244476318359375, 1.28155517578125, 1.318634033203125, 1.355712890625, 1.392791748046875, 1.42987060546875, 1.466949462890625, 1.5040283203125, 1.541107177734375, 1.57818603515625, 1.615264892578125, 1.65234375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 4.0, 4.0, 7.0, 8.0, 8.0, 13.0, 13.0, 21.0, 22.0, 26.0, 30.0, 54.0, 101.0, 129.0, 170.0, 253.0, 520.0, 1127.0, 2991.0, 9122.0, 34599.0, 209043.0, 609902.0, 142515.0, 25815.0, 7324.0, 2529.0, 960.0, 477.0, 240.0, 138.0, 81.0, 85.0, 57.0, 35.0, 27.0, 25.0, 21.0, 14.0, 6.0, 11.0, 11.0, 7.0, 8.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.373291015625, -0.363037109375, -0.352783203125, -0.342529296875, -0.332275390625, -0.322021484375, -0.311767578125, -0.301513671875, -0.291259765625, -0.281005859375, -0.270751953125, -0.260498046875, -0.250244140625, -0.239990234375, -0.229736328125, -0.219482421875, -0.209228515625, -0.198974609375, -0.188720703125, -0.178466796875, -0.168212890625, -0.157958984375, -0.147705078125, -0.137451171875, -0.127197265625, -0.116943359375, -0.106689453125, -0.096435546875, -0.086181640625, -0.075927734375, -0.065673828125, -0.055419921875, -0.045166015625, -0.034912109375, -0.024658203125, -0.014404296875, -0.004150390625, 0.006103515625, 0.016357421875, 0.026611328125, 0.036865234375, 0.047119140625, 0.057373046875, 0.067626953125, 0.077880859375, 0.088134765625, 0.098388671875, 0.108642578125, 0.118896484375, 0.129150390625, 0.139404296875, 0.149658203125, 0.159912109375, 0.170166015625, 0.180419921875, 0.190673828125, 0.200927734375, 0.211181640625, 0.221435546875, 0.231689453125, 0.241943359375, 0.252197265625, 0.262451171875, 0.272705078125, 0.282958984375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 8.0, 3.0, 10.0, 9.0, 11.0, 21.0, 17.0, 23.0, 45.0, 44.0, 49.0, 46.0, 64.0, 77.0, 71.0, 78.0, 61.0, 58.0, 58.0, 47.0, 35.0, 35.0, 42.0, 22.0, 24.0, 14.0, 15.0, 6.0, 8.0, 2.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.37890625, -1.334503173828125, -1.29010009765625, -1.245697021484375, -1.2012939453125, -1.156890869140625, -1.11248779296875, -1.068084716796875, -1.023681640625, -0.979278564453125, -0.93487548828125, -0.890472412109375, -0.8460693359375, -0.801666259765625, -0.75726318359375, -0.712860107421875, -0.66845703125, -0.624053955078125, -0.57965087890625, -0.535247802734375, -0.4908447265625, -0.446441650390625, -0.40203857421875, -0.357635498046875, -0.313232421875, -0.268829345703125, -0.22442626953125, -0.180023193359375, -0.1356201171875, -0.091217041015625, -0.04681396484375, -0.002410888671875, 0.0419921875, 0.086395263671875, 0.13079833984375, 0.175201416015625, 0.2196044921875, 0.264007568359375, 0.30841064453125, 0.352813720703125, 0.397216796875, 0.441619873046875, 0.48602294921875, 0.530426025390625, 0.5748291015625, 0.619232177734375, 0.66363525390625, 0.708038330078125, 0.75244140625, 0.796844482421875, 0.84124755859375, 0.885650634765625, 0.9300537109375, 0.974456787109375, 1.01885986328125, 1.063262939453125, 1.107666015625, 1.152069091796875, 1.19647216796875, 1.240875244140625, 1.2852783203125, 1.329681396484375, 1.37408447265625, 1.418487548828125, 1.462890625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 8.0, 9.0, 12.0, 13.0, 18.0, 44.0, 61.0, 102.0, 219.0, 383.0, 767.0, 1804.0, 4400.0, 13520.0, 53637.0, 408290.0, 479303.0, 62555.0, 14931.0, 4881.0, 1846.0, 831.0, 393.0, 210.0, 120.0, 81.0, 52.0, 11.0, 16.0, 13.0, 10.0, 7.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1444091796875, -0.14061355590820312, -0.13681793212890625, -0.13302230834960938, -0.1292266845703125, -0.12543106079101562, -0.12163543701171875, -0.11783981323242188, -0.114044189453125, -0.11024856567382812, -0.10645294189453125, -0.10265731811523438, -0.0988616943359375, -0.09506607055664062, -0.09127044677734375, -0.08747482299804688, -0.08367919921875, -0.07988357543945312, -0.07608795166015625, -0.07229232788085938, -0.0684967041015625, -0.06470108032226562, -0.06090545654296875, -0.057109832763671875, -0.053314208984375, -0.049518585205078125, -0.04572296142578125, -0.041927337646484375, -0.0381317138671875, -0.034336090087890625, -0.03054046630859375, -0.026744842529296875, -0.02294921875, -0.019153594970703125, -0.01535797119140625, -0.011562347412109375, -0.0077667236328125, -0.003971099853515625, -0.00017547607421875, 0.003620147705078125, 0.007415771484375, 0.011211395263671875, 0.01500701904296875, 0.018802642822265625, 0.0225982666015625, 0.026393890380859375, 0.03018951416015625, 0.033985137939453125, 0.03778076171875, 0.041576385498046875, 0.04537200927734375, 0.049167633056640625, 0.0529632568359375, 0.056758880615234375, 0.06055450439453125, 0.06435012817382812, 0.068145751953125, 0.07194137573242188, 0.07573699951171875, 0.07953262329101562, 0.0833282470703125, 0.08712387084960938, 0.09091949462890625, 0.09471511840820312, 0.0985107421875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 13.0, 15.0, 25.0, 47.0, 72.0, 65.0, 116.0, 140.0, 157.0, 93.0, 76.0, 55.0, 38.0, 21.0, 16.0, 8.0, 10.0, 4.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.967782974243164e-05, -6.783567368984222e-05, -6.599351763725281e-05, -6.415136158466339e-05, -6.230920553207397e-05, -6.046704947948456e-05, -5.862489342689514e-05, -5.6782737374305725e-05, -5.494058132171631e-05, -5.309842526912689e-05, -5.1256269216537476e-05, -4.941411316394806e-05, -4.757195711135864e-05, -4.5729801058769226e-05, -4.388764500617981e-05, -4.204548895359039e-05, -4.0203332901000977e-05, -3.836117684841156e-05, -3.6519020795822144e-05, -3.467686474323273e-05, -3.283470869064331e-05, -3.0992552638053894e-05, -2.9150396585464478e-05, -2.730824053287506e-05, -2.5466084480285645e-05, -2.3623928427696228e-05, -2.178177237510681e-05, -1.9939616322517395e-05, -1.809746026992798e-05, -1.6255304217338562e-05, -1.4413148164749146e-05, -1.2570992112159729e-05, -1.0728836059570312e-05, -8.886680006980896e-06, -7.0445239543914795e-06, -5.202367901802063e-06, -3.3602118492126465e-06, -1.51805579662323e-06, 3.241002559661865e-07, 2.166256308555603e-06, 4.0084123611450195e-06, 5.850568413734436e-06, 7.692724466323853e-06, 9.534880518913269e-06, 1.1377036571502686e-05, 1.3219192624092102e-05, 1.5061348676681519e-05, 1.6903504729270935e-05, 1.874566078186035e-05, 2.0587816834449768e-05, 2.2429972887039185e-05, 2.42721289396286e-05, 2.6114284992218018e-05, 2.7956441044807434e-05, 2.979859709739685e-05, 3.164075314998627e-05, 3.3482909202575684e-05, 3.53250652551651e-05, 3.7167221307754517e-05, 3.900937736034393e-05, 4.085153341293335e-05, 4.2693689465522766e-05, 4.453584551811218e-05, 4.63780015707016e-05, 4.8220157623291016e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 4.0, 4.0, 7.0, 10.0, 16.0, 17.0, 16.0, 37.0, 47.0, 52.0, 99.0, 137.0, 208.0, 355.0, 586.0, 1154.0, 2174.0, 4293.0, 9512.0, 23092.0, 64484.0, 209139.0, 421675.0, 206195.0, 63807.0, 22900.0, 9354.0, 4204.0, 2136.0, 1180.0, 632.0, 378.0, 214.0, 149.0, 84.0, 53.0, 31.0, 38.0, 21.0, 17.0, 9.0, 6.0, 9.0, 4.0, 2.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.062347412109375, -0.06023359298706055, -0.058119773864746094, -0.05600595474243164, -0.05389213562011719, -0.051778316497802734, -0.04966449737548828, -0.04755067825317383, -0.045436859130859375, -0.04332304000854492, -0.04120922088623047, -0.039095401763916016, -0.03698158264160156, -0.03486776351928711, -0.032753944396972656, -0.030640125274658203, -0.02852630615234375, -0.026412487030029297, -0.024298667907714844, -0.02218484878540039, -0.020071029663085938, -0.017957210540771484, -0.01584339141845703, -0.013729572296142578, -0.011615753173828125, -0.009501934051513672, -0.007388114929199219, -0.005274295806884766, -0.0031604766845703125, -0.0010466575622558594, 0.0010671615600585938, 0.003180980682373047, 0.0052947998046875, 0.007408618927001953, 0.009522438049316406, 0.01163625717163086, 0.013750076293945312, 0.015863895416259766, 0.01797771453857422, 0.020091533660888672, 0.022205352783203125, 0.024319171905517578, 0.02643299102783203, 0.028546810150146484, 0.030660629272460938, 0.03277444839477539, 0.034888267517089844, 0.0370020866394043, 0.03911590576171875, 0.0412297248840332, 0.043343544006347656, 0.04545736312866211, 0.04757118225097656, 0.049685001373291016, 0.05179882049560547, 0.05391263961791992, 0.056026458740234375, 0.05814027786254883, 0.06025409698486328, 0.062367916107177734, 0.06448173522949219, 0.06659555435180664, 0.0687093734741211, 0.07082319259643555, 0.07293701171875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 4.0, 2.0, 6.0, 9.0, 9.0, 7.0, 15.0, 14.0, 24.0, 27.0, 24.0, 26.0, 32.0, 56.0, 47.0, 50.0, 54.0, 51.0, 54.0, 52.0, 60.0, 51.0, 42.0, 46.0, 34.0, 35.0, 21.0, 22.0, 16.0, 16.0, 15.0, 11.0, 10.0, 12.0, 10.0, 2.0, 4.0, 6.0, 2.0, 4.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.01556396484375, -0.015073776245117188, -0.014583587646484375, -0.014093399047851562, -0.01360321044921875, -0.013113021850585938, -0.012622833251953125, -0.012132644653320312, -0.0116424560546875, -0.011152267456054688, -0.010662078857421875, -0.010171890258789062, -0.00968170166015625, -0.009191513061523438, -0.008701324462890625, -0.008211135864257812, -0.007720947265625, -0.0072307586669921875, -0.006740570068359375, -0.0062503814697265625, -0.00576019287109375, -0.0052700042724609375, -0.004779815673828125, -0.0042896270751953125, -0.0037994384765625, -0.0033092498779296875, -0.002819061279296875, -0.0023288726806640625, -0.00183868408203125, -0.0013484954833984375, -0.000858306884765625, -0.0003681182861328125, 0.0001220703125, 0.0006122589111328125, 0.001102447509765625, 0.0015926361083984375, 0.00208282470703125, 0.0025730133056640625, 0.003063201904296875, 0.0035533905029296875, 0.0040435791015625, 0.0045337677001953125, 0.005023956298828125, 0.0055141448974609375, 0.00600433349609375, 0.0064945220947265625, 0.006984710693359375, 0.0074748992919921875, 0.007965087890625, 0.008455276489257812, 0.008945465087890625, 0.009435653686523438, 0.00992584228515625, 0.010416030883789062, 0.010906219482421875, 0.011396408081054688, 0.0118865966796875, 0.012376785278320312, 0.012866973876953125, 0.013357162475585938, 0.01384735107421875, 0.014337539672851562, 0.014827728271484375, 0.015317916870117188, 0.01580810546875]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 8.0, 4.0, 7.0, 16.0, 56.0, 135.0, 306.0, 277.0, 138.0, 41.0, 14.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8986907601356506, -0.8168035745620728, -0.7349164485931396, -0.6530292630195618, -0.5711420774459839, -0.4892549514770508, -0.4073677659034729, -0.3254806399345398, -0.24359345436096191, -0.16170629858970642, -0.07981912791728973, 0.002068042755126953, 0.08395519852638245, 0.16584235429763794, 0.24772953987121582, 0.3296166658401489, 0.4115038514137268, 0.4933910071849823, 0.5752781629562378, 0.6571653485298157, 0.7390525341033936, 0.8209396600723267, 0.9028268456459045, 0.9847139716148376, 1.0666011571884155, 1.1484882831573486, 1.2303755283355713, 1.3122626543045044, 1.3941497802734375, 1.4760370254516602, 1.5579241514205933, 1.6398112773895264, 1.721698522567749, 1.8035856485366821, 1.8854728937149048, 1.967360019683838, 2.0492472648620605, 2.131134271621704, 2.2130215167999268, 2.2949085235595703, 2.376795768737793, 2.4586830139160156, 2.540570020675659, 2.622457265853882, 2.7043445110321045, 2.786231517791748, 2.8681187629699707, 2.9500060081481934, 3.031893253326416, 3.1137804985046387, 3.1956675052642822, 3.277554750442505, 3.3594419956207275, 3.441329002380371, 3.5232162475585938, 3.6051034927368164, 3.68699049949646, 3.7688777446746826, 3.850764751434326, 3.932651996612549, 4.0145392417907715, 4.096426486968994, 4.178313255310059, 4.260200500488281, 4.342087745666504]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 6.0, 12.0, 20.0, 33.0, 43.0, 60.0, 104.0, 113.0, 105.0, 124.0, 109.0, 79.0, 52.0, 51.0, 36.0, 25.0, 13.0, 9.0, 7.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8026885986328125, -0.7663175463676453, -0.729946494102478, -0.6935755014419556, -0.6572044491767883, -0.6208333969116211, -0.5844623446464539, -0.5480912923812866, -0.5117202997207642, -0.4753492474555969, -0.4389782249927521, -0.40260717272758484, -0.36623615026474, -0.32986509799957275, -0.2934940457344055, -0.25712302327156067, -0.22075194120407104, -0.184380903840065, -0.14800986647605896, -0.11163881421089172, -0.07526777684688568, -0.03889673948287964, -0.0025256872177124023, 0.033845335245132446, 0.07021638751029968, 0.10658742487430573, 0.14295846223831177, 0.179329514503479, 0.21570055186748505, 0.2520715892314911, 0.2884426414966583, 0.3248136639595032, 0.3611847162246704, 0.39755576848983765, 0.4339267909526825, 0.47029784321784973, 0.5066688656806946, 0.5430399179458618, 0.579410970211029, 0.6157820224761963, 0.6521530151367188, 0.688524067401886, 0.7248951196670532, 0.7612661123275757, 0.7976371645927429, 0.8340082168579102, 0.8703792691230774, 0.9067503213882446, 0.9431213736534119, 0.9794924259185791, 1.0158634185791016, 1.0522345304489136, 1.088605523109436, 1.124976634979248, 1.1613476276397705, 1.197718620300293, 1.234089732170105, 1.2704607248306274, 1.3068318367004395, 1.343202829360962, 1.379573941230774, 1.4159449338912964, 1.4523160457611084, 1.4886870384216309, 1.5250580310821533]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 3.0, 2.0, 3.0, 6.0, 2.0, 3.0, 11.0, 26.0, 51.0, 290.0, 118118.0, 929261.0, 629.0, 50.0, 15.0, 19.0, 10.0, 11.0, 5.0, 4.0, 2.0, 4.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.84765625, -4.62835693359375, -4.4090576171875, -4.18975830078125, -3.970458984375, -3.75115966796875, -3.5318603515625, -3.31256103515625, -3.09326171875, -2.87396240234375, -2.6546630859375, -2.43536376953125, -2.216064453125, -1.99676513671875, -1.7774658203125, -1.55816650390625, -1.3388671875, -1.11956787109375, -0.9002685546875, -0.68096923828125, -0.461669921875, -0.24237060546875, -0.0230712890625, 0.19622802734375, 0.41552734375, 0.63482666015625, 0.8541259765625, 1.07342529296875, 1.292724609375, 1.51202392578125, 1.7313232421875, 1.95062255859375, 2.169921875, 2.38922119140625, 2.6085205078125, 2.82781982421875, 3.047119140625, 3.26641845703125, 3.4857177734375, 3.70501708984375, 3.92431640625, 4.14361572265625, 4.3629150390625, 4.58221435546875, 4.801513671875, 5.02081298828125, 5.2401123046875, 5.45941162109375, 5.6787109375, 5.89801025390625, 6.1173095703125, 6.33660888671875, 6.555908203125, 6.77520751953125, 6.9945068359375, 7.21380615234375, 7.43310546875, 7.65240478515625, 7.8717041015625, 8.09100341796875, 8.310302734375, 8.52960205078125, 8.7489013671875, 8.96820068359375, 9.1875]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 8.0, 24.0, 60.0, 169.0, 236.0, 237.0, 154.0, 72.0, 32.0, 16.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3251953125, -1.1802825927734375, -1.035369873046875, -0.8904571533203125, -0.74554443359375, -0.6006317138671875, -0.455718994140625, -0.3108062744140625, -0.1658935546875, -0.0209808349609375, 0.123931884765625, 0.2688446044921875, 0.41375732421875, 0.5586700439453125, 0.703582763671875, 0.8484954833984375, 0.993408203125, 1.1383209228515625, 1.283233642578125, 1.4281463623046875, 1.57305908203125, 1.7179718017578125, 1.862884521484375, 2.0077972412109375, 2.1527099609375, 2.2976226806640625, 2.442535400390625, 2.5874481201171875, 2.73236083984375, 2.8772735595703125, 3.022186279296875, 3.1670989990234375, 3.31201171875, 3.4569244384765625, 3.601837158203125, 3.7467498779296875, 3.89166259765625, 4.0365753173828125, 4.181488037109375, 4.3264007568359375, 4.4713134765625, 4.6162261962890625, 4.761138916015625, 4.9060516357421875, 5.05096435546875, 5.1958770751953125, 5.340789794921875, 5.4857025146484375, 5.630615234375, 5.7755279541015625, 5.920440673828125, 6.0653533935546875, 6.21026611328125, 6.3551788330078125, 6.500091552734375, 6.6450042724609375, 6.7899169921875, 6.9348297119140625, 7.079742431640625, 7.2246551513671875, 7.36956787109375, 7.5144805908203125, 7.659393310546875, 7.8043060302734375, 7.94921875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 4.0, 6.0, 2.0, 3.0, 12.0, 8.0, 15.0, 21.0, 30.0, 30.0, 54.0, 74.0, 110.0, 157.0, 232.0, 489.0, 1257.0, 5908.0, 67638.0, 916715.0, 48761.0, 4816.0, 1077.0, 407.0, 209.0, 140.0, 86.0, 79.0, 57.0, 39.0, 32.0, 25.0, 14.0, 15.0, 13.0, 10.0, 7.0, 7.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.046875, -1.9891357421875, -1.931396484375, -1.8736572265625, -1.81591796875, -1.7581787109375, -1.700439453125, -1.6427001953125, -1.5849609375, -1.5272216796875, -1.469482421875, -1.4117431640625, -1.35400390625, -1.2962646484375, -1.238525390625, -1.1807861328125, -1.123046875, -1.0653076171875, -1.007568359375, -0.9498291015625, -0.89208984375, -0.8343505859375, -0.776611328125, -0.7188720703125, -0.6611328125, -0.6033935546875, -0.545654296875, -0.4879150390625, -0.43017578125, -0.3724365234375, -0.314697265625, -0.2569580078125, -0.19921875, -0.1414794921875, -0.083740234375, -0.0260009765625, 0.03173828125, 0.0894775390625, 0.147216796875, 0.2049560546875, 0.2626953125, 0.3204345703125, 0.378173828125, 0.4359130859375, 0.49365234375, 0.5513916015625, 0.609130859375, 0.6668701171875, 0.724609375, 0.7823486328125, 0.840087890625, 0.8978271484375, 0.95556640625, 1.0133056640625, 1.071044921875, 1.1287841796875, 1.1865234375, 1.2442626953125, 1.302001953125, 1.3597412109375, 1.41748046875, 1.4752197265625, 1.532958984375, 1.5906982421875, 1.6484375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 4.0, 6.0, 7.0, 13.0, 12.0, 14.0, 14.0, 14.0, 23.0, 15.0, 27.0, 34.0, 33.0, 18.0, 35.0, 53.0, 50.0, 45.0, 39.0, 42.0, 47.0, 45.0, 51.0, 44.0, 32.0, 35.0, 40.0, 26.0, 24.0, 32.0, 20.0, 27.0, 11.0, 15.0, 15.0, 13.0, 8.0, 3.0, 8.0, 5.0, 1.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.0009765625, -0.97216796875, -0.943359375, -0.91455078125, -0.8857421875, -0.85693359375, -0.828125, -0.79931640625, -0.7705078125, -0.74169921875, -0.712890625, -0.68408203125, -0.6552734375, -0.62646484375, -0.59765625, -0.56884765625, -0.5400390625, -0.51123046875, -0.482421875, -0.45361328125, -0.4248046875, -0.39599609375, -0.3671875, -0.33837890625, -0.3095703125, -0.28076171875, -0.251953125, -0.22314453125, -0.1943359375, -0.16552734375, -0.13671875, -0.10791015625, -0.0791015625, -0.05029296875, -0.021484375, 0.00732421875, 0.0361328125, 0.06494140625, 0.09375, 0.12255859375, 0.1513671875, 0.18017578125, 0.208984375, 0.23779296875, 0.2666015625, 0.29541015625, 0.32421875, 0.35302734375, 0.3818359375, 0.41064453125, 0.439453125, 0.46826171875, 0.4970703125, 0.52587890625, 0.5546875, 0.58349609375, 0.6123046875, 0.64111328125, 0.669921875, 0.69873046875, 0.7275390625, 0.75634765625, 0.78515625, 0.81396484375, 0.8427734375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 5.0, 7.0, 17.0, 22.0, 33.0, 73.0, 138.0, 269.0, 580.0, 1540.0, 4740.0, 22099.0, 299289.0, 671176.0, 37910.0, 7101.0, 2088.0, 803.0, 313.0, 149.0, 78.0, 45.0, 24.0, 21.0, 8.0, 6.0, 10.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55224609375, -0.5369644165039062, -0.5216827392578125, -0.5064010620117188, -0.491119384765625, -0.47583770751953125, -0.4605560302734375, -0.44527435302734375, -0.42999267578125, -0.41471099853515625, -0.3994293212890625, -0.38414764404296875, -0.368865966796875, -0.35358428955078125, -0.3383026123046875, -0.32302093505859375, -0.3077392578125, -0.29245758056640625, -0.2771759033203125, -0.26189422607421875, -0.246612548828125, -0.23133087158203125, -0.2160491943359375, -0.20076751708984375, -0.18548583984375, -0.17020416259765625, -0.1549224853515625, -0.13964080810546875, -0.124359130859375, -0.10907745361328125, -0.0937957763671875, -0.07851409912109375, -0.063232421875, -0.04795074462890625, -0.0326690673828125, -0.01738739013671875, -0.002105712890625, 0.01317596435546875, 0.0284576416015625, 0.04373931884765625, 0.05902099609375, 0.07430267333984375, 0.0895843505859375, 0.10486602783203125, 0.120147705078125, 0.13542938232421875, 0.1507110595703125, 0.16599273681640625, 0.1812744140625, 0.19655609130859375, 0.2118377685546875, 0.22711944580078125, 0.242401123046875, 0.25768280029296875, 0.2729644775390625, 0.28824615478515625, 0.30352783203125, 0.31880950927734375, 0.3340911865234375, 0.34937286376953125, 0.364654541015625, 0.37993621826171875, 0.3952178955078125, 0.41049957275390625, 0.42578125]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 3.0, 3.0, 7.0, 3.0, 11.0, 11.0, 17.0, 30.0, 54.0, 85.0, 135.0, 211.0, 156.0, 125.0, 53.0, 32.0, 18.0, 17.0, 8.0, 9.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7738037109375e-05, -8.5475854575634e-05, -8.3213672041893e-05, -8.095148950815201e-05, -7.868930697441101e-05, -7.642712444067001e-05, -7.416494190692902e-05, -7.190275937318802e-05, -6.964057683944702e-05, -6.737839430570602e-05, -6.511621177196503e-05, -6.285402923822403e-05, -6.059184670448303e-05, -5.8329664170742035e-05, -5.606748163700104e-05, -5.380529910326004e-05, -5.154311656951904e-05, -4.9280934035778046e-05, -4.701875150203705e-05, -4.475656896829605e-05, -4.2494386434555054e-05, -4.0232203900814056e-05, -3.797002136707306e-05, -3.570783883333206e-05, -3.3445656299591064e-05, -3.118347376585007e-05, -2.892129123210907e-05, -2.6659108698368073e-05, -2.4396926164627075e-05, -2.2134743630886078e-05, -1.987256109714508e-05, -1.7610378563404083e-05, -1.5348196029663086e-05, -1.3086013495922089e-05, -1.0823830962181091e-05, -8.561648428440094e-06, -6.299465894699097e-06, -4.037283360958099e-06, -1.775100827217102e-06, 4.870817065238953e-07, 2.7492642402648926e-06, 5.01144677400589e-06, 7.273629307746887e-06, 9.535811841487885e-06, 1.1797994375228882e-05, 1.4060176908969879e-05, 1.6322359442710876e-05, 1.8584541976451874e-05, 2.084672451019287e-05, 2.310890704393387e-05, 2.5371089577674866e-05, 2.7633272111415863e-05, 2.989545464515686e-05, 3.215763717889786e-05, 3.4419819712638855e-05, 3.668200224637985e-05, 3.894418478012085e-05, 4.120636731386185e-05, 4.3468549847602844e-05, 4.573073238134384e-05, 4.799291491508484e-05, 5.0255097448825836e-05, 5.2517279982566833e-05, 5.477946251630783e-05, 5.704164505004883e-05]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 11.0, 6.0, 7.0, 8.0, 10.0, 28.0, 28.0, 40.0, 58.0, 105.0, 140.0, 302.0, 611.0, 1483.0, 4819.0, 20521.0, 159645.0, 744476.0, 95794.0, 14555.0, 3583.0, 1249.0, 463.0, 241.0, 118.0, 71.0, 56.0, 33.0, 26.0, 18.0, 11.0, 8.0, 7.0, 8.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.4619140625, -0.4492225646972656, -0.43653106689453125, -0.4238395690917969, -0.4111480712890625, -0.3984565734863281, -0.38576507568359375, -0.3730735778808594, -0.360382080078125, -0.3476905822753906, -0.33499908447265625, -0.3223075866699219, -0.3096160888671875, -0.2969245910644531, -0.28423309326171875, -0.2715415954589844, -0.25885009765625, -0.24615859985351562, -0.23346710205078125, -0.22077560424804688, -0.2080841064453125, -0.19539260864257812, -0.18270111083984375, -0.17000961303710938, -0.157318115234375, -0.14462661743164062, -0.13193511962890625, -0.11924362182617188, -0.1065521240234375, -0.09386062622070312, -0.08116912841796875, -0.06847763061523438, -0.0557861328125, -0.043094635009765625, -0.03040313720703125, -0.017711639404296875, -0.0050201416015625, 0.007671356201171875, 0.02036285400390625, 0.033054351806640625, 0.045745849609375, 0.058437347412109375, 0.07112884521484375, 0.08382034301757812, 0.0965118408203125, 0.10920333862304688, 0.12189483642578125, 0.13458633422851562, 0.14727783203125, 0.15996932983398438, 0.17266082763671875, 0.18535232543945312, 0.1980438232421875, 0.21073532104492188, 0.22342681884765625, 0.23611831665039062, 0.248809814453125, 0.2615013122558594, 0.27419281005859375, 0.2868843078613281, 0.2995758056640625, 0.3122673034667969, 0.32495880126953125, 0.3376502990722656, 0.350341796875]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 6.0, 4.0, 10.0, 12.0, 13.0, 12.0, 16.0, 27.0, 30.0, 36.0, 60.0, 57.0, 84.0, 96.0, 80.0, 94.0, 71.0, 63.0, 41.0, 37.0, 36.0, 28.0, 19.0, 12.0, 6.0, 8.0, 6.0, 10.0, 6.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1339111328125, -0.13061046600341797, -0.12730979919433594, -0.1240091323852539, -0.12070846557617188, -0.11740779876708984, -0.11410713195800781, -0.11080646514892578, -0.10750579833984375, -0.10420513153076172, -0.10090446472167969, -0.09760379791259766, -0.09430313110351562, -0.0910024642944336, -0.08770179748535156, -0.08440113067626953, -0.0811004638671875, -0.07779979705810547, -0.07449913024902344, -0.0711984634399414, -0.06789779663085938, -0.06459712982177734, -0.06129646301269531, -0.05799579620361328, -0.05469512939453125, -0.05139446258544922, -0.04809379577636719, -0.044793128967285156, -0.041492462158203125, -0.038191795349121094, -0.03489112854003906, -0.03159046173095703, -0.028289794921875, -0.02498912811279297, -0.021688461303710938, -0.018387794494628906, -0.015087127685546875, -0.011786460876464844, -0.008485794067382812, -0.005185127258300781, -0.00188446044921875, 0.0014162063598632812, 0.0047168731689453125, 0.008017539978027344, 0.011318206787109375, 0.014618873596191406, 0.017919540405273438, 0.02122020721435547, 0.0245208740234375, 0.02782154083251953, 0.031122207641601562, 0.034422874450683594, 0.037723541259765625, 0.041024208068847656, 0.04432487487792969, 0.04762554168701172, 0.05092620849609375, 0.05422687530517578, 0.05752754211425781, 0.060828208923339844, 0.06412887573242188, 0.0674295425415039, 0.07073020935058594, 0.07403087615966797, 0.07733154296875]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 1.0, 5.0, 10.0, 15.0, 29.0, 53.0, 108.0, 180.0, 245.0, 176.0, 108.0, 38.0, 12.0, 11.0, 8.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.972425103187561, -1.8594374656677246, -1.7464498281478882, -1.6334621906280518, -1.5204745531082153, -1.407486915588379, -1.2944992780685425, -1.181511640548706, -1.0685240030288696, -0.9555363655090332, -0.8425487279891968, -0.7295610904693604, -0.6165734529495239, -0.5035858154296875, -0.3905981779098511, -0.27761054039001465, -0.16462290287017822, -0.0516352653503418, 0.06135237216949463, 0.17434000968933105, 0.2873276472091675, 0.4003152847290039, 0.5133029222488403, 0.6262905597686768, 0.7392781972885132, 0.8522658348083496, 0.965253472328186, 1.0782411098480225, 1.1912287473678589, 1.3042163848876953, 1.4172040224075317, 1.5301916599273682, 1.6431794166564941, 1.7561670541763306, 1.869154691696167, 1.9821423292160034, 2.09512996673584, 2.2081174850463867, 2.3211052417755127, 2.4340929985046387, 2.5470805168151855, 2.6600680351257324, 2.7730557918548584, 2.8860435485839844, 2.9990310668945312, 3.112018585205078, 3.225006341934204, 3.33799409866333, 3.450981616973877, 3.563969135284424, 3.67695689201355, 3.789944648742676, 3.9029321670532227, 4.0159196853637695, 4.128907203674316, 4.2418951988220215, 4.354882717132568, 4.467870235443115, 4.58085823059082, 4.693845748901367, 4.806833267211914, 4.919820785522461, 5.032808303833008, 5.145796298980713, 5.25878381729126]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 6.0, 7.0, 15.0, 24.0, 52.0, 75.0, 96.0, 141.0, 112.0, 136.0, 100.0, 87.0, 75.0, 36.0, 24.0, 17.0, 7.0, 6.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6904497146606445, -1.5481576919555664, -1.4058656692504883, -1.2635736465454102, -1.121281623840332, -0.9789896607398987, -0.8366976976394653, -0.6944056749343872, -0.5521136522293091, -0.40982162952423096, -0.2675296366214752, -0.12523764371871948, 0.017054378986358643, 0.15934640169143677, 0.3016383647918701, 0.44393038749694824, 0.5862224102020264, 0.7285144329071045, 0.8708064556121826, 1.0130984783172607, 1.1553905010223389, 1.297682523727417, 1.4399744272232056, 1.5822664499282837, 1.7245584726333618, 1.86685049533844, 2.0091423988342285, 2.1514344215393066, 2.2937264442443848, 2.436018466949463, 2.578310489654541, 2.720602512359619, 2.8628945350646973, 3.0051865577697754, 3.1474785804748535, 3.2897706031799316, 3.4320626258850098, 3.574354648590088, 3.716646671295166, 3.858938694000244, 4.001230716705322, 4.1435227394104, 4.2858147621154785, 4.428106784820557, 4.570398807525635, 4.712690830230713, 4.854982852935791, 4.997274875640869, 5.139566421508789, 5.281858444213867, 5.424150466918945, 5.566442489624023, 5.708734512329102, 5.85102653503418, 5.993318557739258, 6.135610580444336, 6.277902603149414, 6.420194625854492, 6.56248664855957, 6.704778671264648, 6.847070693969727, 6.989362716674805, 7.131654739379883, 7.273946762084961, 7.416238784790039]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 7.0, 10.0, 16.0, 22.0, 24.0, 49.0, 45.0, 95.0, 176.0, 316.0, 674.0, 1727.0, 7051.0, 70898.0, 3045925.0, 1032637.0, 26775.0, 4720.0, 1600.0, 662.0, 314.0, 191.0, 118.0, 71.0, 34.0, 32.0, 21.0, 14.0, 12.0, 15.0, 4.0, 6.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-2.14453125, -2.0811614990234375, -2.017791748046875, -1.9544219970703125, -1.89105224609375, -1.8276824951171875, -1.764312744140625, -1.7009429931640625, -1.6375732421875, -1.5742034912109375, -1.510833740234375, -1.4474639892578125, -1.38409423828125, -1.3207244873046875, -1.257354736328125, -1.1939849853515625, -1.130615234375, -1.0672454833984375, -1.003875732421875, -0.9405059814453125, -0.87713623046875, -0.8137664794921875, -0.750396728515625, -0.6870269775390625, -0.6236572265625, -0.5602874755859375, -0.496917724609375, -0.4335479736328125, -0.37017822265625, -0.3068084716796875, -0.243438720703125, -0.1800689697265625, -0.11669921875, -0.0533294677734375, 0.010040283203125, 0.0734100341796875, 0.13677978515625, 0.2001495361328125, 0.263519287109375, 0.3268890380859375, 0.3902587890625, 0.4536285400390625, 0.516998291015625, 0.5803680419921875, 0.64373779296875, 0.7071075439453125, 0.770477294921875, 0.8338470458984375, 0.897216796875, 0.9605865478515625, 1.023956298828125, 1.0873260498046875, 1.15069580078125, 1.2140655517578125, 1.277435302734375, 1.3408050537109375, 1.4041748046875, 1.4675445556640625, 1.530914306640625, 1.5942840576171875, 1.65765380859375, 1.7210235595703125, 1.784393310546875, 1.8477630615234375, 1.9111328125]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 6.0, 3.0, 9.0, 9.0, 11.0, 27.0, 20.0, 23.0, 43.0, 50.0, 59.0, 63.0, 63.0, 78.0, 66.0, 59.0, 76.0, 57.0, 58.0, 49.0, 26.0, 37.0, 27.0, 18.0, 18.0, 7.0, 15.0, 5.0, 3.0, 7.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9248046875, -0.895538330078125, -0.86627197265625, -0.837005615234375, -0.8077392578125, -0.778472900390625, -0.74920654296875, -0.719940185546875, -0.690673828125, -0.661407470703125, -0.63214111328125, -0.602874755859375, -0.5736083984375, -0.544342041015625, -0.51507568359375, -0.485809326171875, -0.45654296875, -0.427276611328125, -0.39801025390625, -0.368743896484375, -0.3394775390625, -0.310211181640625, -0.28094482421875, -0.251678466796875, -0.222412109375, -0.193145751953125, -0.16387939453125, -0.134613037109375, -0.1053466796875, -0.076080322265625, -0.04681396484375, -0.017547607421875, 0.01171875, 0.040985107421875, 0.07025146484375, 0.099517822265625, 0.1287841796875, 0.158050537109375, 0.18731689453125, 0.216583251953125, 0.245849609375, 0.275115966796875, 0.30438232421875, 0.333648681640625, 0.3629150390625, 0.392181396484375, 0.42144775390625, 0.450714111328125, 0.47998046875, 0.509246826171875, 0.53851318359375, 0.567779541015625, 0.5970458984375, 0.626312255859375, 0.65557861328125, 0.684844970703125, 0.714111328125, 0.743377685546875, 0.77264404296875, 0.801910400390625, 0.8311767578125, 0.860443115234375, 0.88970947265625, 0.918975830078125, 0.9482421875]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 2.0, 8.0, 4.0, 9.0, 8.0, 22.0, 20.0, 53.0, 85.0, 199.0, 448.0, 1291.0, 6256.0, 89882.0, 3965488.0, 121010.0, 7088.0, 1439.0, 489.0, 198.0, 118.0, 62.0, 46.0, 21.0, 12.0, 4.0, 6.0, 7.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5341796875, -1.4661102294921875, -1.398040771484375, -1.3299713134765625, -1.26190185546875, -1.1938323974609375, -1.125762939453125, -1.0576934814453125, -0.9896240234375, -0.9215545654296875, -0.853485107421875, -0.7854156494140625, -0.71734619140625, -0.6492767333984375, -0.581207275390625, -0.5131378173828125, -0.445068359375, -0.3769989013671875, -0.308929443359375, -0.2408599853515625, -0.17279052734375, -0.1047210693359375, -0.036651611328125, 0.0314178466796875, 0.0994873046875, 0.1675567626953125, 0.235626220703125, 0.3036956787109375, 0.37176513671875, 0.4398345947265625, 0.507904052734375, 0.5759735107421875, 0.64404296875, 0.7121124267578125, 0.780181884765625, 0.8482513427734375, 0.91632080078125, 0.9843902587890625, 1.052459716796875, 1.1205291748046875, 1.1885986328125, 1.2566680908203125, 1.324737548828125, 1.3928070068359375, 1.46087646484375, 1.5289459228515625, 1.597015380859375, 1.6650848388671875, 1.733154296875, 1.8012237548828125, 1.869293212890625, 1.9373626708984375, 2.00543212890625, 2.0735015869140625, 2.141571044921875, 2.2096405029296875, 2.2777099609375, 2.3457794189453125, 2.413848876953125, 2.4819183349609375, 2.54998779296875, 2.6180572509765625, 2.686126708984375, 2.7541961669921875, 2.822265625]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 9.0, 17.0, 17.0, 41.0, 69.0, 75.0, 142.0, 252.0, 472.0, 808.0, 920.0, 534.0, 294.0, 157.0, 93.0, 56.0, 40.0, 23.0, 11.0, 8.0, 11.0, 6.0, 9.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.472412109375, -0.46062469482421875, -0.4488372802734375, -0.43704986572265625, -0.425262451171875, -0.41347503662109375, -0.4016876220703125, -0.38990020751953125, -0.37811279296875, -0.36632537841796875, -0.3545379638671875, -0.34275054931640625, -0.330963134765625, -0.31917572021484375, -0.3073883056640625, -0.29560089111328125, -0.2838134765625, -0.27202606201171875, -0.2602386474609375, -0.24845123291015625, -0.236663818359375, -0.22487640380859375, -0.2130889892578125, -0.20130157470703125, -0.18951416015625, -0.17772674560546875, -0.1659393310546875, -0.15415191650390625, -0.142364501953125, -0.13057708740234375, -0.1187896728515625, -0.10700225830078125, -0.09521484375, -0.08342742919921875, -0.0716400146484375, -0.05985260009765625, -0.048065185546875, -0.03627777099609375, -0.0244903564453125, -0.01270294189453125, -0.00091552734375, 0.01087188720703125, 0.0226593017578125, 0.03444671630859375, 0.046234130859375, 0.05802154541015625, 0.0698089599609375, 0.08159637451171875, 0.0933837890625, 0.10517120361328125, 0.1169586181640625, 0.12874603271484375, 0.140533447265625, 0.15232086181640625, 0.1641082763671875, 0.17589569091796875, 0.18768310546875, 0.19947052001953125, 0.2112579345703125, 0.22304534912109375, 0.234832763671875, 0.24662017822265625, 0.2584075927734375, 0.27019500732421875, 0.281982421875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 9.0, 9.0, 8.0, 15.0, 11.0, 37.0, 52.0, 84.0, 111.0, 120.0, 148.0, 121.0, 96.0, 61.0, 48.0, 22.0, 12.0, 8.0, 14.0, 4.0, 4.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.199275255203247, -1.149665117263794, -1.1000548601150513, -1.0504447221755981, -1.0008344650268555, -0.9512243270874023, -0.9016141295433044, -0.8520039319992065, -0.8023937940597534, -0.7527835965156555, -0.7031733989715576, -0.6535632610321045, -0.6039530634880066, -0.5543428659439087, -0.5047326683998108, -0.4551225006580353, -0.405512273311615, -0.3559020757675171, -0.3062919080257416, -0.2566817104816437, -0.20707152783870697, -0.15746134519577026, -0.10785114765167236, -0.05824097990989685, -0.00863078236579895, 0.040979404002428055, 0.09058959037065506, 0.14019978046417236, 0.18980996310710907, 0.23942014575004578, 0.2890303432941437, 0.3386405110359192, 0.3882507085800171, 0.437860906124115, 0.4874710738658905, 0.537081241607666, 0.5866914391517639, 0.6363016366958618, 0.6859118342399597, 0.7355220317840576, 0.7851321697235107, 0.8347423672676086, 0.8843525648117065, 0.9339627027511597, 0.9835729002952576, 1.0331830978393555, 1.0827932357788086, 1.1324034929275513, 1.182013750076294, 1.231623888015747, 1.2812341451644897, 1.3308442831039429, 1.3804545402526855, 1.4300646781921387, 1.4796748161315918, 1.5292850732803345, 1.5788952112197876, 1.6285053491592407, 1.6781156063079834, 1.7277257442474365, 1.7773360013961792, 1.8269461393356323, 1.876556396484375, 1.9261665344238281, 1.9757766723632812]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 4.0, 17.0, 10.0, 11.0, 17.0, 18.0, 14.0, 23.0, 33.0, 35.0, 46.0, 55.0, 48.0, 54.0, 43.0, 60.0, 53.0, 55.0, 45.0, 65.0, 52.0, 40.0, 34.0, 33.0, 23.0, 19.0, 23.0, 13.0, 18.0, 8.0, 6.0, 6.0, 4.0, 6.0, 4.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.9184392690658569, -0.8921825289726257, -0.8659257888793945, -0.8396690487861633, -0.8134123086929321, -0.7871555685997009, -0.7608988285064697, -0.7346420884132385, -0.7083853483200073, -0.6821286082267761, -0.6558718681335449, -0.6296151280403137, -0.6033583879470825, -0.5771016478538513, -0.5508449077606201, -0.5245881676673889, -0.4983313977718353, -0.4720746576786041, -0.4458179175853729, -0.4195611774921417, -0.3933044373989105, -0.36704766750335693, -0.34079092741012573, -0.31453418731689453, -0.28827744722366333, -0.26202070713043213, -0.23576396703720093, -0.20950722694396973, -0.18325048685073853, -0.15699373185634613, -0.13073699176311493, -0.10448025166988373, -0.07822352647781372, -0.05196678638458252, -0.02571004256606102, 0.0005467012524604797, 0.02680344134569168, 0.05306018888950348, 0.07931692898273468, 0.10557366907596588, 0.13183040916919708, 0.15808714926242828, 0.18434388935565948, 0.21060064435005188, 0.23685738444328308, 0.2631141245365143, 0.2893708646297455, 0.3156276047229767, 0.3418843448162079, 0.3681410849094391, 0.3943978250026703, 0.4206545650959015, 0.4469113051891327, 0.4731680750846863, 0.4994248151779175, 0.5256815552711487, 0.5519382953643799, 0.5781950354576111, 0.6044517755508423, 0.6307085156440735, 0.6569652557373047, 0.6832219958305359, 0.7094787359237671, 0.7357354760169983, 0.7619922161102295]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 5.0, 6.0, 13.0, 9.0, 33.0, 80.0, 270.0, 1158.0, 5663.0, 66484.0, 951454.0, 19096.0, 3239.0, 718.0, 183.0, 57.0, 22.0, 19.0, 13.0, 5.0, 3.0, 2.0, 2.0, 4.0, 3.0, 1.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.17578125, -1.1442794799804688, -1.1127777099609375, -1.0812759399414062, -1.049774169921875, -1.0182723999023438, -0.9867706298828125, -0.9552688598632812, -0.92376708984375, -0.8922653198242188, -0.8607635498046875, -0.8292617797851562, -0.797760009765625, -0.7662582397460938, -0.7347564697265625, -0.7032546997070312, -0.6717529296875, -0.6402511596679688, -0.6087493896484375, -0.5772476196289062, -0.545745849609375, -0.5142440795898438, -0.4827423095703125, -0.45124053955078125, -0.41973876953125, -0.38823699951171875, -0.3567352294921875, -0.32523345947265625, -0.293731689453125, -0.26222991943359375, -0.2307281494140625, -0.19922637939453125, -0.167724609375, -0.13622283935546875, -0.1047210693359375, -0.07321929931640625, -0.041717529296875, -0.01021575927734375, 0.0212860107421875, 0.05278778076171875, 0.08428955078125, 0.11579132080078125, 0.1472930908203125, 0.17879486083984375, 0.210296630859375, 0.24179840087890625, 0.2733001708984375, 0.30480194091796875, 0.3363037109375, 0.36780548095703125, 0.3993072509765625, 0.43080902099609375, 0.462310791015625, 0.49381256103515625, 0.5253143310546875, 0.5568161010742188, 0.58831787109375, 0.6198196411132812, 0.6513214111328125, 0.6828231811523438, 0.714324951171875, 0.7458267211914062, 0.7773284912109375, 0.8088302612304688, 0.84033203125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 7.0, 17.0, 28.0, 30.0, 38.0, 60.0, 64.0, 83.0, 97.0, 103.0, 118.0, 94.0, 79.0, 57.0, 47.0, 25.0, 14.0, 14.0, 9.0, 6.0, 8.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1435546875, -1.110504150390625, -1.07745361328125, -1.044403076171875, -1.0113525390625, -0.978302001953125, -0.94525146484375, -0.912200927734375, -0.879150390625, -0.846099853515625, -0.81304931640625, -0.779998779296875, -0.7469482421875, -0.713897705078125, -0.68084716796875, -0.647796630859375, -0.61474609375, -0.581695556640625, -0.54864501953125, -0.515594482421875, -0.4825439453125, -0.449493408203125, -0.41644287109375, -0.383392333984375, -0.350341796875, -0.317291259765625, -0.28424072265625, -0.251190185546875, -0.2181396484375, -0.185089111328125, -0.15203857421875, -0.118988037109375, -0.0859375, -0.052886962890625, -0.01983642578125, 0.013214111328125, 0.0462646484375, 0.079315185546875, 0.11236572265625, 0.145416259765625, 0.178466796875, 0.211517333984375, 0.24456787109375, 0.277618408203125, 0.3106689453125, 0.343719482421875, 0.37677001953125, 0.409820556640625, 0.44287109375, 0.475921630859375, 0.50897216796875, 0.542022705078125, 0.5750732421875, 0.608123779296875, 0.64117431640625, 0.674224853515625, 0.707275390625, 0.740325927734375, 0.77337646484375, 0.806427001953125, 0.8394775390625, 0.872528076171875, 0.90557861328125, 0.938629150390625, 0.9716796875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 4.0, 6.0, 6.0, 11.0, 12.0, 12.0, 15.0, 34.0, 38.0, 76.0, 149.0, 344.0, 807.0, 2197.0, 6938.0, 33356.0, 571832.0, 399256.0, 24544.0, 5768.0, 1855.0, 690.0, 248.0, 125.0, 82.0, 41.0, 29.0, 18.0, 15.0, 17.0, 4.0, 7.0, 8.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.422119140625, -0.40889739990234375, -0.3956756591796875, -0.38245391845703125, -0.369232177734375, -0.35601043701171875, -0.3427886962890625, -0.32956695556640625, -0.31634521484375, -0.30312347412109375, -0.2899017333984375, -0.27667999267578125, -0.263458251953125, -0.25023651123046875, -0.2370147705078125, -0.22379302978515625, -0.2105712890625, -0.19734954833984375, -0.1841278076171875, -0.17090606689453125, -0.157684326171875, -0.14446258544921875, -0.1312408447265625, -0.11801910400390625, -0.10479736328125, -0.09157562255859375, -0.0783538818359375, -0.06513214111328125, -0.051910400390625, -0.03868865966796875, -0.0254669189453125, -0.01224517822265625, 0.0009765625, 0.01419830322265625, 0.0274200439453125, 0.04064178466796875, 0.053863525390625, 0.06708526611328125, 0.0803070068359375, 0.09352874755859375, 0.10675048828125, 0.11997222900390625, 0.1331939697265625, 0.14641571044921875, 0.159637451171875, 0.17285919189453125, 0.1860809326171875, 0.19930267333984375, 0.2125244140625, 0.22574615478515625, 0.2389678955078125, 0.25218963623046875, 0.265411376953125, 0.27863311767578125, 0.2918548583984375, 0.30507659912109375, 0.31829833984375, 0.33152008056640625, 0.3447418212890625, 0.35796356201171875, 0.371185302734375, 0.38440704345703125, 0.3976287841796875, 0.41085052490234375, 0.424072265625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 5.0, 5.0, 2.0, 6.0, 8.0, 12.0, 17.0, 19.0, 23.0, 20.0, 37.0, 25.0, 46.0, 42.0, 41.0, 46.0, 48.0, 54.0, 52.0, 54.0, 54.0, 53.0, 46.0, 37.0, 34.0, 32.0, 35.0, 32.0, 22.0, 18.0, 9.0, 12.0, 11.0, 10.0, 9.0, 6.0, 0.0, 5.0, 7.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.982421875, -0.949737548828125, -0.91705322265625, -0.884368896484375, -0.8516845703125, -0.819000244140625, -0.78631591796875, -0.753631591796875, -0.720947265625, -0.688262939453125, -0.65557861328125, -0.622894287109375, -0.5902099609375, -0.557525634765625, -0.52484130859375, -0.492156982421875, -0.45947265625, -0.426788330078125, -0.39410400390625, -0.361419677734375, -0.3287353515625, -0.296051025390625, -0.26336669921875, -0.230682373046875, -0.197998046875, -0.165313720703125, -0.13262939453125, -0.099945068359375, -0.0672607421875, -0.034576416015625, -0.00189208984375, 0.030792236328125, 0.0634765625, 0.096160888671875, 0.12884521484375, 0.161529541015625, 0.1942138671875, 0.226898193359375, 0.25958251953125, 0.292266845703125, 0.324951171875, 0.357635498046875, 0.39031982421875, 0.423004150390625, 0.4556884765625, 0.488372802734375, 0.52105712890625, 0.553741455078125, 0.58642578125, 0.619110107421875, 0.65179443359375, 0.684478759765625, 0.7171630859375, 0.749847412109375, 0.78253173828125, 0.815216064453125, 0.847900390625, 0.880584716796875, 0.91326904296875, 0.945953369140625, 0.9786376953125, 1.011322021484375, 1.04400634765625, 1.076690673828125, 1.109375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 8.0, 4.0, 4.0, 7.0, 11.0, 13.0, 22.0, 38.0, 42.0, 80.0, 97.0, 164.0, 270.0, 481.0, 770.0, 1370.0, 2578.0, 5538.0, 13648.0, 41015.0, 176259.0, 528286.0, 205106.0, 45867.0, 14703.0, 5907.0, 2816.0, 1410.0, 801.0, 470.0, 260.0, 166.0, 110.0, 72.0, 41.0, 37.0, 23.0, 16.0, 5.0, 15.0, 8.0, 9.0, 3.0, 4.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06463623046875, -0.06244850158691406, -0.060260772705078125, -0.05807304382324219, -0.05588531494140625, -0.05369758605957031, -0.051509857177734375, -0.04932212829589844, -0.0471343994140625, -0.04494667053222656, -0.042758941650390625, -0.04057121276855469, -0.03838348388671875, -0.03619575500488281, -0.034008026123046875, -0.03182029724121094, -0.029632568359375, -0.027444839477539062, -0.025257110595703125, -0.023069381713867188, -0.02088165283203125, -0.018693923950195312, -0.016506195068359375, -0.014318466186523438, -0.0121307373046875, -0.009943008422851562, -0.007755279541015625, -0.0055675506591796875, -0.00337982177734375, -0.0011920928955078125, 0.000995635986328125, 0.0031833648681640625, 0.00537109375, 0.0075588226318359375, 0.009746551513671875, 0.011934280395507812, 0.01412200927734375, 0.016309738159179688, 0.018497467041015625, 0.020685195922851562, 0.0228729248046875, 0.025060653686523438, 0.027248382568359375, 0.029436111450195312, 0.03162384033203125, 0.03381156921386719, 0.035999298095703125, 0.03818702697753906, 0.040374755859375, 0.04256248474121094, 0.044750213623046875, 0.04693794250488281, 0.04912567138671875, 0.05131340026855469, 0.053501129150390625, 0.05568885803222656, 0.0578765869140625, 0.06006431579589844, 0.062252044677734375, 0.06443977355957031, 0.06662750244140625, 0.06881523132324219, 0.07100296020507812, 0.07319068908691406, 0.07537841796875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 8.0, 11.0, 9.0, 15.0, 18.0, 26.0, 42.0, 36.0, 73.0, 72.0, 115.0, 95.0, 100.0, 83.0, 58.0, 47.0, 38.0, 40.0, 17.0, 18.0, 12.0, 6.0, 11.0, 7.0, 6.0, 9.0, 4.0, 1.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.124641418457031e-05, -4.0055252611637115e-05, -3.886409103870392e-05, -3.767292946577072e-05, -3.6481767892837524e-05, -3.529060631990433e-05, -3.409944474697113e-05, -3.290828317403793e-05, -3.1717121601104736e-05, -3.052596002817154e-05, -2.9334798455238342e-05, -2.8143636882305145e-05, -2.6952475309371948e-05, -2.576131373643875e-05, -2.4570152163505554e-05, -2.3378990590572357e-05, -2.218782901763916e-05, -2.0996667444705963e-05, -1.9805505871772766e-05, -1.861434429883957e-05, -1.7423182725906372e-05, -1.6232021152973175e-05, -1.5040859580039978e-05, -1.3849698007106781e-05, -1.2658536434173584e-05, -1.1467374861240387e-05, -1.027621328830719e-05, -9.085051715373993e-06, -7.893890142440796e-06, -6.702728569507599e-06, -5.511566996574402e-06, -4.320405423641205e-06, -3.129243850708008e-06, -1.938082277774811e-06, -7.469207048416138e-07, 4.4424086809158325e-07, 1.6354024410247803e-06, 2.8265640139579773e-06, 4.017725586891174e-06, 5.208887159824371e-06, 6.400048732757568e-06, 7.591210305690765e-06, 8.782371878623962e-06, 9.97353345155716e-06, 1.1164695024490356e-05, 1.2355856597423553e-05, 1.354701817035675e-05, 1.4738179743289948e-05, 1.5929341316223145e-05, 1.712050288915634e-05, 1.831166446208954e-05, 1.9502826035022736e-05, 2.0693987607955933e-05, 2.188514918088913e-05, 2.3076310753822327e-05, 2.4267472326755524e-05, 2.545863389968872e-05, 2.6649795472621918e-05, 2.7840957045555115e-05, 2.9032118618488312e-05, 3.022328019142151e-05, 3.1414441764354706e-05, 3.26056033372879e-05, 3.37967649102211e-05, 3.49879264831543e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 7.0, 10.0, 13.0, 14.0, 31.0, 42.0, 62.0, 108.0, 197.0, 326.0, 592.0, 1026.0, 2129.0, 4829.0, 12492.0, 40332.0, 169951.0, 510137.0, 227771.0, 52315.0, 15189.0, 5625.0, 2646.0, 1198.0, 605.0, 365.0, 202.0, 125.0, 58.0, 48.0, 32.0, 20.0, 18.0, 12.0, 5.0, 9.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.068115234375, -0.06608772277832031, -0.06406021118164062, -0.06203269958496094, -0.06000518798828125, -0.05797767639160156, -0.055950164794921875, -0.05392265319824219, -0.0518951416015625, -0.04986763000488281, -0.047840118408203125, -0.04581260681152344, -0.04378509521484375, -0.04175758361816406, -0.039730072021484375, -0.03770256042480469, -0.035675048828125, -0.03364753723144531, -0.031620025634765625, -0.029592514038085938, -0.02756500244140625, -0.025537490844726562, -0.023509979248046875, -0.021482467651367188, -0.0194549560546875, -0.017427444458007812, -0.015399932861328125, -0.013372421264648438, -0.01134490966796875, -0.009317398071289062, -0.007289886474609375, -0.0052623748779296875, -0.00323486328125, -0.0012073516845703125, 0.000820159912109375, 0.0028476715087890625, 0.00487518310546875, 0.0069026947021484375, 0.008930206298828125, 0.010957717895507812, 0.0129852294921875, 0.015012741088867188, 0.017040252685546875, 0.019067764282226562, 0.02109527587890625, 0.023122787475585938, 0.025150299072265625, 0.027177810668945312, 0.029205322265625, 0.031232833862304688, 0.033260345458984375, 0.03528785705566406, 0.03731536865234375, 0.03934288024902344, 0.041370391845703125, 0.04339790344238281, 0.0454254150390625, 0.04745292663574219, 0.049480438232421875, 0.05150794982910156, 0.05353546142578125, 0.05556297302246094, 0.057590484619140625, 0.05961799621582031, 0.0616455078125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 12.0, 3.0, 12.0, 19.0, 21.0, 28.0, 34.0, 43.0, 68.0, 86.0, 83.0, 82.0, 79.0, 85.0, 77.0, 68.0, 51.0, 30.0, 34.0, 25.0, 16.0, 11.0, 10.0, 1.0, 8.0, 3.0, 2.0, 4.0, 1.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01861572265625, -0.018034696578979492, -0.017453670501708984, -0.016872644424438477, -0.01629161834716797, -0.01571059226989746, -0.015129566192626953, -0.014548540115356445, -0.013967514038085938, -0.01338648796081543, -0.012805461883544922, -0.012224435806274414, -0.011643409729003906, -0.011062383651733398, -0.01048135757446289, -0.009900331497192383, -0.009319305419921875, -0.008738279342651367, -0.00815725326538086, -0.0075762271881103516, -0.006995201110839844, -0.006414175033569336, -0.005833148956298828, -0.00525212287902832, -0.0046710968017578125, -0.004090070724487305, -0.003509044647216797, -0.002928018569946289, -0.0023469924926757812, -0.0017659664154052734, -0.0011849403381347656, -0.0006039142608642578, -2.288818359375e-05, 0.0005581378936767578, 0.0011391639709472656, 0.0017201900482177734, 0.0023012161254882812, 0.002882242202758789, 0.003463268280029297, 0.004044294357299805, 0.0046253204345703125, 0.00520634651184082, 0.005787372589111328, 0.006368398666381836, 0.006949424743652344, 0.0075304508209228516, 0.00811147689819336, 0.008692502975463867, 0.009273529052734375, 0.009854555130004883, 0.01043558120727539, 0.011016607284545898, 0.011597633361816406, 0.012178659439086914, 0.012759685516357422, 0.01334071159362793, 0.013921737670898438, 0.014502763748168945, 0.015083789825439453, 0.01566481590270996, 0.01624584197998047, 0.016826868057250977, 0.017407894134521484, 0.017988920211791992, 0.0185699462890625]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 2.0, 11.0, 19.0, 30.0, 119.0, 280.0, 327.0, 150.0, 43.0, 18.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7110267281532288, -0.6329634189605713, -0.5549001693725586, -0.4768368601799011, -0.39877355098724365, -0.3207102417945862, -0.2426469624042511, -0.16458368301391602, -0.08652037382125854, -0.008457079529762268, 0.06960621476173401, 0.14766950905323029, 0.22573280334472656, 0.30379611253738403, 0.3818593919277191, 0.4599226713180542, 0.5379859805107117, 0.6160492897033691, 0.6941125392913818, 0.7721758484840393, 0.8502391576766968, 0.9283024668693542, 1.0063657760620117, 1.0844290256500244, 1.162492275238037, 1.2405555248260498, 1.318618893623352, 1.3966821432113647, 1.474745512008667, 1.5528087615966797, 1.6308720111846924, 1.708935260772705, 1.7869987487792969, 1.8650619983673096, 1.9431253671646118, 2.021188735961914, 2.0992519855499268, 2.1773152351379395, 2.255378484725952, 2.333441734313965, 2.4115052223205566, 2.4895684719085693, 2.567631721496582, 2.645695209503174, 2.7237584590911865, 2.801821708679199, 2.879884958267212, 2.9579482078552246, 3.0360114574432373, 3.11407470703125, 3.1921379566192627, 3.2702014446258545, 3.348264694213867, 3.42632794380188, 3.5043911933898926, 3.5824544429779053, 3.660517692565918, 3.7385809421539307, 3.8166441917419434, 3.894707679748535, 3.972770929336548, 4.0508341789245605, 4.128897666931152, 4.206960678100586, 4.285024166107178]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 5.0, 14.0, 23.0, 30.0, 25.0, 43.0, 59.0, 87.0, 79.0, 96.0, 84.0, 101.0, 96.0, 64.0, 64.0, 31.0, 30.0, 26.0, 18.0, 7.0, 7.0, 9.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7793914079666138, -0.7500144839286804, -0.7206375002861023, -0.691260576248169, -0.6618836522102356, -0.6325066685676575, -0.6031297445297241, -0.573752760887146, -0.5443758368492126, -0.5149989128112793, -0.48562195897102356, -0.4562450051307678, -0.4268680512905121, -0.39749109745025635, -0.368114173412323, -0.33873721957206726, -0.3093602955341339, -0.2799833416938782, -0.2506064176559448, -0.2212294638156891, -0.19185250997543335, -0.1624755710363388, -0.13309863209724426, -0.10372167825698853, -0.07434473931789398, -0.04496779292821884, -0.015590850263834, 0.013786092400550842, 0.04316303879022598, 0.07253998517990112, 0.10191692411899567, 0.1312938779592514, 0.16067081689834595, 0.1900477558374405, 0.21942470967769623, 0.24880164861679077, 0.2781786024570465, 0.30755555629730225, 0.3369324803352356, 0.36630943417549133, 0.39568638801574707, 0.4250633418560028, 0.45444026589393616, 0.4838172197341919, 0.5131941437721252, 0.5425711274147034, 0.5719480514526367, 0.6013250350952148, 0.6307018995285034, 0.6600788235664368, 0.6894558072090149, 0.7188327312469482, 0.7482096552848816, 0.7775866389274597, 0.8069635629653931, 0.8363405466079712, 0.8657174706459045, 0.8950943946838379, 0.924471378326416, 0.9538483023643494, 0.9832252264022827, 1.0126022100448608, 1.0419790744781494, 1.0713560581207275, 1.1007330417633057]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 6.0, 6.0, 8.0, 6.0, 19.0, 18.0, 59.0, 105.0, 312.0, 811.0, 4101.0, 33572.0, 716626.0, 273920.0, 15647.0, 2436.0, 555.0, 160.0, 71.0, 41.0, 21.0, 18.0, 13.0, 10.0, 0.0, 4.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.302734375, -1.2630615234375, -1.223388671875, -1.1837158203125, -1.14404296875, -1.1043701171875, -1.064697265625, -1.0250244140625, -0.9853515625, -0.9456787109375, -0.906005859375, -0.8663330078125, -0.82666015625, -0.7869873046875, -0.747314453125, -0.7076416015625, -0.66796875, -0.6282958984375, -0.588623046875, -0.5489501953125, -0.50927734375, -0.4696044921875, -0.429931640625, -0.3902587890625, -0.3505859375, -0.3109130859375, -0.271240234375, -0.2315673828125, -0.19189453125, -0.1522216796875, -0.112548828125, -0.0728759765625, -0.033203125, 0.0064697265625, 0.046142578125, 0.0858154296875, 0.12548828125, 0.1651611328125, 0.204833984375, 0.2445068359375, 0.2841796875, 0.3238525390625, 0.363525390625, 0.4031982421875, 0.44287109375, 0.4825439453125, 0.522216796875, 0.5618896484375, 0.6015625, 0.6412353515625, 0.680908203125, 0.7205810546875, 0.76025390625, 0.7999267578125, 0.839599609375, 0.8792724609375, 0.9189453125, 0.9586181640625, 0.998291015625, 1.0379638671875, 1.07763671875, 1.1173095703125, 1.156982421875, 1.1966552734375, 1.236328125]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 11.0, 24.0, 20.0, 36.0, 53.0, 72.0, 100.0, 81.0, 96.0, 126.0, 96.0, 76.0, 65.0, 41.0, 26.0, 26.0, 12.0, 14.0, 10.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2548828125, -1.1921844482421875, -1.129486083984375, -1.0667877197265625, -1.00408935546875, -0.9413909912109375, -0.878692626953125, -0.8159942626953125, -0.7532958984375, -0.6905975341796875, -0.627899169921875, -0.5652008056640625, -0.50250244140625, -0.4398040771484375, -0.377105712890625, -0.3144073486328125, -0.251708984375, -0.1890106201171875, -0.126312255859375, -0.0636138916015625, -0.00091552734375, 0.0617828369140625, 0.124481201171875, 0.1871795654296875, 0.2498779296875, 0.3125762939453125, 0.375274658203125, 0.4379730224609375, 0.50067138671875, 0.5633697509765625, 0.626068115234375, 0.6887664794921875, 0.75146484375, 0.8141632080078125, 0.876861572265625, 0.9395599365234375, 1.00225830078125, 1.0649566650390625, 1.127655029296875, 1.1903533935546875, 1.2530517578125, 1.3157501220703125, 1.378448486328125, 1.4411468505859375, 1.50384521484375, 1.5665435791015625, 1.629241943359375, 1.6919403076171875, 1.754638671875, 1.8173370361328125, 1.880035400390625, 1.9427337646484375, 2.00543212890625, 2.0681304931640625, 2.130828857421875, 2.1935272216796875, 2.2562255859375, 2.3189239501953125, 2.381622314453125, 2.4443206787109375, 2.50701904296875, 2.5697174072265625, 2.632415771484375, 2.6951141357421875, 2.7578125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 7.0, 7.0, 11.0, 12.0, 17.0, 20.0, 33.0, 36.0, 66.0, 92.0, 143.0, 258.0, 549.0, 1738.0, 11291.0, 354804.0, 659410.0, 16363.0, 2292.0, 621.0, 298.0, 147.0, 107.0, 65.0, 42.0, 32.0, 21.0, 18.0, 10.0, 9.0, 5.0, 5.0, 7.0, 6.0, 4.0, 7.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.623046875, -1.581512451171875, -1.53997802734375, -1.498443603515625, -1.4569091796875, -1.415374755859375, -1.37384033203125, -1.332305908203125, -1.290771484375, -1.249237060546875, -1.20770263671875, -1.166168212890625, -1.1246337890625, -1.083099365234375, -1.04156494140625, -1.000030517578125, -0.95849609375, -0.916961669921875, -0.87542724609375, -0.833892822265625, -0.7923583984375, -0.750823974609375, -0.70928955078125, -0.667755126953125, -0.626220703125, -0.584686279296875, -0.54315185546875, -0.501617431640625, -0.4600830078125, -0.418548583984375, -0.37701416015625, -0.335479736328125, -0.2939453125, -0.252410888671875, -0.21087646484375, -0.169342041015625, -0.1278076171875, -0.086273193359375, -0.04473876953125, -0.003204345703125, 0.038330078125, 0.079864501953125, 0.12139892578125, 0.162933349609375, 0.2044677734375, 0.246002197265625, 0.28753662109375, 0.329071044921875, 0.37060546875, 0.412139892578125, 0.45367431640625, 0.495208740234375, 0.5367431640625, 0.578277587890625, 0.61981201171875, 0.661346435546875, 0.702880859375, 0.744415283203125, 0.78594970703125, 0.827484130859375, 0.8690185546875, 0.910552978515625, 0.95208740234375, 0.993621826171875, 1.03515625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 5.0, 6.0, 5.0, 8.0, 11.0, 14.0, 15.0, 24.0, 24.0, 25.0, 19.0, 35.0, 39.0, 30.0, 34.0, 41.0, 51.0, 45.0, 37.0, 36.0, 56.0, 39.0, 49.0, 41.0, 39.0, 44.0, 21.0, 28.0, 25.0, 18.0, 28.0, 18.0, 17.0, 12.0, 10.0, 7.0, 11.0, 11.0, 4.0, 8.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.0810546875, -1.04901123046875, -1.0169677734375, -0.98492431640625, -0.952880859375, -0.92083740234375, -0.8887939453125, -0.85675048828125, -0.82470703125, -0.79266357421875, -0.7606201171875, -0.72857666015625, -0.696533203125, -0.66448974609375, -0.6324462890625, -0.60040283203125, -0.568359375, -0.53631591796875, -0.5042724609375, -0.47222900390625, -0.440185546875, -0.40814208984375, -0.3760986328125, -0.34405517578125, -0.31201171875, -0.27996826171875, -0.2479248046875, -0.21588134765625, -0.183837890625, -0.15179443359375, -0.1197509765625, -0.08770751953125, -0.0556640625, -0.02362060546875, 0.0084228515625, 0.04046630859375, 0.072509765625, 0.10455322265625, 0.1365966796875, 0.16864013671875, 0.20068359375, 0.23272705078125, 0.2647705078125, 0.29681396484375, 0.328857421875, 0.36090087890625, 0.3929443359375, 0.42498779296875, 0.45703125, 0.48907470703125, 0.5211181640625, 0.55316162109375, 0.585205078125, 0.61724853515625, 0.6492919921875, 0.68133544921875, 0.71337890625, 0.74542236328125, 0.7774658203125, 0.80950927734375, 0.841552734375, 0.87359619140625, 0.9056396484375, 0.93768310546875, 0.9697265625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 3.0, 5.0, 5.0, 7.0, 11.0, 13.0, 26.0, 26.0, 53.0, 118.0, 236.0, 451.0, 1340.0, 4484.0, 27355.0, 804666.0, 193612.0, 11973.0, 2572.0, 871.0, 348.0, 150.0, 84.0, 46.0, 30.0, 19.0, 16.0, 12.0, 5.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52490234375, -0.5083999633789062, -0.4918975830078125, -0.47539520263671875, -0.458892822265625, -0.44239044189453125, -0.4258880615234375, -0.40938568115234375, -0.39288330078125, -0.37638092041015625, -0.3598785400390625, -0.34337615966796875, -0.326873779296875, -0.31037139892578125, -0.2938690185546875, -0.27736663818359375, -0.2608642578125, -0.24436187744140625, -0.2278594970703125, -0.21135711669921875, -0.194854736328125, -0.17835235595703125, -0.1618499755859375, -0.14534759521484375, -0.12884521484375, -0.11234283447265625, -0.0958404541015625, -0.07933807373046875, -0.062835693359375, -0.04633331298828125, -0.0298309326171875, -0.01332855224609375, 0.003173828125, 0.01967620849609375, 0.0361785888671875, 0.05268096923828125, 0.069183349609375, 0.08568572998046875, 0.1021881103515625, 0.11869049072265625, 0.13519287109375, 0.15169525146484375, 0.1681976318359375, 0.18470001220703125, 0.201202392578125, 0.21770477294921875, 0.2342071533203125, 0.25070953369140625, 0.2672119140625, 0.28371429443359375, 0.3002166748046875, 0.31671905517578125, 0.333221435546875, 0.34972381591796875, 0.3662261962890625, 0.38272857666015625, 0.39923095703125, 0.41573333740234375, 0.4322357177734375, 0.44873809814453125, 0.465240478515625, 0.48174285888671875, 0.4982452392578125, 0.5147476196289062, 0.53125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 3.0, 4.0, 4.0, 5.0, 8.0, 11.0, 23.0, 39.0, 42.0, 44.0, 123.0, 145.0, 151.0, 106.0, 90.0, 65.0, 32.0, 24.0, 21.0, 8.0, 11.0, 8.0, 6.0, 5.0, 5.0, 1.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-6.830692291259766e-05, -6.66910782456398e-05, -6.507523357868195e-05, -6.345938891172409e-05, -6.184354424476624e-05, -6.022769957780838e-05, -5.8611854910850525e-05, -5.699601024389267e-05, -5.5380165576934814e-05, -5.376432090997696e-05, -5.2148476243019104e-05, -5.053263157606125e-05, -4.8916786909103394e-05, -4.730094224214554e-05, -4.568509757518768e-05, -4.406925290822983e-05, -4.245340824127197e-05, -4.083756357431412e-05, -3.922171890735626e-05, -3.760587424039841e-05, -3.599002957344055e-05, -3.4374184906482697e-05, -3.275834023952484e-05, -3.1142495572566986e-05, -2.952665090560913e-05, -2.7910806238651276e-05, -2.629496157169342e-05, -2.4679116904735565e-05, -2.306327223777771e-05, -2.1447427570819855e-05, -1.9831582903862e-05, -1.8215738236904144e-05, -1.659989356994629e-05, -1.4984048902988434e-05, -1.3368204236030579e-05, -1.1752359569072723e-05, -1.0136514902114868e-05, -8.520670235157013e-06, -6.904825568199158e-06, -5.2889809012413025e-06, -3.6731362342834473e-06, -2.057291567325592e-06, -4.414469003677368e-07, 1.1743977665901184e-06, 2.7902424335479736e-06, 4.406087100505829e-06, 6.021931767463684e-06, 7.63777643442154e-06, 9.253621101379395e-06, 1.086946576833725e-05, 1.2485310435295105e-05, 1.410115510225296e-05, 1.5716999769210815e-05, 1.733284443616867e-05, 1.8948689103126526e-05, 2.056453377008438e-05, 2.2180378437042236e-05, 2.379622310400009e-05, 2.5412067770957947e-05, 2.7027912437915802e-05, 2.8643757104873657e-05, 3.0259601771831512e-05, 3.187544643878937e-05, 3.349129110574722e-05, 3.510713577270508e-05]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 3.0, 5.0, 5.0, 11.0, 8.0, 18.0, 27.0, 30.0, 50.0, 91.0, 111.0, 286.0, 657.0, 1990.0, 8330.0, 80435.0, 883680.0, 62648.0, 7178.0, 1764.0, 591.0, 262.0, 139.0, 77.0, 36.0, 37.0, 18.0, 20.0, 15.0, 8.0, 10.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.489990234375, -0.4744148254394531, -0.45883941650390625, -0.4432640075683594, -0.4276885986328125, -0.4121131896972656, -0.39653778076171875, -0.3809623718261719, -0.365386962890625, -0.3498115539550781, -0.33423614501953125, -0.3186607360839844, -0.3030853271484375, -0.2875099182128906, -0.27193450927734375, -0.2563591003417969, -0.24078369140625, -0.22520828247070312, -0.20963287353515625, -0.19405746459960938, -0.1784820556640625, -0.16290664672851562, -0.14733123779296875, -0.13175582885742188, -0.116180419921875, -0.10060501098632812, -0.08502960205078125, -0.06945419311523438, -0.0538787841796875, -0.038303375244140625, -0.02272796630859375, -0.007152557373046875, 0.0084228515625, 0.023998260498046875, 0.03957366943359375, 0.055149078369140625, 0.0707244873046875, 0.08629989624023438, 0.10187530517578125, 0.11745071411132812, 0.133026123046875, 0.14860153198242188, 0.16417694091796875, 0.17975234985351562, 0.1953277587890625, 0.21090316772460938, 0.22647857666015625, 0.24205398559570312, 0.25762939453125, 0.2732048034667969, 0.28878021240234375, 0.3043556213378906, 0.3199310302734375, 0.3355064392089844, 0.35108184814453125, 0.3666572570800781, 0.382232666015625, 0.3978080749511719, 0.41338348388671875, 0.4289588928222656, 0.4445343017578125, 0.4601097106933594, 0.47568511962890625, 0.4912605285644531, 0.5068359375]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 6.0, 1.0, 5.0, 8.0, 6.0, 5.0, 11.0, 15.0, 13.0, 17.0, 25.0, 34.0, 30.0, 44.0, 47.0, 83.0, 74.0, 107.0, 93.0, 72.0, 56.0, 55.0, 39.0, 36.0, 24.0, 14.0, 10.0, 9.0, 7.0, 7.0, 9.0, 7.0, 6.0, 3.0, 3.0, 0.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.086181640625, -0.08336734771728516, -0.08055305480957031, -0.07773876190185547, -0.07492446899414062, -0.07211017608642578, -0.06929588317871094, -0.0664815902709961, -0.06366729736328125, -0.060853004455566406, -0.05803871154785156, -0.05522441864013672, -0.052410125732421875, -0.04959583282470703, -0.04678153991699219, -0.043967247009277344, -0.0411529541015625, -0.038338661193847656, -0.03552436828613281, -0.03271007537841797, -0.029895782470703125, -0.02708148956298828, -0.024267196655273438, -0.021452903747558594, -0.01863861083984375, -0.015824317932128906, -0.013010025024414062, -0.010195732116699219, -0.007381439208984375, -0.004567146301269531, -0.0017528533935546875, 0.0010614395141601562, 0.003875732421875, 0.006690025329589844, 0.009504318237304688, 0.012318611145019531, 0.015132904052734375, 0.01794719696044922, 0.020761489868164062, 0.023575782775878906, 0.02639007568359375, 0.029204368591308594, 0.03201866149902344, 0.03483295440673828, 0.037647247314453125, 0.04046154022216797, 0.04327583312988281, 0.046090126037597656, 0.0489044189453125, 0.051718711853027344, 0.05453300476074219, 0.05734729766845703, 0.060161590576171875, 0.06297588348388672, 0.06579017639160156, 0.0686044692993164, 0.07141876220703125, 0.0742330551147461, 0.07704734802246094, 0.07986164093017578, 0.08267593383789062, 0.08549022674560547, 0.08830451965332031, 0.09111881256103516, 0.09393310546875]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 8.0, 13.0, 25.0, 55.0, 144.0, 294.0, 294.0, 122.0, 26.0, 16.0, 10.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.849997043609619, -6.70701265335083, -6.564028739929199, -6.42104434967041, -6.278059959411621, -6.13507604598999, -5.992091655731201, -5.84910774230957, -5.706123352050781, -5.563138961791992, -5.420155048370361, -5.277170658111572, -5.134186744689941, -4.991202354431152, -4.848217964172363, -4.705233573913574, -4.562249660491943, -4.419265270233154, -4.276281356811523, -4.133296966552734, -3.9903128147125244, -3.8473286628723145, -3.7043442726135254, -3.5613601207733154, -3.4183759689331055, -3.2753918170928955, -3.1324076652526855, -2.9894232749938965, -2.8464391231536865, -2.7034549713134766, -2.5604705810546875, -2.4174864292144775, -2.2745018005371094, -2.1315176486968994, -1.9885333776474, -1.8455491065979004, -1.7025649547576904, -1.5595808029174805, -1.416596531867981, -1.2736122608184814, -1.1306281089782715, -0.9876438975334167, -0.844659686088562, -0.7016754746437073, -0.5586912631988525, -0.4157070517539978, -0.27272284030914307, -0.12973856925964355, 0.013245582580566406, 0.15622979402542114, 0.2992140054702759, 0.4421982169151306, 0.5851824283599854, 0.7281666398048401, 0.8711508512496948, 1.0141351222991943, 1.1571192741394043, 1.3001034259796143, 1.4430876970291138, 1.5860719680786133, 1.7290561199188232, 1.8720402717590332, 2.0150246620178223, 2.1580088138580322, 2.300992965698242]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 8.0, 8.0, 17.0, 23.0, 36.0, 40.0, 52.0, 76.0, 71.0, 90.0, 94.0, 83.0, 82.0, 78.0, 62.0, 56.0, 44.0, 29.0, 32.0, 9.0, 14.0, 8.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.214970827102661, -2.100245714187622, -1.985520601272583, -1.8707953691482544, -1.7560702562332153, -1.6413451433181763, -1.5266199111938477, -1.4118947982788086, -1.2971696853637695, -1.1824445724487305, -1.0677194595336914, -0.9529942274093628, -0.8382691144943237, -0.7235440015792847, -0.6088188290596008, -0.494093656539917, -0.37936854362487793, -0.2646434009075165, -0.14991825819015503, -0.03519311547279358, 0.07953202724456787, 0.19425714015960693, 0.30898231267929077, 0.4237074851989746, 0.5384325981140137, 0.6531577110290527, 0.7678828835487366, 0.8826080560684204, 0.9973331689834595, 1.1120582818984985, 1.2267835140228271, 1.3415086269378662, 1.4562339782714844, 1.5709590911865234, 1.6856842041015625, 1.8004094362258911, 1.9151345491409302, 2.0298595428466797, 2.144584894180298, 2.259310007095337, 2.374035120010376, 2.488760232925415, 2.603485345840454, 2.718210458755493, 2.8329358100891113, 2.9476609230041504, 3.0623860359191895, 3.1771111488342285, 3.2918362617492676, 3.4065613746643066, 3.5212864875793457, 3.6360116004943848, 3.750736713409424, 3.865461826324463, 3.980187177658081, 4.094912528991699, 4.209637641906738, 4.324362754821777, 4.439087867736816, 4.5538129806518555, 4.6685380935668945, 4.783263206481934, 4.897988319396973, 5.012713432312012, 5.127438545227051]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 7.0, 16.0, 18.0, 36.0, 84.0, 120.0, 238.0, 649.0, 2064.0, 11287.0, 344419.0, 3744643.0, 82878.0, 5749.0, 1281.0, 418.0, 172.0, 96.0, 41.0, 22.0, 6.0, 15.0, 5.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.94921875, -1.882781982421875, -1.81634521484375, -1.749908447265625, -1.6834716796875, -1.617034912109375, -1.55059814453125, -1.484161376953125, -1.417724609375, -1.351287841796875, -1.28485107421875, -1.218414306640625, -1.1519775390625, -1.085540771484375, -1.01910400390625, -0.952667236328125, -0.88623046875, -0.819793701171875, -0.75335693359375, -0.686920166015625, -0.6204833984375, -0.554046630859375, -0.48760986328125, -0.421173095703125, -0.354736328125, -0.288299560546875, -0.22186279296875, -0.155426025390625, -0.0889892578125, -0.022552490234375, 0.04388427734375, 0.110321044921875, 0.1767578125, 0.243194580078125, 0.30963134765625, 0.376068115234375, 0.4425048828125, 0.508941650390625, 0.57537841796875, 0.641815185546875, 0.708251953125, 0.774688720703125, 0.84112548828125, 0.907562255859375, 0.9739990234375, 1.040435791015625, 1.10687255859375, 1.173309326171875, 1.23974609375, 1.306182861328125, 1.37261962890625, 1.439056396484375, 1.5054931640625, 1.571929931640625, 1.63836669921875, 1.704803466796875, 1.771240234375, 1.837677001953125, 1.90411376953125, 1.970550537109375, 2.0369873046875, 2.103424072265625, 2.16986083984375, 2.236297607421875, 2.302734375]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 5.0, 4.0, 2.0, 9.0, 7.0, 17.0, 15.0, 24.0, 32.0, 26.0, 39.0, 44.0, 72.0, 75.0, 73.0, 59.0, 72.0, 79.0, 61.0, 50.0, 51.0, 44.0, 28.0, 29.0, 22.0, 21.0, 11.0, 14.0, 3.0, 5.0, 3.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.99072265625, -0.962432861328125, -0.93414306640625, -0.905853271484375, -0.8775634765625, -0.849273681640625, -0.82098388671875, -0.792694091796875, -0.764404296875, -0.736114501953125, -0.70782470703125, -0.679534912109375, -0.6512451171875, -0.622955322265625, -0.59466552734375, -0.566375732421875, -0.5380859375, -0.509796142578125, -0.48150634765625, -0.453216552734375, -0.4249267578125, -0.396636962890625, -0.36834716796875, -0.340057373046875, -0.311767578125, -0.283477783203125, -0.25518798828125, -0.226898193359375, -0.1986083984375, -0.170318603515625, -0.14202880859375, -0.113739013671875, -0.08544921875, -0.057159423828125, -0.02886962890625, -0.000579833984375, 0.0277099609375, 0.055999755859375, 0.08428955078125, 0.112579345703125, 0.140869140625, 0.169158935546875, 0.19744873046875, 0.225738525390625, 0.2540283203125, 0.282318115234375, 0.31060791015625, 0.338897705078125, 0.3671875, 0.395477294921875, 0.42376708984375, 0.452056884765625, 0.4803466796875, 0.508636474609375, 0.53692626953125, 0.565216064453125, 0.593505859375, 0.621795654296875, 0.65008544921875, 0.678375244140625, 0.7066650390625, 0.734954833984375, 0.76324462890625, 0.791534423828125, 0.81982421875]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 3.0, 6.0, 11.0, 16.0, 17.0, 34.0, 77.0, 115.0, 258.0, 497.0, 1199.0, 3742.0, 16484.0, 176421.0, 3790324.0, 182114.0, 16788.0, 3811.0, 1283.0, 522.0, 232.0, 132.0, 78.0, 47.0, 28.0, 14.0, 8.0, 4.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0849609375, -1.04241943359375, -0.9998779296875, -0.95733642578125, -0.914794921875, -0.87225341796875, -0.8297119140625, -0.78717041015625, -0.74462890625, -0.70208740234375, -0.6595458984375, -0.61700439453125, -0.574462890625, -0.53192138671875, -0.4893798828125, -0.44683837890625, -0.404296875, -0.36175537109375, -0.3192138671875, -0.27667236328125, -0.234130859375, -0.19158935546875, -0.1490478515625, -0.10650634765625, -0.06396484375, -0.02142333984375, 0.0211181640625, 0.06365966796875, 0.106201171875, 0.14874267578125, 0.1912841796875, 0.23382568359375, 0.2763671875, 0.31890869140625, 0.3614501953125, 0.40399169921875, 0.446533203125, 0.48907470703125, 0.5316162109375, 0.57415771484375, 0.61669921875, 0.65924072265625, 0.7017822265625, 0.74432373046875, 0.786865234375, 0.82940673828125, 0.8719482421875, 0.91448974609375, 0.95703125, 0.99957275390625, 1.0421142578125, 1.08465576171875, 1.127197265625, 1.16973876953125, 1.2122802734375, 1.25482177734375, 1.29736328125, 1.33990478515625, 1.3824462890625, 1.42498779296875, 1.467529296875, 1.51007080078125, 1.5526123046875, 1.59515380859375, 1.6376953125]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 2.0, 5.0, 6.0, 7.0, 16.0, 13.0, 12.0, 31.0, 60.0, 84.0, 115.0, 199.0, 344.0, 637.0, 853.0, 662.0, 449.0, 229.0, 121.0, 78.0, 48.0, 36.0, 21.0, 10.0, 11.0, 8.0, 5.0, 5.0, 8.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.35595703125, -0.3462409973144531, -0.33652496337890625, -0.3268089294433594, -0.3170928955078125, -0.3073768615722656, -0.29766082763671875, -0.2879447937011719, -0.278228759765625, -0.2685127258300781, -0.25879669189453125, -0.24908065795898438, -0.2393646240234375, -0.22964859008789062, -0.21993255615234375, -0.21021652221679688, -0.20050048828125, -0.19078445434570312, -0.18106842041015625, -0.17135238647460938, -0.1616363525390625, -0.15192031860351562, -0.14220428466796875, -0.13248825073242188, -0.122772216796875, -0.11305618286132812, -0.10334014892578125, -0.09362411499023438, -0.0839080810546875, -0.07419204711914062, -0.06447601318359375, -0.054759979248046875, -0.0450439453125, -0.035327911376953125, -0.02561187744140625, -0.015895843505859375, -0.0061798095703125, 0.003536224365234375, 0.01325225830078125, 0.022968292236328125, 0.032684326171875, 0.042400360107421875, 0.05211639404296875, 0.061832427978515625, 0.0715484619140625, 0.08126449584960938, 0.09098052978515625, 0.10069656372070312, 0.11041259765625, 0.12012863159179688, 0.12984466552734375, 0.13956069946289062, 0.1492767333984375, 0.15899276733398438, 0.16870880126953125, 0.17842483520507812, 0.188140869140625, 0.19785690307617188, 0.20757293701171875, 0.21728897094726562, 0.2270050048828125, 0.23672103881835938, 0.24643707275390625, 0.2561531066894531, 0.265869140625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 8.0, 4.0, 12.0, 12.0, 10.0, 19.0, 24.0, 44.0, 67.0, 73.0, 99.0, 119.0, 116.0, 121.0, 76.0, 56.0, 35.0, 26.0, 28.0, 14.0, 12.0, 6.0, 8.0, 2.0, 2.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8260102868080139, -0.7886925935745239, -0.7513749003410339, -0.714057207107544, -0.6767395734786987, -0.639421820640564, -0.6021041870117188, -0.5647864937782288, -0.5274688005447388, -0.4901511073112488, -0.4528334140777588, -0.4155157506465912, -0.3781980574131012, -0.3408803641796112, -0.3035627007484436, -0.2662450075149536, -0.22892731428146362, -0.19160962104797363, -0.15429194271564484, -0.11697425693273544, -0.07965657114982605, -0.04233887791633606, -0.005021199584007263, 0.03229647874832153, 0.06961417198181152, 0.10693185776472092, 0.1442495435476303, 0.1815672218799591, 0.2188849151134491, 0.2562026083469391, 0.2935202717781067, 0.3308379650115967, 0.36815571784973145, 0.40547341108322144, 0.4427911043167114, 0.48010876774787903, 0.5174264907836914, 0.5547441244125366, 0.5920618176460266, 0.6293795108795166, 0.6666972041130066, 0.7040148973464966, 0.7413325905799866, 0.7786502838134766, 0.8159679174423218, 0.8532856702804565, 0.8906033039093018, 0.9279209971427917, 0.9652386903762817, 1.002556324005127, 1.0398740768432617, 1.077191710472107, 1.1145094633102417, 1.151827096939087, 1.1891448497772217, 1.226462483406067, 1.263780117034912, 1.3010977506637573, 1.338415503501892, 1.3757331371307373, 1.413050889968872, 1.4503685235977173, 1.487686276435852, 1.5250039100646973, 1.562321662902832]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 6.0, 4.0, 6.0, 7.0, 14.0, 14.0, 16.0, 21.0, 22.0, 21.0, 35.0, 32.0, 44.0, 56.0, 53.0, 50.0, 71.0, 57.0, 51.0, 68.0, 56.0, 65.0, 27.0, 31.0, 31.0, 28.0, 22.0, 18.0, 20.0, 16.0, 8.0, 8.0, 7.0, 6.0, 6.0, 5.0, 1.0, 4.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-0.9553451538085938, -0.9303389191627502, -0.9053326845169067, -0.880326509475708, -0.8553202748298645, -0.830314040184021, -0.8053078651428223, -0.7803016304969788, -0.7552953958511353, -0.7302891612052917, -0.7052829265594482, -0.6802767515182495, -0.655270516872406, -0.6302642822265625, -0.6052581071853638, -0.5802518725395203, -0.5552456378936768, -0.5302394032478333, -0.5052331686019897, -0.480226993560791, -0.4552207589149475, -0.430214524269104, -0.4052083194255829, -0.38020211458206177, -0.35519587993621826, -0.33018964529037476, -0.30518344044685364, -0.2801772356033325, -0.255171000957489, -0.2301647812128067, -0.2051585614681244, -0.18015234172344208, -0.15514612197875977, -0.13013990223407745, -0.10513368248939514, -0.08012746274471283, -0.05512124300003052, -0.030115023255348206, -0.0051088035106658936, 0.01989741623401642, 0.04490363597869873, 0.06990985572338104, 0.09491607546806335, 0.11992229521274567, 0.14492851495742798, 0.1699347347021103, 0.1949409544467926, 0.21994717419147491, 0.24495339393615723, 0.26995962858200073, 0.29496583342552185, 0.31997203826904297, 0.3449782729148865, 0.36998450756073, 0.3949907124042511, 0.4199969172477722, 0.4450031518936157, 0.47000938653945923, 0.49501559138298035, 0.5200217962265015, 0.545028030872345, 0.5700342655181885, 0.5950404405593872, 0.6200466752052307, 0.6450529098510742]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 1.0, 4.0, 4.0, 6.0, 11.0, 7.0, 19.0, 15.0, 16.0, 21.0, 18.0, 27.0, 33.0, 47.0, 60.0, 120.0, 240.0, 475.0, 1094.0, 2789.0, 7728.0, 23963.0, 81506.0, 262503.0, 404499.0, 183977.0, 53923.0, 16170.0, 5496.0, 2039.0, 806.0, 348.0, 188.0, 109.0, 64.0, 51.0, 46.0, 26.0, 19.0, 14.0, 13.0, 20.0, 9.0, 7.0, 7.0, 6.0, 2.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.12396240234375, -0.12012863159179688, -0.11629486083984375, -0.11246109008789062, -0.1086273193359375, -0.10479354858398438, -0.10095977783203125, -0.09712600708007812, -0.093292236328125, -0.08945846557617188, -0.08562469482421875, -0.08179092407226562, -0.0779571533203125, -0.07412338256835938, -0.07028961181640625, -0.06645584106445312, -0.0626220703125, -0.058788299560546875, -0.05495452880859375, -0.051120758056640625, -0.0472869873046875, -0.043453216552734375, -0.03961944580078125, -0.035785675048828125, -0.031951904296875, -0.028118133544921875, -0.02428436279296875, -0.020450592041015625, -0.0166168212890625, -0.012783050537109375, -0.00894927978515625, -0.005115509033203125, -0.00128173828125, 0.002552032470703125, 0.00638580322265625, 0.010219573974609375, 0.0140533447265625, 0.017887115478515625, 0.02172088623046875, 0.025554656982421875, 0.029388427734375, 0.033222198486328125, 0.03705596923828125, 0.040889739990234375, 0.0447235107421875, 0.048557281494140625, 0.05239105224609375, 0.056224822998046875, 0.06005859375, 0.06389236450195312, 0.06772613525390625, 0.07155990600585938, 0.0753936767578125, 0.07922744750976562, 0.08306121826171875, 0.08689498901367188, 0.090728759765625, 0.09456253051757812, 0.09839630126953125, 0.10223007202148438, 0.1060638427734375, 0.10989761352539062, 0.11373138427734375, 0.11756515502929688, 0.12139892578125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 5.0, 5.0, 6.0, 5.0, 8.0, 14.0, 21.0, 23.0, 24.0, 26.0, 37.0, 42.0, 44.0, 56.0, 66.0, 50.0, 67.0, 64.0, 66.0, 78.0, 43.0, 45.0, 34.0, 27.0, 25.0, 28.0, 20.0, 13.0, 15.0, 8.0, 7.0, 12.0, 6.0, 4.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.64990234375, -0.6322669982910156, -0.6146316528320312, -0.5969963073730469, -0.5793609619140625, -0.5617256164550781, -0.5440902709960938, -0.5264549255371094, -0.508819580078125, -0.4911842346191406, -0.47354888916015625, -0.4559135437011719, -0.4382781982421875, -0.4206428527832031, -0.40300750732421875, -0.3853721618652344, -0.36773681640625, -0.3501014709472656, -0.33246612548828125, -0.3148307800292969, -0.2971954345703125, -0.2795600891113281, -0.26192474365234375, -0.24428939819335938, -0.226654052734375, -0.20901870727539062, -0.19138336181640625, -0.17374801635742188, -0.1561126708984375, -0.13847732543945312, -0.12084197998046875, -0.10320663452148438, -0.0855712890625, -0.06793594360351562, -0.05030059814453125, -0.032665252685546875, -0.0150299072265625, 0.002605438232421875, 0.02024078369140625, 0.037876129150390625, 0.055511474609375, 0.07314682006835938, 0.09078216552734375, 0.10841751098632812, 0.1260528564453125, 0.14368820190429688, 0.16132354736328125, 0.17895889282226562, 0.19659423828125, 0.21422958374023438, 0.23186492919921875, 0.24950027465820312, 0.2671356201171875, 0.2847709655761719, 0.30240631103515625, 0.3200416564941406, 0.337677001953125, 0.3553123474121094, 0.37294769287109375, 0.3905830383300781, 0.4082183837890625, 0.4258537292480469, 0.44348907470703125, 0.4611244201660156, 0.478759765625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 4.0, 9.0, 5.0, 9.0, 14.0, 20.0, 24.0, 25.0, 38.0, 53.0, 61.0, 82.0, 120.0, 139.0, 226.0, 302.0, 490.0, 849.0, 1525.0, 3324.0, 7897.0, 22930.0, 71765.0, 218706.0, 383578.0, 224443.0, 73523.0, 23096.0, 8065.0, 3252.0, 1567.0, 813.0, 457.0, 320.0, 212.0, 151.0, 114.0, 73.0, 58.0, 39.0, 47.0, 29.0, 29.0, 15.0, 8.0, 7.0, 9.0, 11.0, 2.0, 6.0, 2.0, 1.0, 3.0, 0.0, 6.0], "bins": [-0.10809326171875, -0.10486793518066406, -0.10164260864257812, -0.09841728210449219, -0.09519195556640625, -0.09196662902832031, -0.08874130249023438, -0.08551597595214844, -0.0822906494140625, -0.07906532287597656, -0.07583999633789062, -0.07261466979980469, -0.06938934326171875, -0.06616401672363281, -0.06293869018554688, -0.05971336364746094, -0.056488037109375, -0.05326271057128906, -0.050037384033203125, -0.04681205749511719, -0.04358673095703125, -0.04036140441894531, -0.037136077880859375, -0.03391075134277344, -0.0306854248046875, -0.027460098266601562, -0.024234771728515625, -0.021009445190429688, -0.01778411865234375, -0.014558792114257812, -0.011333465576171875, -0.008108139038085938, -0.0048828125, -0.0016574859619140625, 0.001567840576171875, 0.0047931671142578125, 0.00801849365234375, 0.011243820190429688, 0.014469146728515625, 0.017694473266601562, 0.0209197998046875, 0.024145126342773438, 0.027370452880859375, 0.030595779418945312, 0.03382110595703125, 0.03704643249511719, 0.040271759033203125, 0.04349708557128906, 0.046722412109375, 0.04994773864746094, 0.053173065185546875, 0.05639839172363281, 0.05962371826171875, 0.06284904479980469, 0.06607437133789062, 0.06929969787597656, 0.0725250244140625, 0.07575035095214844, 0.07897567749023438, 0.08220100402832031, 0.08542633056640625, 0.08865165710449219, 0.09187698364257812, 0.09510231018066406, 0.09832763671875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 0.0, 7.0, 4.0, 8.0, 10.0, 10.0, 24.0, 20.0, 20.0, 25.0, 34.0, 43.0, 25.0, 38.0, 53.0, 46.0, 47.0, 56.0, 63.0, 47.0, 49.0, 46.0, 55.0, 56.0, 33.0, 30.0, 25.0, 23.0, 20.0, 17.0, 12.0, 13.0, 10.0, 8.0, 5.0, 6.0, 5.0, 1.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8720703125, -0.843658447265625, -0.81524658203125, -0.786834716796875, -0.7584228515625, -0.730010986328125, -0.70159912109375, -0.673187255859375, -0.644775390625, -0.616363525390625, -0.58795166015625, -0.559539794921875, -0.5311279296875, -0.502716064453125, -0.47430419921875, -0.445892333984375, -0.41748046875, -0.389068603515625, -0.36065673828125, -0.332244873046875, -0.3038330078125, -0.275421142578125, -0.24700927734375, -0.218597412109375, -0.190185546875, -0.161773681640625, -0.13336181640625, -0.104949951171875, -0.0765380859375, -0.048126220703125, -0.01971435546875, 0.008697509765625, 0.037109375, 0.065521240234375, 0.09393310546875, 0.122344970703125, 0.1507568359375, 0.179168701171875, 0.20758056640625, 0.235992431640625, 0.264404296875, 0.292816162109375, 0.32122802734375, 0.349639892578125, 0.3780517578125, 0.406463623046875, 0.43487548828125, 0.463287353515625, 0.49169921875, 0.520111083984375, 0.54852294921875, 0.576934814453125, 0.6053466796875, 0.633758544921875, 0.66217041015625, 0.690582275390625, 0.718994140625, 0.747406005859375, 0.77581787109375, 0.804229736328125, 0.8326416015625, 0.861053466796875, 0.88946533203125, 0.917877197265625, 0.9462890625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 5.0, 7.0, 13.0, 12.0, 12.0, 22.0, 22.0, 39.0, 56.0, 89.0, 142.0, 239.0, 483.0, 921.0, 1976.0, 4883.0, 16347.0, 88373.0, 505685.0, 355955.0, 54155.0, 11833.0, 3811.0, 1640.0, 783.0, 434.0, 259.0, 127.0, 88.0, 40.0, 30.0, 26.0, 21.0, 12.0, 6.0, 0.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0589599609375, -0.05726909637451172, -0.05557823181152344, -0.053887367248535156, -0.052196502685546875, -0.050505638122558594, -0.04881477355957031, -0.04712390899658203, -0.04543304443359375, -0.04374217987060547, -0.04205131530761719, -0.040360450744628906, -0.038669586181640625, -0.036978721618652344, -0.03528785705566406, -0.03359699249267578, -0.0319061279296875, -0.03021526336669922, -0.028524398803710938, -0.026833534240722656, -0.025142669677734375, -0.023451805114746094, -0.021760940551757812, -0.02007007598876953, -0.01837921142578125, -0.01668834686279297, -0.014997482299804688, -0.013306617736816406, -0.011615753173828125, -0.009924888610839844, -0.008234024047851562, -0.006543159484863281, -0.004852294921875, -0.0031614303588867188, -0.0014705657958984375, 0.00022029876708984375, 0.001911163330078125, 0.0036020278930664062, 0.0052928924560546875, 0.006983757019042969, 0.00867462158203125, 0.010365486145019531, 0.012056350708007812, 0.013747215270996094, 0.015438079833984375, 0.017128944396972656, 0.018819808959960938, 0.02051067352294922, 0.0222015380859375, 0.02389240264892578, 0.025583267211914062, 0.027274131774902344, 0.028964996337890625, 0.030655860900878906, 0.03234672546386719, 0.03403759002685547, 0.03572845458984375, 0.03741931915283203, 0.03911018371582031, 0.040801048278808594, 0.042491912841796875, 0.044182777404785156, 0.04587364196777344, 0.04756450653076172, 0.04925537109375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 11.0, 12.0, 14.0, 24.0, 35.0, 45.0, 68.0, 88.0, 88.0, 96.0, 108.0, 99.0, 95.0, 60.0, 42.0, 34.0, 18.0, 25.0, 13.0, 7.0, 8.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7179718017578125e-05, -2.6333145797252655e-05, -2.5486573576927185e-05, -2.4640001356601715e-05, -2.3793429136276245e-05, -2.2946856915950775e-05, -2.2100284695625305e-05, -2.1253712475299835e-05, -2.0407140254974365e-05, -1.9560568034648895e-05, -1.8713995814323425e-05, -1.7867423593997955e-05, -1.7020851373672485e-05, -1.6174279153347015e-05, -1.5327706933021545e-05, -1.4481134712696075e-05, -1.3634562492370605e-05, -1.2787990272045135e-05, -1.1941418051719666e-05, -1.1094845831394196e-05, -1.0248273611068726e-05, -9.401701390743256e-06, -8.555129170417786e-06, -7.708556950092316e-06, -6.861984729766846e-06, -6.015412509441376e-06, -5.168840289115906e-06, -4.322268068790436e-06, -3.475695848464966e-06, -2.629123628139496e-06, -1.7825514078140259e-06, -9.359791874885559e-07, -8.940696716308594e-08, 7.57165253162384e-07, 1.603737473487854e-06, 2.450309693813324e-06, 3.296881914138794e-06, 4.143454134464264e-06, 4.990026354789734e-06, 5.836598575115204e-06, 6.683170795440674e-06, 7.529743015766144e-06, 8.376315236091614e-06, 9.222887456417084e-06, 1.0069459676742554e-05, 1.0916031897068024e-05, 1.1762604117393494e-05, 1.2609176337718964e-05, 1.3455748558044434e-05, 1.4302320778369904e-05, 1.5148892998695374e-05, 1.5995465219020844e-05, 1.6842037439346313e-05, 1.7688609659671783e-05, 1.8535181879997253e-05, 1.9381754100322723e-05, 2.0228326320648193e-05, 2.1074898540973663e-05, 2.1921470761299133e-05, 2.2768042981624603e-05, 2.3614615201950073e-05, 2.4461187422275543e-05, 2.5307759642601013e-05, 2.6154331862926483e-05, 2.7000904083251953e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 4.0, 6.0, 9.0, 10.0, 13.0, 30.0, 41.0, 49.0, 76.0, 106.0, 173.0, 236.0, 388.0, 557.0, 1059.0, 1913.0, 3949.0, 8924.0, 22559.0, 61807.0, 172845.0, 348283.0, 262904.0, 101045.0, 35930.0, 13585.0, 5818.0, 2655.0, 1381.0, 775.0, 510.0, 278.0, 206.0, 121.0, 90.0, 67.0, 49.0, 37.0, 15.0, 12.0, 9.0, 6.0, 10.0, 4.0, 3.0, 0.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0322265625, -0.03124213218688965, -0.030257701873779297, -0.029273271560668945, -0.028288841247558594, -0.027304410934448242, -0.02631998062133789, -0.02533555030822754, -0.024351119995117188, -0.023366689682006836, -0.022382259368896484, -0.021397829055786133, -0.02041339874267578, -0.01942896842956543, -0.018444538116455078, -0.017460107803344727, -0.016475677490234375, -0.015491247177124023, -0.014506816864013672, -0.01352238655090332, -0.012537956237792969, -0.011553525924682617, -0.010569095611572266, -0.009584665298461914, -0.008600234985351562, -0.007615804672241211, -0.006631374359130859, -0.005646944046020508, -0.004662513732910156, -0.0036780834197998047, -0.002693653106689453, -0.0017092227935791016, -0.00072479248046875, 0.00025963783264160156, 0.0012440681457519531, 0.0022284984588623047, 0.0032129287719726562, 0.004197359085083008, 0.005181789398193359, 0.006166219711303711, 0.0071506500244140625, 0.008135080337524414, 0.009119510650634766, 0.010103940963745117, 0.011088371276855469, 0.01207280158996582, 0.013057231903076172, 0.014041662216186523, 0.015026092529296875, 0.016010522842407227, 0.016994953155517578, 0.01797938346862793, 0.01896381378173828, 0.019948244094848633, 0.020932674407958984, 0.021917104721069336, 0.022901535034179688, 0.02388596534729004, 0.02487039566040039, 0.025854825973510742, 0.026839256286621094, 0.027823686599731445, 0.028808116912841797, 0.02979254722595215, 0.0307769775390625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 5.0, 0.0, 2.0, 1.0, 5.0, 6.0, 5.0, 6.0, 4.0, 10.0, 12.0, 16.0, 24.0, 22.0, 19.0, 29.0, 24.0, 42.0, 33.0, 56.0, 46.0, 56.0, 62.0, 45.0, 45.0, 51.0, 53.0, 45.0, 56.0, 38.0, 39.0, 29.0, 23.0, 16.0, 17.0, 12.0, 12.0, 13.0, 10.0, 8.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00695037841796875, -0.006698012351989746, -0.006445646286010742, -0.006193280220031738, -0.005940914154052734, -0.0056885480880737305, -0.0054361820220947266, -0.005183815956115723, -0.004931449890136719, -0.004679083824157715, -0.004426717758178711, -0.004174351692199707, -0.003921985626220703, -0.0036696195602416992, -0.0034172534942626953, -0.0031648874282836914, -0.0029125213623046875, -0.0026601552963256836, -0.0024077892303466797, -0.0021554231643676758, -0.0019030570983886719, -0.001650691032409668, -0.001398324966430664, -0.0011459589004516602, -0.0008935928344726562, -0.0006412267684936523, -0.00038886070251464844, -0.00013649463653564453, 0.00011587142944335938, 0.0003682374954223633, 0.0006206035614013672, 0.0008729696273803711, 0.001125335693359375, 0.001377701759338379, 0.0016300678253173828, 0.0018824338912963867, 0.0021347999572753906, 0.0023871660232543945, 0.0026395320892333984, 0.0028918981552124023, 0.0031442642211914062, 0.00339663028717041, 0.003648996353149414, 0.003901362419128418, 0.004153728485107422, 0.004406094551086426, 0.00465846061706543, 0.004910826683044434, 0.0051631927490234375, 0.005415558815002441, 0.005667924880981445, 0.005920290946960449, 0.006172657012939453, 0.006425023078918457, 0.006677389144897461, 0.006929755210876465, 0.007182121276855469, 0.007434487342834473, 0.0076868534088134766, 0.00793921947479248, 0.008191585540771484, 0.008443951606750488, 0.008696317672729492, 0.008948683738708496, 0.0092010498046875]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 6.0, 8.0, 7.0, 14.0, 23.0, 35.0, 108.0, 161.0, 238.0, 194.0, 98.0, 53.0, 32.0, 20.0, 3.0, 10.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5892325639724731, -0.5460082292556763, -0.5027838945388794, -0.45955950021743774, -0.41633516550064087, -0.373110830783844, -0.32988646626472473, -0.28666210174560547, -0.2434377670288086, -0.20021341741085052, -0.15698906779289246, -0.11376471817493439, -0.07054036855697632, -0.02731601893901825, 0.01590833067893982, 0.05913269519805908, 0.10235702991485596, 0.14558137953281403, 0.1888057291507721, 0.23203007876873016, 0.27525442838668823, 0.3184787631034851, 0.36170312762260437, 0.40492749214172363, 0.4481518268585205, 0.4913761615753174, 0.5346004962921143, 0.5778248906135559, 0.6210492253303528, 0.6642735600471497, 0.7074979543685913, 0.7507222890853882, 0.7939467430114746, 0.8371710777282715, 0.8803954124450684, 0.92361980676651, 0.9668441414833069, 1.0100685358047485, 1.0532928705215454, 1.0965172052383423, 1.1397415399551392, 1.182965874671936, 1.226190209388733, 1.2694145441055298, 1.3126389980316162, 1.355863332748413, 1.39908766746521, 1.4423120021820068, 1.4855363368988037, 1.5287606716156006, 1.5719850063323975, 1.6152093410491943, 1.6584336757659912, 1.7016581296920776, 1.7448824644088745, 1.7881067991256714, 1.8313311338424683, 1.8745554685592651, 1.917779803276062, 1.9610041379928589, 2.0042285919189453, 2.047452926635742, 2.090677261352539, 2.133901596069336, 2.177125930786133]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 7.0, 2.0, 8.0, 9.0, 13.0, 19.0, 20.0, 19.0, 22.0, 27.0, 38.0, 48.0, 61.0, 56.0, 62.0, 80.0, 65.0, 70.0, 73.0, 62.0, 36.0, 37.0, 37.0, 22.0, 22.0, 23.0, 14.0, 9.0, 13.0, 7.0, 5.0, 4.0, 8.0, 3.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6705573201179504, -0.6525649428367615, -0.6345725655555725, -0.6165802478790283, -0.5985878705978394, -0.5805954933166504, -0.5626031160354614, -0.5446107387542725, -0.5266184210777283, -0.5086260437965393, -0.49063369631767273, -0.47264131903648376, -0.4546489715576172, -0.4366565942764282, -0.41866421699523926, -0.4006718695163727, -0.3826794922351837, -0.36468711495399475, -0.3466947674751282, -0.3287023901939392, -0.31071004271507263, -0.29271766543388367, -0.2747253179550171, -0.2567329406738281, -0.23874057829380035, -0.22074821591377258, -0.2027558535337448, -0.18476349115371704, -0.16677111387252808, -0.1487787663936615, -0.13078638911247253, -0.11279402673244476, -0.09480166435241699, -0.07680930197238922, -0.05881693586707115, -0.04082456976175308, -0.02283220738172531, -0.00483984500169754, 0.013152524828910828, 0.0311448872089386, 0.04913724958896637, 0.06712961196899414, 0.08512197434902191, 0.10311434417963028, 0.12110670655965805, 0.13909906148910522, 0.1570914387702942, 0.17508380115032196, 0.19307616353034973, 0.2110685259103775, 0.22906088829040527, 0.24705326557159424, 0.2650456130504608, 0.2830379903316498, 0.30103033781051636, 0.3190227150917053, 0.3370150923728943, 0.35500746965408325, 0.37299981713294983, 0.3909921944141388, 0.40898454189300537, 0.42697691917419434, 0.4449692964553833, 0.4629616439342499, 0.48095399141311646]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 2.0, 6.0, 5.0, 5.0, 23.0, 15.0, 38.0, 40.0, 51.0, 94.0, 156.0, 241.0, 365.0, 702.0, 1213.0, 2365.0, 5084.0, 11256.0, 29266.0, 103042.0, 495414.0, 301536.0, 60936.0, 20209.0, 8258.0, 3840.0, 1933.0, 1013.0, 584.0, 296.0, 191.0, 124.0, 71.0, 55.0, 36.0, 22.0, 16.0, 10.0, 11.0, 9.0, 5.0, 5.0, 7.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.48291015625, -0.46671295166015625, -0.4505157470703125, -0.43431854248046875, -0.418121337890625, -0.40192413330078125, -0.3857269287109375, -0.36952972412109375, -0.35333251953125, -0.33713531494140625, -0.3209381103515625, -0.30474090576171875, -0.288543701171875, -0.27234649658203125, -0.2561492919921875, -0.23995208740234375, -0.2237548828125, -0.20755767822265625, -0.1913604736328125, -0.17516326904296875, -0.158966064453125, -0.14276885986328125, -0.1265716552734375, -0.11037445068359375, -0.09417724609375, -0.07798004150390625, -0.0617828369140625, -0.04558563232421875, -0.029388427734375, -0.01319122314453125, 0.0030059814453125, 0.01920318603515625, 0.035400390625, 0.05159759521484375, 0.0677947998046875, 0.08399200439453125, 0.100189208984375, 0.11638641357421875, 0.1325836181640625, 0.14878082275390625, 0.16497802734375, 0.18117523193359375, 0.1973724365234375, 0.21356964111328125, 0.229766845703125, 0.24596405029296875, 0.2621612548828125, 0.27835845947265625, 0.2945556640625, 0.31075286865234375, 0.3269500732421875, 0.34314727783203125, 0.359344482421875, 0.37554168701171875, 0.3917388916015625, 0.40793609619140625, 0.42413330078125, 0.44033050537109375, 0.4565277099609375, 0.47272491455078125, 0.488922119140625, 0.5051193237304688, 0.5213165283203125, 0.5375137329101562, 0.5537109375]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 10.0, 7.0, 7.0, 15.0, 18.0, 24.0, 23.0, 44.0, 37.0, 46.0, 61.0, 70.0, 73.0, 76.0, 77.0, 79.0, 56.0, 63.0, 33.0, 45.0, 32.0, 26.0, 13.0, 18.0, 9.0, 8.0, 7.0, 9.0, 5.0, 3.0, 2.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.50390625, -1.4652023315429688, -1.4264984130859375, -1.3877944946289062, -1.349090576171875, -1.3103866577148438, -1.2716827392578125, -1.2329788208007812, -1.19427490234375, -1.1555709838867188, -1.1168670654296875, -1.0781631469726562, -1.039459228515625, -1.0007553100585938, -0.9620513916015625, -0.9233474731445312, -0.8846435546875, -0.8459396362304688, -0.8072357177734375, -0.7685317993164062, -0.729827880859375, -0.6911239624023438, -0.6524200439453125, -0.6137161254882812, -0.57501220703125, -0.5363082885742188, -0.4976043701171875, -0.45890045166015625, -0.420196533203125, -0.38149261474609375, -0.3427886962890625, -0.30408477783203125, -0.265380859375, -0.22667694091796875, -0.1879730224609375, -0.14926910400390625, -0.110565185546875, -0.07186126708984375, -0.0331573486328125, 0.00554656982421875, 0.04425048828125, 0.08295440673828125, 0.1216583251953125, 0.16036224365234375, 0.199066162109375, 0.23777008056640625, 0.2764739990234375, 0.31517791748046875, 0.3538818359375, 0.39258575439453125, 0.4312896728515625, 0.46999359130859375, 0.508697509765625, 0.5474014282226562, 0.5861053466796875, 0.6248092651367188, 0.66351318359375, 0.7022171020507812, 0.7409210205078125, 0.7796249389648438, 0.818328857421875, 0.8570327758789062, 0.8957366943359375, 0.9344406127929688, 0.97314453125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 5.0, 5.0, 2.0, 4.0, 5.0, 4.0, 6.0, 6.0, 13.0, 9.0, 23.0, 21.0, 27.0, 35.0, 48.0, 117.0, 180.0, 479.0, 1288.0, 6441.0, 68382.0, 899754.0, 63687.0, 5924.0, 1197.0, 390.0, 173.0, 93.0, 58.0, 46.0, 34.0, 22.0, 15.0, 13.0, 11.0, 10.0, 8.0, 6.0, 6.0, 3.0, 2.0, 1.0, 0.0, 4.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1318359375, -1.0947113037109375, -1.057586669921875, -1.0204620361328125, -0.98333740234375, -0.9462127685546875, -0.909088134765625, -0.8719635009765625, -0.8348388671875, -0.7977142333984375, -0.760589599609375, -0.7234649658203125, -0.68634033203125, -0.6492156982421875, -0.612091064453125, -0.5749664306640625, -0.537841796875, -0.5007171630859375, -0.463592529296875, -0.4264678955078125, -0.38934326171875, -0.3522186279296875, -0.315093994140625, -0.2779693603515625, -0.2408447265625, -0.2037200927734375, -0.166595458984375, -0.1294708251953125, -0.09234619140625, -0.0552215576171875, -0.018096923828125, 0.0190277099609375, 0.05615234375, 0.0932769775390625, 0.130401611328125, 0.1675262451171875, 0.20465087890625, 0.2417755126953125, 0.278900146484375, 0.3160247802734375, 0.3531494140625, 0.3902740478515625, 0.427398681640625, 0.4645233154296875, 0.50164794921875, 0.5387725830078125, 0.575897216796875, 0.6130218505859375, 0.650146484375, 0.6872711181640625, 0.724395751953125, 0.7615203857421875, 0.79864501953125, 0.8357696533203125, 0.872894287109375, 0.9100189208984375, 0.9471435546875, 0.9842681884765625, 1.021392822265625, 1.0585174560546875, 1.09564208984375, 1.1327667236328125, 1.169891357421875, 1.2070159912109375, 1.244140625]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 7.0, 7.0, 11.0, 16.0, 10.0, 18.0, 12.0, 24.0, 27.0, 26.0, 31.0, 34.0, 42.0, 41.0, 53.0, 48.0, 45.0, 43.0, 36.0, 53.0, 57.0, 44.0, 34.0, 34.0, 28.0, 32.0, 29.0, 25.0, 25.0, 16.0, 17.0, 14.0, 16.0, 13.0, 10.0, 8.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9775390625, -0.946075439453125, -0.91461181640625, -0.883148193359375, -0.8516845703125, -0.820220947265625, -0.78875732421875, -0.757293701171875, -0.725830078125, -0.694366455078125, -0.66290283203125, -0.631439208984375, -0.5999755859375, -0.568511962890625, -0.53704833984375, -0.505584716796875, -0.47412109375, -0.442657470703125, -0.41119384765625, -0.379730224609375, -0.3482666015625, -0.316802978515625, -0.28533935546875, -0.253875732421875, -0.222412109375, -0.190948486328125, -0.15948486328125, -0.128021240234375, -0.0965576171875, -0.065093994140625, -0.03363037109375, -0.002166748046875, 0.029296875, 0.060760498046875, 0.09222412109375, 0.123687744140625, 0.1551513671875, 0.186614990234375, 0.21807861328125, 0.249542236328125, 0.281005859375, 0.312469482421875, 0.34393310546875, 0.375396728515625, 0.4068603515625, 0.438323974609375, 0.46978759765625, 0.501251220703125, 0.53271484375, 0.564178466796875, 0.59564208984375, 0.627105712890625, 0.6585693359375, 0.690032958984375, 0.72149658203125, 0.752960205078125, 0.784423828125, 0.815887451171875, 0.84735107421875, 0.878814697265625, 0.9102783203125, 0.941741943359375, 0.97320556640625, 1.004669189453125, 1.0361328125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 3.0, 3.0, 6.0, 3.0, 5.0, 15.0, 23.0, 26.0, 75.0, 175.0, 475.0, 2134.0, 18899.0, 982422.0, 40182.0, 3040.0, 651.0, 215.0, 96.0, 33.0, 20.0, 10.0, 11.0, 11.0, 4.0, 6.0, 0.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.041015625, -1.0109329223632812, -0.9808502197265625, -0.9507675170898438, -0.920684814453125, -0.8906021118164062, -0.8605194091796875, -0.8304367065429688, -0.80035400390625, -0.7702713012695312, -0.7401885986328125, -0.7101058959960938, -0.680023193359375, -0.6499404907226562, -0.6198577880859375, -0.5897750854492188, -0.5596923828125, -0.5296096801757812, -0.4995269775390625, -0.46944427490234375, -0.439361572265625, -0.40927886962890625, -0.3791961669921875, -0.34911346435546875, -0.31903076171875, -0.28894805908203125, -0.2588653564453125, -0.22878265380859375, -0.198699951171875, -0.16861724853515625, -0.1385345458984375, -0.10845184326171875, -0.078369140625, -0.04828643798828125, -0.0182037353515625, 0.01187896728515625, 0.041961669921875, 0.07204437255859375, 0.1021270751953125, 0.13220977783203125, 0.16229248046875, 0.19237518310546875, 0.2224578857421875, 0.25254058837890625, 0.282623291015625, 0.31270599365234375, 0.3427886962890625, 0.37287139892578125, 0.4029541015625, 0.43303680419921875, 0.4631195068359375, 0.49320220947265625, 0.523284912109375, 0.5533676147460938, 0.5834503173828125, 0.6135330200195312, 0.64361572265625, 0.6736984252929688, 0.7037811279296875, 0.7338638305664062, 0.763946533203125, 0.7940292358398438, 0.8241119384765625, 0.8541946411132812, 0.88427734375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 0.0, 4.0, 14.0, 17.0, 31.0, 82.0, 218.0, 347.0, 174.0, 64.0, 22.0, 13.0, 7.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015234947204589844, -0.0001485804095864296, -0.00014481134712696075, -0.0001410422846674919, -0.00013727322220802307, -0.00013350415974855423, -0.0001297350972890854, -0.00012596603482961655, -0.0001221969723701477, -0.00011842790991067886, -0.00011465884745121002, -0.00011088978499174118, -0.00010712072253227234, -0.0001033516600728035, -9.958259761333466e-05, -9.581353515386581e-05, -9.204447269439697e-05, -8.827541023492813e-05, -8.450634777545929e-05, -8.073728531599045e-05, -7.69682228565216e-05, -7.319916039705276e-05, -6.943009793758392e-05, -6.566103547811508e-05, -6.189197301864624e-05, -5.81229105591774e-05, -5.435384809970856e-05, -5.0584785640239716e-05, -4.6815723180770874e-05, -4.304666072130203e-05, -3.927759826183319e-05, -3.550853580236435e-05, -3.173947334289551e-05, -2.7970410883426666e-05, -2.4201348423957825e-05, -2.0432285964488983e-05, -1.666322350502014e-05, -1.28941610455513e-05, -9.125098586082458e-06, -5.356036126613617e-06, -1.5869736671447754e-06, 2.182088792324066e-06, 5.951151251792908e-06, 9.72021371126175e-06, 1.348927617073059e-05, 1.7258338630199432e-05, 2.1027401089668274e-05, 2.4796463549137115e-05, 2.8565526008605957e-05, 3.23345884680748e-05, 3.610365092754364e-05, 3.987271338701248e-05, 4.364177584648132e-05, 4.7410838305950165e-05, 5.1179900765419006e-05, 5.494896322488785e-05, 5.871802568435669e-05, 6.248708814382553e-05, 6.625615060329437e-05, 7.002521306276321e-05, 7.379427552223206e-05, 7.75633379817009e-05, 8.133240044116974e-05, 8.510146290063858e-05, 8.887052536010742e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 9.0, 10.0, 14.0, 16.0, 37.0, 52.0, 127.0, 360.0, 1321.0, 7883.0, 240045.0, 784219.0, 11843.0, 1797.0, 458.0, 168.0, 91.0, 33.0, 19.0, 9.0, 15.0, 8.0, 8.0, 3.0, 4.0, 0.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.595703125, -0.569915771484375, -0.54412841796875, -0.518341064453125, -0.4925537109375, -0.466766357421875, -0.44097900390625, -0.415191650390625, -0.389404296875, -0.363616943359375, -0.33782958984375, -0.312042236328125, -0.2862548828125, -0.260467529296875, -0.23468017578125, -0.208892822265625, -0.18310546875, -0.157318115234375, -0.13153076171875, -0.105743408203125, -0.0799560546875, -0.054168701171875, -0.02838134765625, -0.002593994140625, 0.023193359375, 0.048980712890625, 0.07476806640625, 0.100555419921875, 0.1263427734375, 0.152130126953125, 0.17791748046875, 0.203704833984375, 0.2294921875, 0.255279541015625, 0.28106689453125, 0.306854248046875, 0.3326416015625, 0.358428955078125, 0.38421630859375, 0.410003662109375, 0.435791015625, 0.461578369140625, 0.48736572265625, 0.513153076171875, 0.5389404296875, 0.564727783203125, 0.59051513671875, 0.616302490234375, 0.64208984375, 0.667877197265625, 0.69366455078125, 0.719451904296875, 0.7452392578125, 0.771026611328125, 0.79681396484375, 0.822601318359375, 0.848388671875, 0.874176025390625, 0.89996337890625, 0.925750732421875, 0.9515380859375, 0.977325439453125, 1.00311279296875, 1.028900146484375, 1.0546875]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 5.0, 5.0, 12.0, 7.0, 14.0, 16.0, 42.0, 57.0, 93.0, 159.0, 183.0, 146.0, 90.0, 58.0, 30.0, 27.0, 11.0, 12.0, 2.0, 2.0, 9.0, 4.0, 3.0, 6.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.134521484375, -0.12923049926757812, -0.12393951416015625, -0.11864852905273438, -0.1133575439453125, -0.10806655883789062, -0.10277557373046875, -0.09748458862304688, -0.092193603515625, -0.08690261840820312, -0.08161163330078125, -0.07632064819335938, -0.0710296630859375, -0.06573867797851562, -0.06044769287109375, -0.055156707763671875, -0.04986572265625, -0.044574737548828125, -0.03928375244140625, -0.033992767333984375, -0.0287017822265625, -0.023410797119140625, -0.01811981201171875, -0.012828826904296875, -0.007537841796875, -0.002246856689453125, 0.00304412841796875, 0.008335113525390625, 0.0136260986328125, 0.018917083740234375, 0.02420806884765625, 0.029499053955078125, 0.0347900390625, 0.040081024169921875, 0.04537200927734375, 0.050662994384765625, 0.0559539794921875, 0.061244964599609375, 0.06653594970703125, 0.07182693481445312, 0.077117919921875, 0.08240890502929688, 0.08769989013671875, 0.09299087524414062, 0.0982818603515625, 0.10357284545898438, 0.10886383056640625, 0.11415481567382812, 0.11944580078125, 0.12473678588867188, 0.13002777099609375, 0.13531875610351562, 0.1406097412109375, 0.14590072631835938, 0.15119171142578125, 0.15648269653320312, 0.161773681640625, 0.16706466674804688, 0.17235565185546875, 0.17764663696289062, 0.1829376220703125, 0.18822860717773438, 0.19351959228515625, 0.19881057739257812, 0.2041015625]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 6.0, 4.0, 14.0, 10.0, 22.0, 38.0, 55.0, 95.0, 111.0, 143.0, 150.0, 118.0, 79.0, 50.0, 30.0, 34.0, 16.0, 5.0, 8.0, 6.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.339508056640625, -1.280866265296936, -1.222224473953247, -1.1635828018188477, -1.1049410104751587, -1.0462992191314697, -0.9876574277877808, -0.9290156364440918, -0.8703739047050476, -0.8117321133613586, -0.7530903816223145, -0.6944485902786255, -0.6358067989349365, -0.5771650671958923, -0.5185232758522034, -0.4598815143108368, -0.4012397527694702, -0.34259799122810364, -0.28395622968673706, -0.2253144383430481, -0.16667267680168152, -0.10803091526031494, -0.04938912391662598, 0.0092526376247406, 0.06789439916610718, 0.12653616070747375, 0.18517793715000153, 0.2438197135925293, 0.3024614751338959, 0.36110323667526245, 0.4197450280189514, 0.478386789560318, 0.5370285511016846, 0.5956703424453735, 0.6543120741844177, 0.7129538655281067, 0.7715955972671509, 0.8302373886108398, 0.8888791799545288, 0.9475209712982178, 1.0061626434326172, 1.0648044347763062, 1.1234462261199951, 1.1820878982543945, 1.2407296895980835, 1.2993714809417725, 1.3580132722854614, 1.4166550636291504, 1.4752968549728394, 1.5339386463165283, 1.5925804376602173, 1.6512222290039062, 1.7098639011383057, 1.7685056924819946, 1.8271474838256836, 1.8857892751693726, 1.9444310665130615, 2.003072738647461, 2.0617146492004395, 2.120356321334839, 2.1789982318878174, 2.237639904022217, 2.2962818145751953, 2.3549234867095947, 2.413565158843994]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 9.0, 5.0, 4.0, 14.0, 6.0, 8.0, 15.0, 17.0, 21.0, 20.0, 26.0, 30.0, 35.0, 32.0, 41.0, 32.0, 42.0, 35.0, 45.0, 46.0, 49.0, 34.0, 42.0, 32.0, 29.0, 48.0, 35.0, 39.0, 29.0, 30.0, 15.0, 24.0, 19.0, 16.0, 11.0, 12.0, 11.0, 4.0, 9.0, 7.0, 4.0, 2.0, 2.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.6911041736602783, -1.6398669481277466, -1.5886297225952148, -1.537392497062683, -1.4861552715301514, -1.4349180459976196, -1.383680820465088, -1.3324435949325562, -1.2812063694000244, -1.2299691438674927, -1.178731918334961, -1.1274946928024292, -1.0762574672698975, -1.0250202417373657, -0.973783016204834, -0.9225457906723022, -0.8713085651397705, -0.8200713396072388, -0.768834114074707, -0.7175968885421753, -0.6663596630096436, -0.6151224374771118, -0.5638852119445801, -0.5126479864120483, -0.4614107608795166, -0.41017353534698486, -0.3589363098144531, -0.3076990842819214, -0.25646185874938965, -0.2052246332168579, -0.15398740768432617, -0.10275018215179443, -0.051512956619262695, -0.00027573108673095703, 0.05096149444580078, 0.10219871997833252, 0.15343594551086426, 0.204673171043396, 0.25591039657592773, 0.3071476221084595, 0.3583848476409912, 0.40962207317352295, 0.4608592987060547, 0.5120965242385864, 0.5633337497711182, 0.6145709753036499, 0.6658082008361816, 0.7170454263687134, 0.7682826519012451, 0.8195198774337769, 0.8707571029663086, 0.9219943284988403, 0.9732315540313721, 1.0244687795639038, 1.0757060050964355, 1.1269432306289673, 1.178180456161499, 1.2294176816940308, 1.2806549072265625, 1.3318921327590942, 1.383129358291626, 1.4343665838241577, 1.4856038093566895, 1.5368410348892212, 1.588078260421753]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 4.0, 7.0, 8.0, 13.0, 27.0, 33.0, 43.0, 89.0, 170.0, 295.0, 681.0, 1893.0, 6280.0, 50239.0, 2522104.0, 1566789.0, 34928.0, 6570.0, 2331.0, 892.0, 399.0, 202.0, 119.0, 56.0, 36.0, 16.0, 21.0, 14.0, 4.0, 5.0, 4.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.173828125, -2.1207275390625, -2.067626953125, -2.0145263671875, -1.96142578125, -1.9083251953125, -1.855224609375, -1.8021240234375, -1.7490234375, -1.6959228515625, -1.642822265625, -1.5897216796875, -1.53662109375, -1.4835205078125, -1.430419921875, -1.3773193359375, -1.32421875, -1.2711181640625, -1.218017578125, -1.1649169921875, -1.11181640625, -1.0587158203125, -1.005615234375, -0.9525146484375, -0.8994140625, -0.8463134765625, -0.793212890625, -0.7401123046875, -0.68701171875, -0.6339111328125, -0.580810546875, -0.5277099609375, -0.474609375, -0.4215087890625, -0.368408203125, -0.3153076171875, -0.26220703125, -0.2091064453125, -0.156005859375, -0.1029052734375, -0.0498046875, 0.0032958984375, 0.056396484375, 0.1094970703125, 0.16259765625, 0.2156982421875, 0.268798828125, 0.3218994140625, 0.375, 0.4281005859375, 0.481201171875, 0.5343017578125, 0.58740234375, 0.6405029296875, 0.693603515625, 0.7467041015625, 0.7998046875, 0.8529052734375, 0.906005859375, 0.9591064453125, 1.01220703125, 1.0653076171875, 1.118408203125, 1.1715087890625, 1.224609375]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 6.0, 5.0, 9.0, 16.0, 24.0, 35.0, 32.0, 71.0, 68.0, 92.0, 104.0, 115.0, 104.0, 80.0, 65.0, 53.0, 44.0, 27.0, 21.0, 11.0, 10.0, 6.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6298828125, -1.5938796997070312, -1.5578765869140625, -1.5218734741210938, -1.485870361328125, -1.4498672485351562, -1.4138641357421875, -1.3778610229492188, -1.34185791015625, -1.3058547973632812, -1.2698516845703125, -1.2338485717773438, -1.197845458984375, -1.1618423461914062, -1.1258392333984375, -1.0898361206054688, -1.0538330078125, -1.0178298950195312, -0.9818267822265625, -0.9458236694335938, -0.909820556640625, -0.8738174438476562, -0.8378143310546875, -0.8018112182617188, -0.76580810546875, -0.7298049926757812, -0.6938018798828125, -0.6577987670898438, -0.621795654296875, -0.5857925415039062, -0.5497894287109375, -0.5137863159179688, -0.477783203125, -0.44178009033203125, -0.4057769775390625, -0.36977386474609375, -0.333770751953125, -0.29776763916015625, -0.2617645263671875, -0.22576141357421875, -0.18975830078125, -0.15375518798828125, -0.1177520751953125, -0.08174896240234375, -0.045745849609375, -0.00974273681640625, 0.0262603759765625, 0.06226348876953125, 0.0982666015625, 0.13426971435546875, 0.1702728271484375, 0.20627593994140625, 0.242279052734375, 0.27828216552734375, 0.3142852783203125, 0.35028839111328125, 0.38629150390625, 0.42229461669921875, 0.4582977294921875, 0.49430084228515625, 0.530303955078125, 0.5663070678710938, 0.6023101806640625, 0.6383132934570312, 0.67431640625]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 9.0, 12.0, 13.0, 22.0, 39.0, 58.0, 78.0, 140.0, 243.0, 457.0, 907.0, 2191.0, 6502.0, 27335.0, 279063.0, 3613119.0, 228686.0, 25127.0, 6144.0, 2174.0, 862.0, 418.0, 246.0, 137.0, 93.0, 63.0, 43.0, 24.0, 22.0, 13.0, 9.0, 8.0, 8.0, 7.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1240234375, -1.0904388427734375, -1.056854248046875, -1.0232696533203125, -0.98968505859375, -0.9561004638671875, -0.922515869140625, -0.8889312744140625, -0.8553466796875, -0.8217620849609375, -0.788177490234375, -0.7545928955078125, -0.72100830078125, -0.6874237060546875, -0.653839111328125, -0.6202545166015625, -0.586669921875, -0.5530853271484375, -0.519500732421875, -0.4859161376953125, -0.45233154296875, -0.4187469482421875, -0.385162353515625, -0.3515777587890625, -0.3179931640625, -0.2844085693359375, -0.250823974609375, -0.2172393798828125, -0.18365478515625, -0.1500701904296875, -0.116485595703125, -0.0829010009765625, -0.04931640625, -0.0157318115234375, 0.017852783203125, 0.0514373779296875, 0.08502197265625, 0.1186065673828125, 0.152191162109375, 0.1857757568359375, 0.2193603515625, 0.2529449462890625, 0.286529541015625, 0.3201141357421875, 0.35369873046875, 0.3872833251953125, 0.420867919921875, 0.4544525146484375, 0.488037109375, 0.5216217041015625, 0.555206298828125, 0.5887908935546875, 0.62237548828125, 0.6559600830078125, 0.689544677734375, 0.7231292724609375, 0.7567138671875, 0.7902984619140625, 0.823883056640625, 0.8574676513671875, 0.89105224609375, 0.9246368408203125, 0.958221435546875, 0.9918060302734375, 1.025390625]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 1.0, 5.0, 13.0, 16.0, 15.0, 16.0, 19.0, 22.0, 31.0, 43.0, 48.0, 95.0, 138.0, 237.0, 379.0, 569.0, 627.0, 561.0, 420.0, 279.0, 186.0, 117.0, 57.0, 43.0, 40.0, 27.0, 20.0, 11.0, 6.0, 9.0, 1.0, 4.0, 6.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.242919921875, -0.23547935485839844, -0.22803878784179688, -0.2205982208251953, -0.21315765380859375, -0.2057170867919922, -0.19827651977539062, -0.19083595275878906, -0.1833953857421875, -0.17595481872558594, -0.16851425170898438, -0.1610736846923828, -0.15363311767578125, -0.1461925506591797, -0.13875198364257812, -0.13131141662597656, -0.123870849609375, -0.11643028259277344, -0.10898971557617188, -0.10154914855957031, -0.09410858154296875, -0.08666801452636719, -0.07922744750976562, -0.07178688049316406, -0.0643463134765625, -0.05690574645996094, -0.049465179443359375, -0.04202461242675781, -0.03458404541015625, -0.027143478393554688, -0.019702911376953125, -0.012262344360351562, -0.00482177734375, 0.0026187896728515625, 0.010059356689453125, 0.017499923706054688, 0.02494049072265625, 0.03238105773925781, 0.039821624755859375, 0.04726219177246094, 0.0547027587890625, 0.06214332580566406, 0.06958389282226562, 0.07702445983886719, 0.08446502685546875, 0.09190559387207031, 0.09934616088867188, 0.10678672790527344, 0.114227294921875, 0.12166786193847656, 0.12910842895507812, 0.1365489959716797, 0.14398956298828125, 0.1514301300048828, 0.15887069702148438, 0.16631126403808594, 0.1737518310546875, 0.18119239807128906, 0.18863296508789062, 0.1960735321044922, 0.20351409912109375, 0.2109546661376953, 0.21839523315429688, 0.22583580017089844, 0.2332763671875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 6.0, 7.0, 4.0, 5.0, 15.0, 22.0, 21.0, 46.0, 49.0, 107.0, 119.0, 129.0, 132.0, 104.0, 82.0, 58.0, 29.0, 29.0, 16.0, 14.0, 9.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9102871417999268, -0.8685171008110046, -0.8267470598220825, -0.7849770188331604, -0.7432069778442383, -0.7014369368553162, -0.659666895866394, -0.6178968548774719, -0.5761268138885498, -0.5343567728996277, -0.49258673191070557, -0.45081669092178345, -0.40904664993286133, -0.3672766089439392, -0.3255065679550171, -0.28373652696609497, -0.24196648597717285, -0.20019644498825073, -0.1584264039993286, -0.1166563630104065, -0.07488632202148438, -0.033116281032562256, 0.008653759956359863, 0.05042380094528198, 0.0921938419342041, 0.13396388292312622, 0.17573392391204834, 0.21750396490097046, 0.2592740058898926, 0.3010440468788147, 0.3428140878677368, 0.38458412885665894, 0.4263540506362915, 0.4681240916252136, 0.5098941326141357, 0.5516641736030579, 0.59343421459198, 0.6352042555809021, 0.6769742965698242, 0.7187443375587463, 0.7605143785476685, 0.8022844195365906, 0.8440544605255127, 0.8858245015144348, 0.9275945425033569, 0.969364583492279, 1.0111346244812012, 1.0529046058654785, 1.0946747064590454, 1.1364448070526123, 1.1782147884368896, 1.219984769821167, 1.2617548704147339, 1.3035249710083008, 1.3452949523925781, 1.3870649337768555, 1.4288350343704224, 1.4706051349639893, 1.5123751163482666, 1.554145097732544, 1.5959151983261108, 1.6376852989196777, 1.679455280303955, 1.7212252616882324, 1.7629953622817993]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 10.0, 2.0, 3.0, 6.0, 13.0, 13.0, 15.0, 18.0, 25.0, 38.0, 34.0, 45.0, 47.0, 48.0, 68.0, 46.0, 64.0, 45.0, 58.0, 47.0, 52.0, 51.0, 45.0, 34.0, 36.0, 22.0, 19.0, 21.0, 15.0, 14.0, 13.0, 14.0, 5.0, 3.0, 3.0, 2.0, 5.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.8779414296150208, -0.855319619178772, -0.8326977491378784, -0.8100759387016296, -0.7874541282653809, -0.7648323178291321, -0.7422104477882385, -0.7195886373519897, -0.696966826915741, -0.6743450164794922, -0.6517231464385986, -0.6291013360023499, -0.6064795255661011, -0.5838577151298523, -0.5612358450889587, -0.53861403465271, -0.5159921646118164, -0.49337032437324524, -0.47074851393699646, -0.4481266736984253, -0.4255048632621765, -0.40288302302360535, -0.3802611827850342, -0.3576393723487854, -0.3350175619125366, -0.31239572167396545, -0.2897739112377167, -0.2671520709991455, -0.24453026056289673, -0.22190842032432556, -0.1992865949869156, -0.17666476964950562, -0.15404295921325684, -0.13142113387584686, -0.10879930853843689, -0.08617747575044632, -0.06355565041303635, -0.04093382507562637, -0.018311992287635803, 0.00430983304977417, 0.026931658387184143, 0.049553483724594116, 0.07217530906200409, 0.09479714184999466, 0.11741896718740463, 0.140040785074234, 0.16266262531280518, 0.18528445065021515, 0.20790627598762512, 0.2305281013250351, 0.25314992666244507, 0.27577176690101624, 0.298393577337265, 0.3210154175758362, 0.34363722801208496, 0.36625906825065613, 0.3888809084892273, 0.41150274872779846, 0.43412455916404724, 0.4567463994026184, 0.4793682098388672, 0.501990020275116, 0.5246118903160095, 0.5472337007522583, 0.5698555111885071]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 10.0, 8.0, 10.0, 19.0, 26.0, 41.0, 83.0, 123.0, 287.0, 777.0, 2464.0, 10343.0, 69177.0, 539212.0, 374234.0, 41678.0, 7060.0, 1872.0, 592.0, 235.0, 121.0, 60.0, 36.0, 28.0, 14.0, 12.0, 12.0, 5.0, 2.0, 5.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.189453125, -0.1818389892578125, -0.174224853515625, -0.1666107177734375, -0.15899658203125, -0.1513824462890625, -0.143768310546875, -0.1361541748046875, -0.1285400390625, -0.1209259033203125, -0.113311767578125, -0.1056976318359375, -0.09808349609375, -0.0904693603515625, -0.082855224609375, -0.0752410888671875, -0.067626953125, -0.0600128173828125, -0.052398681640625, -0.0447845458984375, -0.03717041015625, -0.0295562744140625, -0.021942138671875, -0.0143280029296875, -0.0067138671875, 0.0009002685546875, 0.008514404296875, 0.0161285400390625, 0.02374267578125, 0.0313568115234375, 0.038970947265625, 0.0465850830078125, 0.05419921875, 0.0618133544921875, 0.069427490234375, 0.0770416259765625, 0.08465576171875, 0.0922698974609375, 0.099884033203125, 0.1074981689453125, 0.1151123046875, 0.1227264404296875, 0.130340576171875, 0.1379547119140625, 0.14556884765625, 0.1531829833984375, 0.160797119140625, 0.1684112548828125, 0.176025390625, 0.1836395263671875, 0.191253662109375, 0.1988677978515625, 0.20648193359375, 0.2140960693359375, 0.221710205078125, 0.2293243408203125, 0.2369384765625, 0.2445526123046875, 0.252166748046875, 0.2597808837890625, 0.26739501953125, 0.2750091552734375, 0.282623291015625, 0.2902374267578125, 0.2978515625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 5.0, 8.0, 12.0, 22.0, 24.0, 18.0, 38.0, 43.0, 67.0, 94.0, 84.0, 91.0, 71.0, 85.0, 70.0, 72.0, 48.0, 36.0, 30.0, 24.0, 20.0, 14.0, 5.0, 8.0, 4.0, 8.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.064453125, -1.0402946472167969, -1.0161361694335938, -0.9919776916503906, -0.9678192138671875, -0.9436607360839844, -0.9195022583007812, -0.8953437805175781, -0.871185302734375, -0.8470268249511719, -0.8228683471679688, -0.7987098693847656, -0.7745513916015625, -0.7503929138183594, -0.7262344360351562, -0.7020759582519531, -0.67791748046875, -0.6537590026855469, -0.6296005249023438, -0.6054420471191406, -0.5812835693359375, -0.5571250915527344, -0.5329666137695312, -0.5088081359863281, -0.484649658203125, -0.4604911804199219, -0.43633270263671875, -0.4121742248535156, -0.3880157470703125, -0.3638572692871094, -0.33969879150390625, -0.3155403137207031, -0.2913818359375, -0.2672233581542969, -0.24306488037109375, -0.21890640258789062, -0.1947479248046875, -0.17058944702148438, -0.14643096923828125, -0.12227249145507812, -0.098114013671875, -0.07395553588867188, -0.04979705810546875, -0.025638580322265625, -0.0014801025390625, 0.022678375244140625, 0.04683685302734375, 0.07099533081054688, 0.09515380859375, 0.11931228637695312, 0.14347076416015625, 0.16762924194335938, 0.1917877197265625, 0.21594619750976562, 0.24010467529296875, 0.2642631530761719, 0.288421630859375, 0.3125801086425781, 0.33673858642578125, 0.3608970642089844, 0.3850555419921875, 0.4092140197753906, 0.43337249755859375, 0.4575309753417969, 0.481689453125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 7.0, 4.0, 7.0, 6.0, 2.0, 7.0, 8.0, 15.0, 15.0, 23.0, 18.0, 37.0, 59.0, 60.0, 124.0, 168.0, 234.0, 361.0, 713.0, 1434.0, 3219.0, 8960.0, 30520.0, 125968.0, 405953.0, 341455.0, 92898.0, 23385.0, 7190.0, 2643.0, 1300.0, 609.0, 410.0, 229.0, 142.0, 103.0, 70.0, 54.0, 44.0, 24.0, 14.0, 17.0, 15.0, 6.0, 10.0, 2.0, 4.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.13916015625, -0.13492965698242188, -0.13069915771484375, -0.12646865844726562, -0.1222381591796875, -0.11800765991210938, -0.11377716064453125, -0.10954666137695312, -0.105316162109375, -0.10108566284179688, -0.09685516357421875, -0.09262466430664062, -0.0883941650390625, -0.08416366577148438, -0.07993316650390625, -0.07570266723632812, -0.07147216796875, -0.06724166870117188, -0.06301116943359375, -0.058780670166015625, -0.0545501708984375, -0.050319671630859375, -0.04608917236328125, -0.041858673095703125, -0.037628173828125, -0.033397674560546875, -0.02916717529296875, -0.024936676025390625, -0.0207061767578125, -0.016475677490234375, -0.01224517822265625, -0.008014678955078125, -0.0037841796875, 0.000446319580078125, 0.00467681884765625, 0.008907318115234375, 0.0131378173828125, 0.017368316650390625, 0.02159881591796875, 0.025829315185546875, 0.030059814453125, 0.034290313720703125, 0.03852081298828125, 0.042751312255859375, 0.0469818115234375, 0.051212310791015625, 0.05544281005859375, 0.059673309326171875, 0.06390380859375, 0.06813430786132812, 0.07236480712890625, 0.07659530639648438, 0.0808258056640625, 0.08505630493164062, 0.08928680419921875, 0.09351730346679688, 0.097747802734375, 0.10197830200195312, 0.10620880126953125, 0.11043930053710938, 0.1146697998046875, 0.11890029907226562, 0.12313079833984375, 0.12736129760742188, 0.131591796875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 6.0, 1.0, 2.0, 9.0, 7.0, 19.0, 11.0, 16.0, 20.0, 17.0, 19.0, 37.0, 32.0, 34.0, 60.0, 32.0, 49.0, 52.0, 38.0, 43.0, 44.0, 53.0, 47.0, 28.0, 39.0, 46.0, 36.0, 24.0, 25.0, 26.0, 23.0, 15.0, 19.0, 10.0, 16.0, 10.0, 6.0, 9.0, 7.0, 6.0, 3.0, 4.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7255859375, -0.6997909545898438, -0.6739959716796875, -0.6482009887695312, -0.622406005859375, -0.5966110229492188, -0.5708160400390625, -0.5450210571289062, -0.51922607421875, -0.49343109130859375, -0.4676361083984375, -0.44184112548828125, -0.416046142578125, -0.39025115966796875, -0.3644561767578125, -0.33866119384765625, -0.3128662109375, -0.28707122802734375, -0.2612762451171875, -0.23548126220703125, -0.209686279296875, -0.18389129638671875, -0.1580963134765625, -0.13230133056640625, -0.10650634765625, -0.08071136474609375, -0.0549163818359375, -0.02912139892578125, -0.003326416015625, 0.02246856689453125, 0.0482635498046875, 0.07405853271484375, 0.099853515625, 0.12564849853515625, 0.1514434814453125, 0.17723846435546875, 0.203033447265625, 0.22882843017578125, 0.2546234130859375, 0.28041839599609375, 0.30621337890625, 0.33200836181640625, 0.3578033447265625, 0.38359832763671875, 0.409393310546875, 0.43518829345703125, 0.4609832763671875, 0.48677825927734375, 0.5125732421875, 0.5383682250976562, 0.5641632080078125, 0.5899581909179688, 0.615753173828125, 0.6415481567382812, 0.6673431396484375, 0.6931381225585938, 0.71893310546875, 0.7447280883789062, 0.7705230712890625, 0.7963180541992188, 0.822113037109375, 0.8479080200195312, 0.8737030029296875, 0.8994979858398438, 0.92529296875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 8.0, 7.0, 12.0, 14.0, 32.0, 30.0, 43.0, 82.0, 135.0, 245.0, 437.0, 832.0, 1762.0, 4264.0, 14784.0, 87965.0, 548278.0, 332605.0, 42443.0, 8920.0, 2987.0, 1236.0, 606.0, 309.0, 174.0, 102.0, 81.0, 45.0, 25.0, 20.0, 12.0, 12.0, 10.0, 9.0, 5.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.05792236328125, -0.05597972869873047, -0.05403709411621094, -0.052094459533691406, -0.050151824951171875, -0.048209190368652344, -0.04626655578613281, -0.04432392120361328, -0.04238128662109375, -0.04043865203857422, -0.03849601745605469, -0.036553382873535156, -0.034610748291015625, -0.032668113708496094, -0.030725479125976562, -0.02878284454345703, -0.0268402099609375, -0.02489757537841797, -0.022954940795898438, -0.021012306213378906, -0.019069671630859375, -0.017127037048339844, -0.015184402465820312, -0.013241767883300781, -0.01129913330078125, -0.009356498718261719, -0.0074138641357421875, -0.005471229553222656, -0.003528594970703125, -0.0015859603881835938, 0.0003566741943359375, 0.0022993087768554688, 0.004241943359375, 0.006184577941894531, 0.008127212524414062, 0.010069847106933594, 0.012012481689453125, 0.013955116271972656, 0.015897750854492188, 0.01784038543701172, 0.01978302001953125, 0.02172565460205078, 0.023668289184570312, 0.025610923767089844, 0.027553558349609375, 0.029496192932128906, 0.03143882751464844, 0.03338146209716797, 0.0353240966796875, 0.03726673126220703, 0.03920936584472656, 0.041152000427246094, 0.043094635009765625, 0.045037269592285156, 0.04697990417480469, 0.04892253875732422, 0.05086517333984375, 0.05280780792236328, 0.05475044250488281, 0.056693077087402344, 0.058635711669921875, 0.060578346252441406, 0.06252098083496094, 0.06446361541748047, 0.06640625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 10.0, 7.0, 13.0, 24.0, 40.0, 49.0, 73.0, 93.0, 139.0, 127.0, 125.0, 97.0, 74.0, 51.0, 41.0, 20.0, 7.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.319978713989258e-05, -3.207474946975708e-05, -3.094971179962158e-05, -2.9824674129486084e-05, -2.8699636459350586e-05, -2.7574598789215088e-05, -2.644956111907959e-05, -2.5324523448944092e-05, -2.4199485778808594e-05, -2.3074448108673096e-05, -2.1949410438537598e-05, -2.08243727684021e-05, -1.96993350982666e-05, -1.8574297428131104e-05, -1.7449259757995605e-05, -1.6324222087860107e-05, -1.519918441772461e-05, -1.4074146747589111e-05, -1.2949109077453613e-05, -1.1824071407318115e-05, -1.0699033737182617e-05, -9.573996067047119e-06, -8.448958396911621e-06, -7.323920726776123e-06, -6.198883056640625e-06, -5.073845386505127e-06, -3.948807716369629e-06, -2.823770046234131e-06, -1.6987323760986328e-06, -5.736947059631348e-07, 5.513429641723633e-07, 1.6763806343078613e-06, 2.8014183044433594e-06, 3.926455974578857e-06, 5.0514936447143555e-06, 6.1765313148498535e-06, 7.3015689849853516e-06, 8.42660665512085e-06, 9.551644325256348e-06, 1.0676681995391846e-05, 1.1801719665527344e-05, 1.2926757335662842e-05, 1.405179500579834e-05, 1.5176832675933838e-05, 1.6301870346069336e-05, 1.7426908016204834e-05, 1.8551945686340332e-05, 1.967698335647583e-05, 2.0802021026611328e-05, 2.1927058696746826e-05, 2.3052096366882324e-05, 2.4177134037017822e-05, 2.530217170715332e-05, 2.642720937728882e-05, 2.7552247047424316e-05, 2.8677284717559814e-05, 2.9802322387695312e-05, 3.092736005783081e-05, 3.205239772796631e-05, 3.317743539810181e-05, 3.4302473068237305e-05, 3.54275107383728e-05, 3.65525484085083e-05, 3.76775860786438e-05, 3.88026237487793e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 7.0, 9.0, 25.0, 31.0, 52.0, 84.0, 188.0, 330.0, 681.0, 1770.0, 6500.0, 37733.0, 311363.0, 573237.0, 98336.0, 13108.0, 3098.0, 1019.0, 451.0, 217.0, 124.0, 73.0, 41.0, 26.0, 16.0, 12.0, 3.0, 5.0, 1.0, 6.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08538818359375, -0.08321142196655273, -0.08103466033935547, -0.0788578987121582, -0.07668113708496094, -0.07450437545776367, -0.0723276138305664, -0.07015085220336914, -0.06797409057617188, -0.06579732894897461, -0.06362056732177734, -0.06144380569458008, -0.05926704406738281, -0.05709028244018555, -0.05491352081298828, -0.052736759185791016, -0.05055999755859375, -0.048383235931396484, -0.04620647430419922, -0.04402971267700195, -0.04185295104980469, -0.03967618942260742, -0.037499427795410156, -0.03532266616821289, -0.033145904541015625, -0.03096914291381836, -0.028792381286621094, -0.026615619659423828, -0.024438858032226562, -0.022262096405029297, -0.02008533477783203, -0.017908573150634766, -0.0157318115234375, -0.013555049896240234, -0.011378288269042969, -0.009201526641845703, -0.0070247650146484375, -0.004848003387451172, -0.0026712417602539062, -0.0004944801330566406, 0.001682281494140625, 0.0038590431213378906, 0.006035804748535156, 0.008212566375732422, 0.010389328002929688, 0.012566089630126953, 0.014742851257324219, 0.016919612884521484, 0.01909637451171875, 0.021273136138916016, 0.02344989776611328, 0.025626659393310547, 0.027803421020507812, 0.029980182647705078, 0.032156944274902344, 0.03433370590209961, 0.036510467529296875, 0.03868722915649414, 0.040863990783691406, 0.04304075241088867, 0.04521751403808594, 0.0473942756652832, 0.04957103729248047, 0.051747798919677734, 0.053924560546875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 6.0, 5.0, 10.0, 14.0, 23.0, 29.0, 50.0, 50.0, 67.0, 83.0, 97.0, 109.0, 102.0, 92.0, 67.0, 58.0, 42.0, 26.0, 26.0, 15.0, 9.0, 8.0, 7.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0243682861328125, -0.0238112211227417, -0.0232541561126709, -0.022697091102600098, -0.022140026092529297, -0.021582961082458496, -0.021025896072387695, -0.020468831062316895, -0.019911766052246094, -0.019354701042175293, -0.018797636032104492, -0.01824057102203369, -0.01768350601196289, -0.01712644100189209, -0.01656937599182129, -0.01601231098175049, -0.015455245971679688, -0.014898180961608887, -0.014341115951538086, -0.013784050941467285, -0.013226985931396484, -0.012669920921325684, -0.012112855911254883, -0.011555790901184082, -0.010998725891113281, -0.01044166088104248, -0.00988459587097168, -0.009327530860900879, -0.008770465850830078, -0.008213400840759277, -0.0076563358306884766, -0.007099270820617676, -0.006542205810546875, -0.005985140800476074, -0.0054280757904052734, -0.004871010780334473, -0.004313945770263672, -0.003756880760192871, -0.0031998157501220703, -0.0026427507400512695, -0.0020856857299804688, -0.001528620719909668, -0.0009715557098388672, -0.0004144906997680664, 0.00014257431030273438, 0.0006996393203735352, 0.001256704330444336, 0.0018137693405151367, 0.0023708343505859375, 0.0029278993606567383, 0.003484964370727539, 0.00404202938079834, 0.004599094390869141, 0.005156159400939941, 0.005713224411010742, 0.006270289421081543, 0.006827354431152344, 0.0073844194412231445, 0.007941484451293945, 0.008498549461364746, 0.009055614471435547, 0.009612679481506348, 0.010169744491577148, 0.01072680950164795, 0.01128387451171875]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 9.0, 5.0, 13.0, 18.0, 27.0, 45.0, 70.0, 105.0, 163.0, 150.0, 142.0, 102.0, 54.0, 39.0, 27.0, 15.0, 6.0, 10.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7070823907852173, -0.6754773855209351, -0.6438724398612976, -0.6122674345970154, -0.5806624889373779, -0.5490574836730957, -0.5174524784088135, -0.48584750294685364, -0.4542425274848938, -0.42263755202293396, -0.3910325765609741, -0.3594275712966919, -0.32782259583473206, -0.2962176203727722, -0.26461261510849, -0.23300763964653015, -0.2014026641845703, -0.16979768872261047, -0.13819269835948944, -0.106587715446949, -0.07498273253440857, -0.04337775707244873, -0.011772766709327698, 0.019832223653793335, 0.051437199115753174, 0.08304218202829361, 0.11464716494083405, 0.14625215530395508, 0.17785713076591492, 0.20946210622787476, 0.2410670965909958, 0.2726720869541168, 0.3042771816253662, 0.33588215708732605, 0.3674871325492859, 0.3990921378135681, 0.43069711327552795, 0.4623020887374878, 0.49390709400177, 0.5255120992660522, 0.5571170449256897, 0.5887220501899719, 0.6203269958496094, 0.6519320011138916, 0.6835370063781738, 0.7151419520378113, 0.7467469573020935, 0.778351902961731, 0.8099569082260132, 0.8415619134902954, 0.8731668591499329, 0.9047718644142151, 0.9363768100738525, 0.9679818153381348, 0.999586820602417, 1.0311918258666992, 1.0627968311309814, 1.0944018363952637, 1.126006841659546, 1.1576117277145386, 1.1892167329788208, 1.220821738243103, 1.2524267435073853, 1.2840317487716675, 1.3156366348266602]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 7.0, 2.0, 2.0, 5.0, 11.0, 15.0, 23.0, 16.0, 29.0, 26.0, 45.0, 43.0, 59.0, 64.0, 54.0, 73.0, 52.0, 67.0, 50.0, 61.0, 51.0, 48.0, 43.0, 26.0, 26.0, 21.0, 20.0, 10.0, 11.0, 17.0, 6.0, 4.0, 2.0, 0.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.6449584364891052, -0.6277809739112854, -0.6106034517288208, -0.593425989151001, -0.5762484669685364, -0.5590710043907166, -0.541893482208252, -0.5247160196304321, -0.5075385570526123, -0.4903610646724701, -0.4731835722923279, -0.45600610971450806, -0.43882861733436584, -0.42165112495422363, -0.4044736325740814, -0.3872961401939392, -0.370118647813797, -0.3529411554336548, -0.3357636630535126, -0.31858617067337036, -0.30140870809555054, -0.2842312157154083, -0.2670537233352661, -0.2498762309551239, -0.23269875347614288, -0.21552126109600067, -0.19834378361701965, -0.18116629123687744, -0.16398879885673523, -0.1468113213777542, -0.129633828997612, -0.11245634406805038, -0.09527882933616638, -0.07810134440660477, -0.06092385575175285, -0.04374636709690094, -0.026568882167339325, -0.00939139723777771, 0.007786095142364502, 0.024963580071926117, 0.04214106500148773, 0.05931854993104935, 0.07649603486061096, 0.09367352724075317, 0.11085101217031479, 0.1280284970998764, 0.14520598948001862, 0.16238346695899963, 0.17956095933914185, 0.19673845171928406, 0.21391592919826508, 0.2310934215784073, 0.2482708990573883, 0.2654483914375305, 0.28262588381767273, 0.29980337619781494, 0.31698083877563477, 0.334158331155777, 0.3513358235359192, 0.368513286113739, 0.3856907784938812, 0.40286827087402344, 0.42004576325416565, 0.43722325563430786, 0.4544007480144501]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 3.0, 4.0, 4.0, 16.0, 14.0, 34.0, 47.0, 91.0, 169.0, 287.0, 618.0, 1432.0, 3624.0, 10432.0, 40855.0, 255057.0, 605488.0, 99305.0, 20638.0, 6145.0, 2253.0, 1009.0, 493.0, 217.0, 123.0, 82.0, 35.0, 24.0, 23.0, 11.0, 7.0, 5.0, 7.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.43505859375, -0.41783905029296875, -0.4006195068359375, -0.38339996337890625, -0.366180419921875, -0.34896087646484375, -0.3317413330078125, -0.31452178955078125, -0.29730224609375, -0.28008270263671875, -0.2628631591796875, -0.24564361572265625, -0.228424072265625, -0.21120452880859375, -0.1939849853515625, -0.17676544189453125, -0.1595458984375, -0.14232635498046875, -0.1251068115234375, -0.10788726806640625, -0.090667724609375, -0.07344818115234375, -0.0562286376953125, -0.03900909423828125, -0.02178955078125, -0.00457000732421875, 0.0126495361328125, 0.02986907958984375, 0.047088623046875, 0.06430816650390625, 0.0815277099609375, 0.09874725341796875, 0.115966796875, 0.13318634033203125, 0.1504058837890625, 0.16762542724609375, 0.184844970703125, 0.20206451416015625, 0.2192840576171875, 0.23650360107421875, 0.25372314453125, 0.27094268798828125, 0.2881622314453125, 0.30538177490234375, 0.322601318359375, 0.33982086181640625, 0.3570404052734375, 0.37425994873046875, 0.3914794921875, 0.40869903564453125, 0.4259185791015625, 0.44313812255859375, 0.460357666015625, 0.47757720947265625, 0.4947967529296875, 0.5120162963867188, 0.52923583984375, 0.5464553833007812, 0.5636749267578125, 0.5808944702148438, 0.598114013671875, 0.6153335571289062, 0.6325531005859375, 0.6497726440429688, 0.6669921875]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 3.0, 5.0, 7.0, 7.0, 9.0, 14.0, 20.0, 32.0, 31.0, 39.0, 47.0, 56.0, 58.0, 66.0, 73.0, 57.0, 71.0, 60.0, 68.0, 48.0, 49.0, 38.0, 20.0, 32.0, 25.0, 16.0, 10.0, 9.0, 9.0, 5.0, 2.0, 2.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0], "bins": [-1.5126953125, -1.475311279296875, -1.43792724609375, -1.400543212890625, -1.3631591796875, -1.325775146484375, -1.28839111328125, -1.251007080078125, -1.213623046875, -1.176239013671875, -1.13885498046875, -1.101470947265625, -1.0640869140625, -1.026702880859375, -0.98931884765625, -0.951934814453125, -0.91455078125, -0.877166748046875, -0.83978271484375, -0.802398681640625, -0.7650146484375, -0.727630615234375, -0.69024658203125, -0.652862548828125, -0.615478515625, -0.578094482421875, -0.54071044921875, -0.503326416015625, -0.4659423828125, -0.428558349609375, -0.39117431640625, -0.353790283203125, -0.31640625, -0.279022216796875, -0.24163818359375, -0.204254150390625, -0.1668701171875, -0.129486083984375, -0.09210205078125, -0.054718017578125, -0.017333984375, 0.020050048828125, 0.05743408203125, 0.094818115234375, 0.1322021484375, 0.169586181640625, 0.20697021484375, 0.244354248046875, 0.28173828125, 0.319122314453125, 0.35650634765625, 0.393890380859375, 0.4312744140625, 0.468658447265625, 0.50604248046875, 0.543426513671875, 0.580810546875, 0.618194580078125, 0.65557861328125, 0.692962646484375, 0.7303466796875, 0.767730712890625, 0.80511474609375, 0.842498779296875, 0.8798828125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 2.0, 6.0, 6.0, 12.0, 17.0, 9.0, 17.0, 26.0, 30.0, 40.0, 63.0, 83.0, 116.0, 228.0, 436.0, 1208.0, 4887.0, 44199.0, 858668.0, 126254.0, 9149.0, 1704.0, 584.0, 298.0, 161.0, 96.0, 63.0, 49.0, 33.0, 25.0, 22.0, 10.0, 17.0, 7.0, 6.0, 5.0, 1.0, 1.0, 3.0, 6.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.96826171875, -0.9394989013671875, -0.910736083984375, -0.8819732666015625, -0.85321044921875, -0.8244476318359375, -0.795684814453125, -0.7669219970703125, -0.7381591796875, -0.7093963623046875, -0.680633544921875, -0.6518707275390625, -0.62310791015625, -0.5943450927734375, -0.565582275390625, -0.5368194580078125, -0.508056640625, -0.4792938232421875, -0.450531005859375, -0.4217681884765625, -0.39300537109375, -0.3642425537109375, -0.335479736328125, -0.3067169189453125, -0.2779541015625, -0.2491912841796875, -0.220428466796875, -0.1916656494140625, -0.16290283203125, -0.1341400146484375, -0.105377197265625, -0.0766143798828125, -0.0478515625, -0.0190887451171875, 0.009674072265625, 0.0384368896484375, 0.06719970703125, 0.0959625244140625, 0.124725341796875, 0.1534881591796875, 0.1822509765625, 0.2110137939453125, 0.239776611328125, 0.2685394287109375, 0.29730224609375, 0.3260650634765625, 0.354827880859375, 0.3835906982421875, 0.412353515625, 0.4411163330078125, 0.469879150390625, 0.4986419677734375, 0.52740478515625, 0.5561676025390625, 0.584930419921875, 0.6136932373046875, 0.6424560546875, 0.6712188720703125, 0.699981689453125, 0.7287445068359375, 0.75750732421875, 0.7862701416015625, 0.815032958984375, 0.8437957763671875, 0.87255859375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 4.0, 3.0, 9.0, 4.0, 11.0, 16.0, 20.0, 22.0, 25.0, 35.0, 27.0, 39.0, 29.0, 45.0, 45.0, 56.0, 52.0, 49.0, 47.0, 46.0, 54.0, 51.0, 46.0, 37.0, 33.0, 34.0, 23.0, 25.0, 16.0, 18.0, 16.0, 15.0, 13.0, 9.0, 5.0, 8.0, 4.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.03515625, -1.0014495849609375, -0.967742919921875, -0.9340362548828125, -0.90032958984375, -0.8666229248046875, -0.832916259765625, -0.7992095947265625, -0.7655029296875, -0.7317962646484375, -0.698089599609375, -0.6643829345703125, -0.63067626953125, -0.5969696044921875, -0.563262939453125, -0.5295562744140625, -0.495849609375, -0.4621429443359375, -0.428436279296875, -0.3947296142578125, -0.36102294921875, -0.3273162841796875, -0.293609619140625, -0.2599029541015625, -0.2261962890625, -0.1924896240234375, -0.158782958984375, -0.1250762939453125, -0.09136962890625, -0.0576629638671875, -0.023956298828125, 0.0097503662109375, 0.04345703125, 0.0771636962890625, 0.110870361328125, 0.1445770263671875, 0.17828369140625, 0.2119903564453125, 0.245697021484375, 0.2794036865234375, 0.3131103515625, 0.3468170166015625, 0.380523681640625, 0.4142303466796875, 0.44793701171875, 0.4816436767578125, 0.515350341796875, 0.5490570068359375, 0.582763671875, 0.6164703369140625, 0.650177001953125, 0.6838836669921875, 0.71759033203125, 0.7512969970703125, 0.785003662109375, 0.8187103271484375, 0.8524169921875, 0.8861236572265625, 0.919830322265625, 0.9535369873046875, 0.98724365234375, 1.0209503173828125, 1.054656982421875, 1.0883636474609375, 1.1220703125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 5.0, 9.0, 12.0, 15.0, 27.0, 70.0, 178.0, 610.0, 3351.0, 185251.0, 852380.0, 5378.0, 832.0, 236.0, 96.0, 44.0, 15.0, 11.0, 4.0, 5.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.806640625, -0.7843017578125, -0.761962890625, -0.7396240234375, -0.71728515625, -0.6949462890625, -0.672607421875, -0.6502685546875, -0.6279296875, -0.6055908203125, -0.583251953125, -0.5609130859375, -0.53857421875, -0.5162353515625, -0.493896484375, -0.4715576171875, -0.44921875, -0.4268798828125, -0.404541015625, -0.3822021484375, -0.35986328125, -0.3375244140625, -0.315185546875, -0.2928466796875, -0.2705078125, -0.2481689453125, -0.225830078125, -0.2034912109375, -0.18115234375, -0.1588134765625, -0.136474609375, -0.1141357421875, -0.091796875, -0.0694580078125, -0.047119140625, -0.0247802734375, -0.00244140625, 0.0198974609375, 0.042236328125, 0.0645751953125, 0.0869140625, 0.1092529296875, 0.131591796875, 0.1539306640625, 0.17626953125, 0.1986083984375, 0.220947265625, 0.2432861328125, 0.265625, 0.2879638671875, 0.310302734375, 0.3326416015625, 0.35498046875, 0.3773193359375, 0.399658203125, 0.4219970703125, 0.4443359375, 0.4666748046875, 0.489013671875, 0.5113525390625, 0.53369140625, 0.5560302734375, 0.578369140625, 0.6007080078125, 0.623046875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 8.0, 14.0, 20.0, 17.0, 32.0, 36.0, 68.0, 79.0, 141.0, 154.0, 120.0, 80.0, 79.0, 49.0, 27.0, 16.0, 13.0, 15.0, 7.0, 6.0, 1.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-4.374980926513672e-05, -4.2613595724105835e-05, -4.147738218307495e-05, -4.034116864204407e-05, -3.9204955101013184e-05, -3.80687415599823e-05, -3.6932528018951416e-05, -3.579631447792053e-05, -3.466010093688965e-05, -3.3523887395858765e-05, -3.238767385482788e-05, -3.1251460313797e-05, -3.0115246772766113e-05, -2.897903323173523e-05, -2.7842819690704346e-05, -2.6706606149673462e-05, -2.5570392608642578e-05, -2.4434179067611694e-05, -2.329796552658081e-05, -2.2161751985549927e-05, -2.1025538444519043e-05, -1.988932490348816e-05, -1.8753111362457275e-05, -1.761689782142639e-05, -1.6480684280395508e-05, -1.5344470739364624e-05, -1.420825719833374e-05, -1.3072043657302856e-05, -1.1935830116271973e-05, -1.0799616575241089e-05, -9.663403034210205e-06, -8.527189493179321e-06, -7.3909759521484375e-06, -6.254762411117554e-06, -5.11854887008667e-06, -3.982335329055786e-06, -2.8461217880249023e-06, -1.7099082469940186e-06, -5.736947059631348e-07, 5.62518835067749e-07, 1.6987323760986328e-06, 2.8349459171295166e-06, 3.9711594581604e-06, 5.107372999191284e-06, 6.243586540222168e-06, 7.379800081253052e-06, 8.516013622283936e-06, 9.65222716331482e-06, 1.0788440704345703e-05, 1.1924654245376587e-05, 1.306086778640747e-05, 1.4197081327438354e-05, 1.5333294868469238e-05, 1.6469508409500122e-05, 1.7605721950531006e-05, 1.874193549156189e-05, 1.9878149032592773e-05, 2.1014362573623657e-05, 2.215057611465454e-05, 2.3286789655685425e-05, 2.442300319671631e-05, 2.5559216737747192e-05, 2.6695430278778076e-05, 2.783164381980896e-05, 2.8967857360839844e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 5.0, 3.0, 7.0, 13.0, 20.0, 40.0, 98.0, 176.0, 509.0, 1484.0, 11514.0, 945473.0, 84723.0, 3135.0, 840.0, 265.0, 121.0, 50.0, 30.0, 18.0, 9.0, 8.0, 8.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.49462890625, -0.47612762451171875, -0.4576263427734375, -0.43912506103515625, -0.420623779296875, -0.40212249755859375, -0.3836212158203125, -0.36511993408203125, -0.34661865234375, -0.32811737060546875, -0.3096160888671875, -0.29111480712890625, -0.272613525390625, -0.25411224365234375, -0.2356109619140625, -0.21710968017578125, -0.1986083984375, -0.18010711669921875, -0.1616058349609375, -0.14310455322265625, -0.124603271484375, -0.10610198974609375, -0.0876007080078125, -0.06909942626953125, -0.05059814453125, -0.03209686279296875, -0.0135955810546875, 0.00490570068359375, 0.023406982421875, 0.04190826416015625, 0.0604095458984375, 0.07891082763671875, 0.097412109375, 0.11591339111328125, 0.1344146728515625, 0.15291595458984375, 0.171417236328125, 0.18991851806640625, 0.2084197998046875, 0.22692108154296875, 0.24542236328125, 0.26392364501953125, 0.2824249267578125, 0.30092620849609375, 0.319427490234375, 0.33792877197265625, 0.3564300537109375, 0.37493133544921875, 0.3934326171875, 0.41193389892578125, 0.4304351806640625, 0.44893646240234375, 0.467437744140625, 0.48593902587890625, 0.5044403076171875, 0.5229415893554688, 0.54144287109375, 0.5599441528320312, 0.5784454345703125, 0.5969467163085938, 0.615447998046875, 0.6339492797851562, 0.6524505615234375, 0.6709518432617188, 0.689453125]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 8.0, 7.0, 11.0, 25.0, 28.0, 41.0, 63.0, 121.0, 239.0, 168.0, 114.0, 67.0, 42.0, 23.0, 9.0, 12.0, 6.0, 6.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1439208984375, -0.13940811157226562, -0.13489532470703125, -0.13038253784179688, -0.1258697509765625, -0.12135696411132812, -0.11684417724609375, -0.11233139038085938, -0.107818603515625, -0.10330581665039062, -0.09879302978515625, -0.09428024291992188, -0.0897674560546875, -0.08525466918945312, -0.08074188232421875, -0.07622909545898438, -0.07171630859375, -0.06720352172851562, -0.06269073486328125, -0.058177947998046875, -0.0536651611328125, -0.049152374267578125, -0.04463958740234375, -0.040126800537109375, -0.035614013671875, -0.031101226806640625, -0.02658843994140625, -0.022075653076171875, -0.0175628662109375, -0.013050079345703125, -0.00853729248046875, -0.004024505615234375, 0.00048828125, 0.005001068115234375, 0.00951385498046875, 0.014026641845703125, 0.0185394287109375, 0.023052215576171875, 0.02756500244140625, 0.032077789306640625, 0.036590576171875, 0.041103363037109375, 0.04561614990234375, 0.050128936767578125, 0.0546417236328125, 0.059154510498046875, 0.06366729736328125, 0.06818008422851562, 0.07269287109375, 0.07720565795898438, 0.08171844482421875, 0.08623123168945312, 0.0907440185546875, 0.09525680541992188, 0.09976959228515625, 0.10428237915039062, 0.108795166015625, 0.11330795288085938, 0.11782073974609375, 0.12233352661132812, 0.1268463134765625, 0.13135910034179688, 0.13587188720703125, 0.14038467407226562, 0.1448974609375]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 14.0, 19.0, 47.0, 94.0, 208.0, 302.0, 157.0, 90.0, 42.0, 17.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.331616997718811, -1.2243868112564087, -1.117156744003296, -1.0099265575408936, -0.9026963710784912, -0.7954662442207336, -0.6882361173629761, -0.5810059309005737, -0.47377580404281616, -0.3665456473827362, -0.25931549072265625, -0.15208536386489868, -0.044855207204818726, 0.06237494945526123, 0.1696050763130188, 0.27683526277542114, 0.3840653896331787, 0.49129554629325867, 0.5985257029533386, 0.7057558298110962, 0.8129860162734985, 0.9202161431312561, 1.0274462699890137, 1.134676456451416, 1.2419066429138184, 1.3491368293762207, 1.4563668966293335, 1.5635970830917358, 1.6708272695541382, 1.778057336807251, 1.8852875232696533, 1.9925177097320557, 2.099747896194458, 2.2069780826568604, 2.3142082691192627, 2.421438217163086, 2.5286684036254883, 2.6358985900878906, 2.743128776550293, 2.8503589630126953, 2.9575891494750977, 3.0648193359375, 3.1720495223999023, 3.2792797088623047, 3.386509656906128, 3.4937398433685303, 3.6009700298309326, 3.708200216293335, 3.815430164337158, 3.9226603507995605, 4.029890537261963, 4.137120723724365, 4.244350910186768, 4.35158109664917, 4.458810806274414, 4.566040992736816, 4.673271656036377, 4.780501842498779, 4.887732028961182, 4.994962215423584, 5.102192401885986, 5.209422588348389, 5.316652297973633, 5.423882484436035, 5.5311126708984375]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 4.0, 4.0, 13.0, 10.0, 12.0, 16.0, 18.0, 27.0, 28.0, 31.0, 26.0, 41.0, 33.0, 28.0, 40.0, 37.0, 43.0, 49.0, 47.0, 58.0, 43.0, 53.0, 37.0, 35.0, 39.0, 34.0, 28.0, 26.0, 21.0, 23.0, 16.0, 16.0, 14.0, 21.0, 7.0, 10.0, 7.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.8246935606002808, -1.7724653482437134, -1.720237135887146, -1.6680089235305786, -1.6157808303833008, -1.5635526180267334, -1.511324405670166, -1.4590961933135986, -1.4068679809570312, -1.3546397686004639, -1.3024115562438965, -1.250183343887329, -1.1979551315307617, -1.1457269191741943, -1.0934988260269165, -1.0412706136703491, -0.9890424013137817, -0.9368141889572144, -0.884585976600647, -0.8323578238487244, -0.780129611492157, -0.7279013991355896, -0.675673246383667, -0.6234450340270996, -0.5712168216705322, -0.5189886093139648, -0.46676042675971985, -0.41453224420547485, -0.36230403184890747, -0.3100758194923401, -0.2578476369380951, -0.2056194543838501, -0.15339124202728271, -0.10116304457187653, -0.04893484711647034, 0.003293350338935852, 0.05552154779434204, 0.10774976015090942, 0.15997794270515442, 0.21220612525939941, 0.2644343376159668, 0.3166625499725342, 0.3688907325267792, 0.42111891508102417, 0.47334712743759155, 0.5255753397941589, 0.5778034925460815, 0.6300317049026489, 0.6822599172592163, 0.7344881296157837, 0.7867163419723511, 0.8389444947242737, 0.8911727070808411, 0.9434009194374084, 0.995629072189331, 1.0478572845458984, 1.1000854969024658, 1.1523137092590332, 1.2045419216156006, 1.256770133972168, 1.3089983463287354, 1.3612265586853027, 1.4134546518325806, 1.465682864189148, 1.5179110765457153]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 2.0, 7.0, 3.0, 3.0, 5.0, 16.0, 15.0, 35.0, 50.0, 74.0, 114.0, 246.0, 461.0, 973.0, 2535.0, 8794.0, 67171.0, 2105327.0, 1924756.0, 67095.0, 11150.0, 3126.0, 1209.0, 508.0, 252.0, 147.0, 84.0, 46.0, 29.0, 15.0, 12.0, 11.0, 4.0, 4.0, 3.0, 2.0, 0.0, 3.0], "bins": [-1.8203125, -1.7789306640625, -1.737548828125, -1.6961669921875, -1.65478515625, -1.6134033203125, -1.572021484375, -1.5306396484375, -1.4892578125, -1.4478759765625, -1.406494140625, -1.3651123046875, -1.32373046875, -1.2823486328125, -1.240966796875, -1.1995849609375, -1.158203125, -1.1168212890625, -1.075439453125, -1.0340576171875, -0.99267578125, -0.9512939453125, -0.909912109375, -0.8685302734375, -0.8271484375, -0.7857666015625, -0.744384765625, -0.7030029296875, -0.66162109375, -0.6202392578125, -0.578857421875, -0.5374755859375, -0.49609375, -0.4547119140625, -0.413330078125, -0.3719482421875, -0.33056640625, -0.2891845703125, -0.247802734375, -0.2064208984375, -0.1650390625, -0.1236572265625, -0.082275390625, -0.0408935546875, 0.00048828125, 0.0418701171875, 0.083251953125, 0.1246337890625, 0.166015625, 0.2073974609375, 0.248779296875, 0.2901611328125, 0.33154296875, 0.3729248046875, 0.414306640625, 0.4556884765625, 0.4970703125, 0.5384521484375, 0.579833984375, 0.6212158203125, 0.66259765625, 0.7039794921875, 0.745361328125, 0.7867431640625, 0.828125]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 9.0, 10.0, 6.0, 15.0, 14.0, 30.0, 21.0, 40.0, 48.0, 59.0, 75.0, 72.0, 91.0, 84.0, 74.0, 69.0, 52.0, 52.0, 40.0, 37.0, 27.0, 18.0, 19.0, 14.0, 7.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.95654296875, -0.9320907592773438, -0.9076385498046875, -0.8831863403320312, -0.858734130859375, -0.8342819213867188, -0.8098297119140625, -0.7853775024414062, -0.76092529296875, -0.7364730834960938, -0.7120208740234375, -0.6875686645507812, -0.663116455078125, -0.6386642456054688, -0.6142120361328125, -0.5897598266601562, -0.5653076171875, -0.5408554077148438, -0.5164031982421875, -0.49195098876953125, -0.467498779296875, -0.44304656982421875, -0.4185943603515625, -0.39414215087890625, -0.36968994140625, -0.34523773193359375, -0.3207855224609375, -0.29633331298828125, -0.271881103515625, -0.24742889404296875, -0.2229766845703125, -0.19852447509765625, -0.174072265625, -0.14962005615234375, -0.1251678466796875, -0.10071563720703125, -0.076263427734375, -0.05181121826171875, -0.0273590087890625, -0.00290679931640625, 0.02154541015625, 0.04599761962890625, 0.0704498291015625, 0.09490203857421875, 0.119354248046875, 0.14380645751953125, 0.1682586669921875, 0.19271087646484375, 0.2171630859375, 0.24161529541015625, 0.2660675048828125, 0.29051971435546875, 0.314971923828125, 0.33942413330078125, 0.3638763427734375, 0.38832855224609375, 0.41278076171875, 0.43723297119140625, 0.4616851806640625, 0.48613739013671875, 0.510589599609375, 0.5350418090820312, 0.5594940185546875, 0.5839462280273438, 0.6083984375]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 9.0, 12.0, 24.0, 50.0, 119.0, 235.0, 606.0, 1920.0, 9953.0, 209326.0, 3907176.0, 57483.0, 5353.0, 1260.0, 391.0, 167.0, 78.0, 51.0, 14.0, 13.0, 10.0, 14.0, 7.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2890625, -2.227752685546875, -2.16644287109375, -2.105133056640625, -2.0438232421875, -1.982513427734375, -1.92120361328125, -1.859893798828125, -1.798583984375, -1.737274169921875, -1.67596435546875, -1.614654541015625, -1.5533447265625, -1.492034912109375, -1.43072509765625, -1.369415283203125, -1.30810546875, -1.246795654296875, -1.18548583984375, -1.124176025390625, -1.0628662109375, -1.001556396484375, -0.94024658203125, -0.878936767578125, -0.817626953125, -0.756317138671875, -0.69500732421875, -0.633697509765625, -0.5723876953125, -0.511077880859375, -0.44976806640625, -0.388458251953125, -0.3271484375, -0.265838623046875, -0.20452880859375, -0.143218994140625, -0.0819091796875, -0.020599365234375, 0.04071044921875, 0.102020263671875, 0.163330078125, 0.224639892578125, 0.28594970703125, 0.347259521484375, 0.4085693359375, 0.469879150390625, 0.53118896484375, 0.592498779296875, 0.65380859375, 0.715118408203125, 0.77642822265625, 0.837738037109375, 0.8990478515625, 0.960357666015625, 1.02166748046875, 1.082977294921875, 1.144287109375, 1.205596923828125, 1.26690673828125, 1.328216552734375, 1.3895263671875, 1.450836181640625, 1.51214599609375, 1.573455810546875, 1.634765625]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 10.0, 13.0, 13.0, 13.0, 21.0, 37.0, 49.0, 79.0, 159.0, 350.0, 741.0, 1054.0, 732.0, 386.0, 176.0, 101.0, 54.0, 31.0, 29.0, 10.0, 6.0, 5.0, 2.0, 6.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.37841796875, -0.3656272888183594, -0.35283660888671875, -0.3400459289550781, -0.3272552490234375, -0.3144645690917969, -0.30167388916015625, -0.2888832092285156, -0.276092529296875, -0.2633018493652344, -0.25051116943359375, -0.23772048950195312, -0.2249298095703125, -0.21213912963867188, -0.19934844970703125, -0.18655776977539062, -0.17376708984375, -0.16097640991210938, -0.14818572998046875, -0.13539505004882812, -0.1226043701171875, -0.10981369018554688, -0.09702301025390625, -0.08423233032226562, -0.071441650390625, -0.058650970458984375, -0.04586029052734375, -0.033069610595703125, -0.0202789306640625, -0.007488250732421875, 0.00530242919921875, 0.018093109130859375, 0.0308837890625, 0.043674468994140625, 0.05646514892578125, 0.06925582885742188, 0.0820465087890625, 0.09483718872070312, 0.10762786865234375, 0.12041854858398438, 0.133209228515625, 0.14599990844726562, 0.15879058837890625, 0.17158126831054688, 0.1843719482421875, 0.19716262817382812, 0.20995330810546875, 0.22274398803710938, 0.23553466796875, 0.24832534790039062, 0.26111602783203125, 0.2739067077636719, 0.2866973876953125, 0.2994880676269531, 0.31227874755859375, 0.3250694274902344, 0.337860107421875, 0.3506507873535156, 0.36344146728515625, 0.3762321472167969, 0.3890228271484375, 0.4018135070800781, 0.41460418701171875, 0.4273948669433594, 0.440185546875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 7.0, 6.0, 13.0, 14.0, 29.0, 44.0, 64.0, 87.0, 117.0, 132.0, 125.0, 121.0, 71.0, 65.0, 46.0, 27.0, 9.0, 10.0, 7.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9351988434791565, -0.8907696008682251, -0.8463403582572937, -0.8019111156463623, -0.7574818134307861, -0.7130526304244995, -0.6686233282089233, -0.6241940855979919, -0.5797648429870605, -0.5353356003761292, -0.49090635776519775, -0.44647708535194397, -0.4020478427410126, -0.3576186001300812, -0.3131893277168274, -0.268760085105896, -0.2243308424949646, -0.1799015998840332, -0.1354723423719406, -0.09104308485984802, -0.046613842248916626, -0.0021845996379852295, 0.042244672775268555, 0.08667391538619995, 0.13110315799713135, 0.17553240060806274, 0.21996165812015533, 0.2643909156322479, 0.3088201582431793, 0.3532494008541107, 0.3976786732673645, 0.4421079158782959, 0.4865370988845825, 0.5309663414955139, 0.5753955841064453, 0.6198248863220215, 0.6642540693283081, 0.7086833715438843, 0.7531126141548157, 0.7975418567657471, 0.8419710993766785, 0.8864003419876099, 0.9308295845985413, 0.9752588272094727, 1.0196881294250488, 1.0641173124313354, 1.1085466146469116, 1.1529757976531982, 1.1974050998687744, 1.2418344020843506, 1.2862635850906372, 1.3306928873062134, 1.3751220703125, 1.4195513725280762, 1.4639806747436523, 1.508409857749939, 1.5528390407562256, 1.5972683429718018, 1.6416975259780884, 1.6861268281936646, 1.7305560111999512, 1.7749853134155273, 1.8194146156311035, 1.8638437986373901, 1.9082731008529663]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 10.0, 11.0, 12.0, 15.0, 32.0, 27.0, 34.0, 44.0, 51.0, 67.0, 61.0, 77.0, 72.0, 64.0, 74.0, 52.0, 50.0, 38.0, 47.0, 36.0, 32.0, 21.0, 16.0, 18.0, 15.0, 7.0, 9.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9331230521202087, -0.9056692123413086, -0.8782153129577637, -0.8507614135742188, -0.8233075737953186, -0.7958537340164185, -0.7683998346328735, -0.7409459352493286, -0.7134920954704285, -0.6860382556915283, -0.6585843563079834, -0.6311304569244385, -0.6036766171455383, -0.5762227773666382, -0.5487688779830933, -0.5213149785995483, -0.4938611388206482, -0.46640726923942566, -0.4389533996582031, -0.4114995300769806, -0.38404566049575806, -0.3565917909145355, -0.329137921333313, -0.30168405175209045, -0.2742301821708679, -0.24677631258964539, -0.21932244300842285, -0.19186857342720032, -0.16441470384597778, -0.13696083426475525, -0.10950696468353271, -0.08205309510231018, -0.05459916591644287, -0.027145296335220337, 0.00030857324600219727, 0.02776244282722473, 0.055216312408447266, 0.0826701819896698, 0.11012405157089233, 0.13757792115211487, 0.1650317907333374, 0.19248566031455994, 0.21993952989578247, 0.247393399477005, 0.27484726905822754, 0.3023011386394501, 0.3297550082206726, 0.35720887780189514, 0.3846627473831177, 0.4121166169643402, 0.43957048654556274, 0.4670243561267853, 0.4944782257080078, 0.5219321250915527, 0.5493859648704529, 0.576839804649353, 0.604293704032898, 0.6317476034164429, 0.659201443195343, 0.6866552829742432, 0.7141091823577881, 0.741563081741333, 0.7690169215202332, 0.7964707612991333, 0.8239246606826782]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 4.0, 11.0, 12.0, 24.0, 54.0, 88.0, 283.0, 730.0, 2243.0, 7929.0, 132621.0, 876659.0, 21753.0, 4095.0, 1298.0, 447.0, 159.0, 65.0, 30.0, 16.0, 9.0, 5.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.57421875, -0.5539016723632812, -0.5335845947265625, -0.5132675170898438, -0.492950439453125, -0.47263336181640625, -0.4523162841796875, -0.43199920654296875, -0.41168212890625, -0.39136505126953125, -0.3710479736328125, -0.35073089599609375, -0.330413818359375, -0.31009674072265625, -0.2897796630859375, -0.26946258544921875, -0.2491455078125, -0.22882843017578125, -0.2085113525390625, -0.18819427490234375, -0.167877197265625, -0.14756011962890625, -0.1272430419921875, -0.10692596435546875, -0.08660888671875, -0.06629180908203125, -0.0459747314453125, -0.02565765380859375, -0.005340576171875, 0.01497650146484375, 0.0352935791015625, 0.05561065673828125, 0.075927734375, 0.09624481201171875, 0.1165618896484375, 0.13687896728515625, 0.157196044921875, 0.17751312255859375, 0.1978302001953125, 0.21814727783203125, 0.23846435546875, 0.25878143310546875, 0.2790985107421875, 0.29941558837890625, 0.319732666015625, 0.34004974365234375, 0.3603668212890625, 0.38068389892578125, 0.4010009765625, 0.42131805419921875, 0.4416351318359375, 0.46195220947265625, 0.482269287109375, 0.5025863647460938, 0.5229034423828125, 0.5432205200195312, 0.56353759765625, 0.5838546752929688, 0.6041717529296875, 0.6244888305664062, 0.644805908203125, 0.6651229858398438, 0.6854400634765625, 0.7057571411132812, 0.72607421875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 8.0, 20.0, 23.0, 28.0, 31.0, 45.0, 43.0, 77.0, 74.0, 87.0, 80.0, 92.0, 69.0, 66.0, 53.0, 46.0, 40.0, 24.0, 28.0, 18.0, 17.0, 12.0, 3.0, 1.0, 6.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.658203125, -0.6375656127929688, -0.6169281005859375, -0.5962905883789062, -0.575653076171875, -0.5550155639648438, -0.5343780517578125, -0.5137405395507812, -0.49310302734375, -0.47246551513671875, -0.4518280029296875, -0.43119049072265625, -0.410552978515625, -0.38991546630859375, -0.3692779541015625, -0.34864044189453125, -0.3280029296875, -0.30736541748046875, -0.2867279052734375, -0.26609039306640625, -0.245452880859375, -0.22481536865234375, -0.2041778564453125, -0.18354034423828125, -0.16290283203125, -0.14226531982421875, -0.1216278076171875, -0.10099029541015625, -0.080352783203125, -0.05971527099609375, -0.0390777587890625, -0.01844024658203125, 0.002197265625, 0.02283477783203125, 0.0434722900390625, 0.06410980224609375, 0.084747314453125, 0.10538482666015625, 0.1260223388671875, 0.14665985107421875, 0.16729736328125, 0.18793487548828125, 0.2085723876953125, 0.22920989990234375, 0.249847412109375, 0.27048492431640625, 0.2911224365234375, 0.31175994873046875, 0.3323974609375, 0.35303497314453125, 0.3736724853515625, 0.39430999755859375, 0.414947509765625, 0.43558502197265625, 0.4562225341796875, 0.47686004638671875, 0.49749755859375, 0.5181350708007812, 0.5387725830078125, 0.5594100952148438, 0.580047607421875, 0.6006851196289062, 0.6213226318359375, 0.6419601440429688, 0.66259765625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 7.0, 6.0, 5.0, 5.0, 5.0, 10.0, 17.0, 26.0, 25.0, 49.0, 74.0, 163.0, 283.0, 574.0, 1308.0, 2901.0, 7961.0, 41282.0, 644797.0, 318271.0, 20894.0, 5601.0, 2266.0, 990.0, 480.0, 241.0, 126.0, 75.0, 34.0, 14.0, 20.0, 13.0, 12.0, 5.0, 5.0, 1.0, 1.0, 3.0, 4.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.281982421875, -0.2722053527832031, -0.26242828369140625, -0.2526512145996094, -0.2428741455078125, -0.23309707641601562, -0.22332000732421875, -0.21354293823242188, -0.203765869140625, -0.19398880004882812, -0.18421173095703125, -0.17443466186523438, -0.1646575927734375, -0.15488052368164062, -0.14510345458984375, -0.13532638549804688, -0.12554931640625, -0.11577224731445312, -0.10599517822265625, -0.09621810913085938, -0.0864410400390625, -0.07666397094726562, -0.06688690185546875, -0.057109832763671875, -0.047332763671875, -0.037555694580078125, -0.02777862548828125, -0.018001556396484375, -0.0082244873046875, 0.001552581787109375, 0.01132965087890625, 0.021106719970703125, 0.0308837890625, 0.040660858154296875, 0.05043792724609375, 0.060214996337890625, 0.0699920654296875, 0.07976913452148438, 0.08954620361328125, 0.09932327270507812, 0.109100341796875, 0.11887741088867188, 0.12865447998046875, 0.13843154907226562, 0.1482086181640625, 0.15798568725585938, 0.16776275634765625, 0.17753982543945312, 0.18731689453125, 0.19709396362304688, 0.20687103271484375, 0.21664810180664062, 0.2264251708984375, 0.23620223999023438, 0.24597930908203125, 0.2557563781738281, 0.265533447265625, 0.2753105163574219, 0.28508758544921875, 0.2948646545410156, 0.3046417236328125, 0.3144187927246094, 0.32419586181640625, 0.3339729309082031, 0.34375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 4.0, 5.0, 7.0, 4.0, 4.0, 13.0, 7.0, 13.0, 16.0, 13.0, 24.0, 29.0, 34.0, 28.0, 38.0, 42.0, 38.0, 41.0, 39.0, 55.0, 51.0, 46.0, 46.0, 40.0, 45.0, 30.0, 36.0, 29.0, 31.0, 26.0, 24.0, 26.0, 7.0, 15.0, 20.0, 11.0, 14.0, 7.0, 6.0, 9.0, 5.0, 5.0, 13.0, 4.0, 3.0, 1.0, 2.0], "bins": [-0.896484375, -0.8729705810546875, -0.849456787109375, -0.8259429931640625, -0.80242919921875, -0.7789154052734375, -0.755401611328125, -0.7318878173828125, -0.7083740234375, -0.6848602294921875, -0.661346435546875, -0.6378326416015625, -0.61431884765625, -0.5908050537109375, -0.567291259765625, -0.5437774658203125, -0.520263671875, -0.4967498779296875, -0.473236083984375, -0.4497222900390625, -0.42620849609375, -0.4026947021484375, -0.379180908203125, -0.3556671142578125, -0.3321533203125, -0.3086395263671875, -0.285125732421875, -0.2616119384765625, -0.23809814453125, -0.2145843505859375, -0.191070556640625, -0.1675567626953125, -0.14404296875, -0.1205291748046875, -0.097015380859375, -0.0735015869140625, -0.04998779296875, -0.0264739990234375, -0.002960205078125, 0.0205535888671875, 0.0440673828125, 0.0675811767578125, 0.091094970703125, 0.1146087646484375, 0.13812255859375, 0.1616363525390625, 0.185150146484375, 0.2086639404296875, 0.232177734375, 0.2556915283203125, 0.279205322265625, 0.3027191162109375, 0.32623291015625, 0.3497467041015625, 0.373260498046875, 0.3967742919921875, 0.4202880859375, 0.4438018798828125, 0.467315673828125, 0.4908294677734375, 0.51434326171875, 0.5378570556640625, 0.561370849609375, 0.5848846435546875, 0.6083984375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 7.0, 10.0, 11.0, 11.0, 16.0, 28.0, 44.0, 54.0, 100.0, 208.0, 398.0, 762.0, 2008.0, 6392.0, 31390.0, 328585.0, 600005.0, 63378.0, 10351.0, 2778.0, 1004.0, 436.0, 240.0, 130.0, 71.0, 46.0, 33.0, 11.0, 6.0, 9.0, 6.0, 6.0, 3.0, 4.0, 1.0, 4.0, 6.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.081787109375, -0.07907581329345703, -0.07636451721191406, -0.0736532211303711, -0.07094192504882812, -0.06823062896728516, -0.06551933288574219, -0.06280803680419922, -0.06009674072265625, -0.05738544464111328, -0.05467414855957031, -0.051962852478027344, -0.049251556396484375, -0.046540260314941406, -0.04382896423339844, -0.04111766815185547, -0.0384063720703125, -0.03569507598876953, -0.03298377990722656, -0.030272483825683594, -0.027561187744140625, -0.024849891662597656, -0.022138595581054688, -0.01942729949951172, -0.01671600341796875, -0.014004707336425781, -0.011293411254882812, -0.008582115173339844, -0.005870819091796875, -0.0031595230102539062, -0.0004482269287109375, 0.0022630691528320312, 0.004974365234375, 0.007685661315917969, 0.010396957397460938, 0.013108253479003906, 0.015819549560546875, 0.018530845642089844, 0.021242141723632812, 0.02395343780517578, 0.02666473388671875, 0.02937602996826172, 0.03208732604980469, 0.034798622131347656, 0.037509918212890625, 0.040221214294433594, 0.04293251037597656, 0.04564380645751953, 0.0483551025390625, 0.05106639862060547, 0.05377769470214844, 0.056488990783691406, 0.059200286865234375, 0.061911582946777344, 0.06462287902832031, 0.06733417510986328, 0.07004547119140625, 0.07275676727294922, 0.07546806335449219, 0.07817935943603516, 0.08089065551757812, 0.0836019515991211, 0.08631324768066406, 0.08902454376220703, 0.09173583984375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 1.0, 0.0, 3.0, 1.0, 9.0, 5.0, 18.0, 21.0, 43.0, 49.0, 71.0, 97.0, 126.0, 135.0, 120.0, 110.0, 67.0, 45.0, 27.0, 21.0, 8.0, 8.0, 7.0, 3.0, 1.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6345252990722656e-05, -2.5218352675437927e-05, -2.4091452360153198e-05, -2.296455204486847e-05, -2.183765172958374e-05, -2.071075141429901e-05, -1.9583851099014282e-05, -1.8456950783729553e-05, -1.7330050468444824e-05, -1.6203150153160095e-05, -1.5076249837875366e-05, -1.3949349522590637e-05, -1.2822449207305908e-05, -1.169554889202118e-05, -1.056864857673645e-05, -9.441748261451721e-06, -8.314847946166992e-06, -7.187947630882263e-06, -6.061047315597534e-06, -4.934147000312805e-06, -3.807246685028076e-06, -2.680346369743347e-06, -1.5534460544586182e-06, -4.2654573917388916e-07, 7.003545761108398e-07, 1.8272548913955688e-06, 2.954155206680298e-06, 4.081055521965027e-06, 5.207955837249756e-06, 6.334856152534485e-06, 7.461756467819214e-06, 8.588656783103943e-06, 9.715557098388672e-06, 1.0842457413673401e-05, 1.196935772895813e-05, 1.3096258044242859e-05, 1.4223158359527588e-05, 1.5350058674812317e-05, 1.6476958990097046e-05, 1.7603859305381775e-05, 1.8730759620666504e-05, 1.9857659935951233e-05, 2.0984560251235962e-05, 2.211146056652069e-05, 2.323836088180542e-05, 2.436526119709015e-05, 2.5492161512374878e-05, 2.6619061827659607e-05, 2.7745962142944336e-05, 2.8872862458229065e-05, 2.9999762773513794e-05, 3.112666308879852e-05, 3.225356340408325e-05, 3.338046371936798e-05, 3.450736403465271e-05, 3.563426434993744e-05, 3.676116466522217e-05, 3.78880649805069e-05, 3.9014965295791626e-05, 4.0141865611076355e-05, 4.1268765926361084e-05, 4.239566624164581e-05, 4.352256655693054e-05, 4.464946687221527e-05, 4.57763671875e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 7.0, 2.0, 8.0, 19.0, 17.0, 24.0, 41.0, 58.0, 74.0, 150.0, 198.0, 379.0, 680.0, 1430.0, 3185.0, 7687.0, 21082.0, 66314.0, 231014.0, 434259.0, 195325.0, 56266.0, 17932.0, 6782.0, 2902.0, 1253.0, 632.0, 276.0, 210.0, 105.0, 64.0, 57.0, 33.0, 21.0, 9.0, 18.0, 10.0, 5.0, 5.0, 10.0, 3.0, 4.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05059814453125, -0.049037933349609375, -0.04747772216796875, -0.045917510986328125, -0.0443572998046875, -0.042797088623046875, -0.04123687744140625, -0.039676666259765625, -0.038116455078125, -0.036556243896484375, -0.03499603271484375, -0.033435821533203125, -0.0318756103515625, -0.030315399169921875, -0.02875518798828125, -0.027194976806640625, -0.025634765625, -0.024074554443359375, -0.02251434326171875, -0.020954132080078125, -0.0193939208984375, -0.017833709716796875, -0.01627349853515625, -0.014713287353515625, -0.013153076171875, -0.011592864990234375, -0.01003265380859375, -0.008472442626953125, -0.0069122314453125, -0.005352020263671875, -0.00379180908203125, -0.002231597900390625, -0.00067138671875, 0.000888824462890625, 0.00244903564453125, 0.004009246826171875, 0.0055694580078125, 0.007129669189453125, 0.00868988037109375, 0.010250091552734375, 0.011810302734375, 0.013370513916015625, 0.01493072509765625, 0.016490936279296875, 0.0180511474609375, 0.019611358642578125, 0.02117156982421875, 0.022731781005859375, 0.0242919921875, 0.025852203369140625, 0.02741241455078125, 0.028972625732421875, 0.0305328369140625, 0.032093048095703125, 0.03365325927734375, 0.035213470458984375, 0.036773681640625, 0.038333892822265625, 0.03989410400390625, 0.041454315185546875, 0.0430145263671875, 0.044574737548828125, 0.04613494873046875, 0.047695159912109375, 0.04925537109375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 4.0, 5.0, 9.0, 8.0, 8.0, 16.0, 10.0, 26.0, 35.0, 33.0, 41.0, 49.0, 40.0, 63.0, 73.0, 64.0, 70.0, 78.0, 69.0, 61.0, 51.0, 31.0, 33.0, 22.0, 22.0, 9.0, 15.0, 8.0, 9.0, 4.0, 5.0, 7.0, 3.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0139312744140625, -0.013493776321411133, -0.013056278228759766, -0.012618780136108398, -0.012181282043457031, -0.011743783950805664, -0.011306285858154297, -0.01086878776550293, -0.010431289672851562, -0.009993791580200195, -0.009556293487548828, -0.009118795394897461, -0.008681297302246094, -0.008243799209594727, -0.007806301116943359, -0.007368803024291992, -0.006931304931640625, -0.006493806838989258, -0.006056308746337891, -0.0056188106536865234, -0.005181312561035156, -0.004743814468383789, -0.004306316375732422, -0.0038688182830810547, -0.0034313201904296875, -0.0029938220977783203, -0.002556324005126953, -0.002118825912475586, -0.0016813278198242188, -0.0012438297271728516, -0.0008063316345214844, -0.0003688335418701172, 6.866455078125e-05, 0.0005061626434326172, 0.0009436607360839844, 0.0013811588287353516, 0.0018186569213867188, 0.002256155014038086, 0.002693653106689453, 0.0031311511993408203, 0.0035686492919921875, 0.004006147384643555, 0.004443645477294922, 0.004881143569946289, 0.005318641662597656, 0.0057561397552490234, 0.006193637847900391, 0.006631135940551758, 0.007068634033203125, 0.007506132125854492, 0.00794363021850586, 0.008381128311157227, 0.008818626403808594, 0.009256124496459961, 0.009693622589111328, 0.010131120681762695, 0.010568618774414062, 0.01100611686706543, 0.011443614959716797, 0.011881113052368164, 0.012318611145019531, 0.012756109237670898, 0.013193607330322266, 0.013631105422973633, 0.014068603515625]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 11.0, 6.0, 23.0, 39.0, 88.0, 117.0, 154.0, 185.0, 155.0, 89.0, 66.0, 25.0, 21.0, 10.0, 5.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5204527378082275, -0.4865703582763672, -0.45268794894218445, -0.4188055396080017, -0.38492316007614136, -0.351040780544281, -0.31715837121009827, -0.2832759618759155, -0.24939358234405518, -0.21551118791103363, -0.18162879347801208, -0.14774639904499054, -0.113864004611969, -0.07998161017894745, -0.0460992157459259, -0.012216821312904358, 0.021665573120117188, 0.05554796755313873, 0.08943036198616028, 0.12331275641918182, 0.15719515085220337, 0.19107754528522491, 0.22495993971824646, 0.2588423490524292, 0.29272472858428955, 0.3266071081161499, 0.36048951745033264, 0.3943719267845154, 0.42825430631637573, 0.4621366858482361, 0.4960190951824188, 0.5299015045166016, 0.5637840032577515, 0.5976663827896118, 0.6315487623214722, 0.6654312014579773, 0.6993135809898376, 0.733195960521698, 0.7670783996582031, 0.8009607791900635, 0.8348431587219238, 0.8687255382537842, 0.9026079177856445, 0.9364903569221497, 0.97037273645401, 1.0042551755905151, 1.0381375551223755, 1.0720199346542358, 1.1059023141860962, 1.1397846937179565, 1.173667073249817, 1.2075494527816772, 1.2414319515228271, 1.2753143310546875, 1.3091967105865479, 1.3430790901184082, 1.3769614696502686, 1.410843849182129, 1.4447262287139893, 1.4786086082458496, 1.51249098777771, 1.5463734865188599, 1.5802558660507202, 1.6141382455825806, 1.648020625114441]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 8.0, 9.0, 15.0, 14.0, 32.0, 36.0, 36.0, 50.0, 63.0, 57.0, 63.0, 79.0, 77.0, 73.0, 61.0, 54.0, 57.0, 43.0, 31.0, 40.0, 20.0, 21.0, 22.0, 11.0, 10.0, 6.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.515916645526886, -0.49793168902397156, -0.47994673252105713, -0.4619617760181427, -0.44397681951522827, -0.42599186301231384, -0.4080069065093994, -0.390021950006485, -0.37203699350357056, -0.35405203700065613, -0.3360670804977417, -0.31808212399482727, -0.30009716749191284, -0.2821122109889984, -0.264127254486084, -0.24614229798316956, -0.22815734148025513, -0.2101723849773407, -0.19218742847442627, -0.17420247197151184, -0.1562175154685974, -0.13823255896568298, -0.12024760246276855, -0.10226264595985413, -0.0842776894569397, -0.06629273295402527, -0.04830777645111084, -0.03032281994819641, -0.012337863445281982, 0.005647093057632446, 0.023632049560546875, 0.041617006063461304, 0.05960190296173096, 0.07758685946464539, 0.09557181596755981, 0.11355677247047424, 0.13154172897338867, 0.1495266854763031, 0.16751164197921753, 0.18549659848213196, 0.2034815549850464, 0.22146651148796082, 0.23945146799087524, 0.2574364244937897, 0.2754213809967041, 0.29340633749961853, 0.31139129400253296, 0.3293762505054474, 0.3473612070083618, 0.36534616351127625, 0.3833311200141907, 0.4013160765171051, 0.41930103302001953, 0.43728598952293396, 0.4552709460258484, 0.4732559025287628, 0.49124085903167725, 0.5092258453369141, 0.5272107720375061, 0.5451956987380981, 0.563180685043335, 0.5811656713485718, 0.5991505980491638, 0.6171355247497559, 0.6351205110549927]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 6.0, 8.0, 10.0, 22.0, 15.0, 28.0, 40.0, 74.0, 120.0, 182.0, 370.0, 646.0, 1491.0, 3583.0, 10767.0, 39770.0, 355269.0, 566928.0, 48818.0, 12875.0, 4143.0, 1686.0, 767.0, 360.0, 222.0, 122.0, 69.0, 58.0, 20.0, 17.0, 20.0, 8.0, 12.0, 6.0, 8.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64990234375, -0.6313705444335938, -0.6128387451171875, -0.5943069458007812, -0.575775146484375, -0.5572433471679688, -0.5387115478515625, -0.5201797485351562, -0.50164794921875, -0.48311614990234375, -0.4645843505859375, -0.44605255126953125, -0.427520751953125, -0.40898895263671875, -0.3904571533203125, -0.37192535400390625, -0.3533935546875, -0.33486175537109375, -0.3163299560546875, -0.29779815673828125, -0.279266357421875, -0.26073455810546875, -0.2422027587890625, -0.22367095947265625, -0.20513916015625, -0.18660736083984375, -0.1680755615234375, -0.14954376220703125, -0.131011962890625, -0.11248016357421875, -0.0939483642578125, -0.07541656494140625, -0.056884765625, -0.03835296630859375, -0.0198211669921875, -0.00128936767578125, 0.017242431640625, 0.03577423095703125, 0.0543060302734375, 0.07283782958984375, 0.09136962890625, 0.10990142822265625, 0.1284332275390625, 0.14696502685546875, 0.165496826171875, 0.18402862548828125, 0.2025604248046875, 0.22109222412109375, 0.2396240234375, 0.25815582275390625, 0.2766876220703125, 0.29521942138671875, 0.313751220703125, 0.33228302001953125, 0.3508148193359375, 0.36934661865234375, 0.38787841796875, 0.40641021728515625, 0.4249420166015625, 0.44347381591796875, 0.462005615234375, 0.48053741455078125, 0.4990692138671875, 0.5176010131835938, 0.5361328125]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 6.0, 2.0, 9.0, 12.0, 21.0, 34.0, 39.0, 49.0, 64.0, 79.0, 105.0, 96.0, 99.0, 74.0, 75.0, 59.0, 51.0, 46.0, 35.0, 25.0, 12.0, 7.0, 6.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6904296875, -1.64215087890625, -1.5938720703125, -1.54559326171875, -1.497314453125, -1.44903564453125, -1.4007568359375, -1.35247802734375, -1.30419921875, -1.25592041015625, -1.2076416015625, -1.15936279296875, -1.111083984375, -1.06280517578125, -1.0145263671875, -0.96624755859375, -0.91796875, -0.86968994140625, -0.8214111328125, -0.77313232421875, -0.724853515625, -0.67657470703125, -0.6282958984375, -0.58001708984375, -0.53173828125, -0.48345947265625, -0.4351806640625, -0.38690185546875, -0.338623046875, -0.29034423828125, -0.2420654296875, -0.19378662109375, -0.1455078125, -0.09722900390625, -0.0489501953125, -0.00067138671875, 0.047607421875, 0.09588623046875, 0.1441650390625, 0.19244384765625, 0.24072265625, 0.28900146484375, 0.3372802734375, 0.38555908203125, 0.433837890625, 0.48211669921875, 0.5303955078125, 0.57867431640625, 0.626953125, 0.67523193359375, 0.7235107421875, 0.77178955078125, 0.820068359375, 0.86834716796875, 0.9166259765625, 0.96490478515625, 1.01318359375, 1.06146240234375, 1.1097412109375, 1.15802001953125, 1.206298828125, 1.25457763671875, 1.3028564453125, 1.35113525390625, 1.3994140625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 0.0, 8.0, 1.0, 2.0, 4.0, 6.0, 5.0, 6.0, 7.0, 3.0, 10.0, 14.0, 21.0, 16.0, 27.0, 37.0, 56.0, 91.0, 138.0, 205.0, 367.0, 794.0, 3612.0, 57625.0, 952235.0, 29356.0, 2351.0, 629.0, 336.0, 184.0, 115.0, 69.0, 56.0, 40.0, 29.0, 23.0, 17.0, 8.0, 19.0, 7.0, 7.0, 4.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.189453125, -1.1475677490234375, -1.105682373046875, -1.0637969970703125, -1.02191162109375, -0.9800262451171875, -0.938140869140625, -0.8962554931640625, -0.8543701171875, -0.8124847412109375, -0.770599365234375, -0.7287139892578125, -0.68682861328125, -0.6449432373046875, -0.603057861328125, -0.5611724853515625, -0.519287109375, -0.4774017333984375, -0.435516357421875, -0.3936309814453125, -0.35174560546875, -0.3098602294921875, -0.267974853515625, -0.2260894775390625, -0.1842041015625, -0.1423187255859375, -0.100433349609375, -0.0585479736328125, -0.01666259765625, 0.0252227783203125, 0.067108154296875, 0.1089935302734375, 0.15087890625, 0.1927642822265625, 0.234649658203125, 0.2765350341796875, 0.31842041015625, 0.3603057861328125, 0.402191162109375, 0.4440765380859375, 0.4859619140625, 0.5278472900390625, 0.569732666015625, 0.6116180419921875, 0.65350341796875, 0.6953887939453125, 0.737274169921875, 0.7791595458984375, 0.821044921875, 0.8629302978515625, 0.904815673828125, 0.9467010498046875, 0.98858642578125, 1.0304718017578125, 1.072357177734375, 1.1142425537109375, 1.1561279296875, 1.1980133056640625, 1.239898681640625, 1.2817840576171875, 1.32366943359375, 1.3655548095703125, 1.407440185546875, 1.4493255615234375, 1.4912109375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 6.0, 10.0, 8.0, 7.0, 12.0, 13.0, 21.0, 20.0, 36.0, 29.0, 36.0, 40.0, 51.0, 58.0, 53.0, 55.0, 60.0, 64.0, 45.0, 48.0, 53.0, 44.0, 40.0, 28.0, 36.0, 26.0, 12.0, 15.0, 16.0, 12.0, 7.0, 7.0, 5.0, 5.0, 6.0, 1.0, 5.0, 1.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.197265625, -1.16064453125, -1.1240234375, -1.08740234375, -1.05078125, -1.01416015625, -0.9775390625, -0.94091796875, -0.904296875, -0.86767578125, -0.8310546875, -0.79443359375, -0.7578125, -0.72119140625, -0.6845703125, -0.64794921875, -0.611328125, -0.57470703125, -0.5380859375, -0.50146484375, -0.46484375, -0.42822265625, -0.3916015625, -0.35498046875, -0.318359375, -0.28173828125, -0.2451171875, -0.20849609375, -0.171875, -0.13525390625, -0.0986328125, -0.06201171875, -0.025390625, 0.01123046875, 0.0478515625, 0.08447265625, 0.12109375, 0.15771484375, 0.1943359375, 0.23095703125, 0.267578125, 0.30419921875, 0.3408203125, 0.37744140625, 0.4140625, 0.45068359375, 0.4873046875, 0.52392578125, 0.560546875, 0.59716796875, 0.6337890625, 0.67041015625, 0.70703125, 0.74365234375, 0.7802734375, 0.81689453125, 0.853515625, 0.89013671875, 0.9267578125, 0.96337890625, 1.0, 1.03662109375, 1.0732421875, 1.10986328125, 1.146484375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 7.0, 8.0, 27.0, 34.0, 53.0, 139.0, 216.0, 548.0, 1379.0, 5090.0, 80000.0, 934979.0, 21558.0, 2870.0, 916.0, 365.0, 168.0, 91.0, 37.0, 22.0, 11.0, 10.0, 7.0, 6.0, 2.0, 0.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38037109375, -0.36644744873046875, -0.3525238037109375, -0.33860015869140625, -0.324676513671875, -0.31075286865234375, -0.2968292236328125, -0.28290557861328125, -0.26898193359375, -0.25505828857421875, -0.2411346435546875, -0.22721099853515625, -0.213287353515625, -0.19936370849609375, -0.1854400634765625, -0.17151641845703125, -0.1575927734375, -0.14366912841796875, -0.1297454833984375, -0.11582183837890625, -0.101898193359375, -0.08797454833984375, -0.0740509033203125, -0.06012725830078125, -0.04620361328125, -0.03227996826171875, -0.0183563232421875, -0.00443267822265625, 0.009490966796875, 0.02341461181640625, 0.0373382568359375, 0.05126190185546875, 0.065185546875, 0.07910919189453125, 0.0930328369140625, 0.10695648193359375, 0.120880126953125, 0.13480377197265625, 0.1487274169921875, 0.16265106201171875, 0.17657470703125, 0.19049835205078125, 0.2044219970703125, 0.21834564208984375, 0.232269287109375, 0.24619293212890625, 0.2601165771484375, 0.27404022216796875, 0.2879638671875, 0.30188751220703125, 0.3158111572265625, 0.32973480224609375, 0.343658447265625, 0.35758209228515625, 0.3715057373046875, 0.38542938232421875, 0.39935302734375, 0.41327667236328125, 0.4272003173828125, 0.44112396240234375, 0.455047607421875, 0.46897125244140625, 0.4828948974609375, 0.49681854248046875, 0.5107421875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 13.0, 34.0, 68.0, 102.0, 338.0, 265.0, 88.0, 33.0, 17.0, 16.0, 10.0, 9.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.839897155761719e-05, -4.608370363712311e-05, -4.376843571662903e-05, -4.145316779613495e-05, -3.913789987564087e-05, -3.682263195514679e-05, -3.450736403465271e-05, -3.219209611415863e-05, -2.987682819366455e-05, -2.756156027317047e-05, -2.524629235267639e-05, -2.2931024432182312e-05, -2.0615756511688232e-05, -1.8300488591194153e-05, -1.5985220670700073e-05, -1.3669952750205994e-05, -1.1354684829711914e-05, -9.039416909217834e-06, -6.724148988723755e-06, -4.408881068229675e-06, -2.0936131477355957e-06, 2.2165477275848389e-07, 2.5369226932525635e-06, 4.852190613746643e-06, 7.167458534240723e-06, 9.482726454734802e-06, 1.1797994375228882e-05, 1.4113262295722961e-05, 1.642853021621704e-05, 1.874379813671112e-05, 2.10590660572052e-05, 2.337433397769928e-05, 2.568960189819336e-05, 2.800486981868744e-05, 3.032013773918152e-05, 3.26354056596756e-05, 3.495067358016968e-05, 3.726594150066376e-05, 3.958120942115784e-05, 4.1896477341651917e-05, 4.4211745262145996e-05, 4.6527013182640076e-05, 4.8842281103134155e-05, 5.1157549023628235e-05, 5.3472816944122314e-05, 5.5788084864616394e-05, 5.8103352785110474e-05, 6.041862070560455e-05, 6.273388862609863e-05, 6.504915654659271e-05, 6.736442446708679e-05, 6.967969238758087e-05, 7.199496030807495e-05, 7.431022822856903e-05, 7.662549614906311e-05, 7.894076406955719e-05, 8.125603199005127e-05, 8.357129991054535e-05, 8.588656783103943e-05, 8.820183575153351e-05, 9.051710367202759e-05, 9.283237159252167e-05, 9.514763951301575e-05, 9.746290743350983e-05, 9.97781753540039e-05]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 6.0, 11.0, 25.0, 40.0, 61.0, 122.0, 244.0, 555.0, 1517.0, 8542.0, 672777.0, 355141.0, 7085.0, 1434.0, 503.0, 226.0, 111.0, 50.0, 43.0, 16.0, 13.0, 13.0, 7.0, 1.0, 6.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6181640625, -0.6009750366210938, -0.5837860107421875, -0.5665969848632812, -0.549407958984375, -0.5322189331054688, -0.5150299072265625, -0.49784088134765625, -0.48065185546875, -0.46346282958984375, -0.4462738037109375, -0.42908477783203125, -0.411895751953125, -0.39470672607421875, -0.3775177001953125, -0.36032867431640625, -0.3431396484375, -0.32595062255859375, -0.3087615966796875, -0.29157257080078125, -0.274383544921875, -0.25719451904296875, -0.2400054931640625, -0.22281646728515625, -0.20562744140625, -0.18843841552734375, -0.1712493896484375, -0.15406036376953125, -0.136871337890625, -0.11968231201171875, -0.1024932861328125, -0.08530426025390625, -0.068115234375, -0.05092620849609375, -0.0337371826171875, -0.01654815673828125, 0.000640869140625, 0.01782989501953125, 0.0350189208984375, 0.05220794677734375, 0.06939697265625, 0.08658599853515625, 0.1037750244140625, 0.12096405029296875, 0.138153076171875, 0.15534210205078125, 0.1725311279296875, 0.18972015380859375, 0.2069091796875, 0.22409820556640625, 0.2412872314453125, 0.25847625732421875, 0.275665283203125, 0.29285430908203125, 0.3100433349609375, 0.32723236083984375, 0.34442138671875, 0.36161041259765625, 0.3787994384765625, 0.39598846435546875, 0.413177490234375, 0.43036651611328125, 0.4475555419921875, 0.46474456787109375, 0.48193359375]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 6.0, 8.0, 11.0, 12.0, 28.0, 33.0, 30.0, 62.0, 131.0, 241.0, 171.0, 86.0, 58.0, 41.0, 24.0, 19.0, 15.0, 10.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.12005615234375, -0.11640071868896484, -0.11274528503417969, -0.10908985137939453, -0.10543441772460938, -0.10177898406982422, -0.09812355041503906, -0.0944681167602539, -0.09081268310546875, -0.0871572494506836, -0.08350181579589844, -0.07984638214111328, -0.07619094848632812, -0.07253551483154297, -0.06888008117675781, -0.06522464752197266, -0.0615692138671875, -0.057913780212402344, -0.05425834655761719, -0.05060291290283203, -0.046947479248046875, -0.04329204559326172, -0.03963661193847656, -0.035981178283691406, -0.03232574462890625, -0.028670310974121094, -0.025014877319335938, -0.02135944366455078, -0.017704010009765625, -0.014048576354980469, -0.010393142700195312, -0.006737709045410156, -0.003082275390625, 0.0005731582641601562, 0.0042285919189453125, 0.007884025573730469, 0.011539459228515625, 0.015194892883300781, 0.018850326538085938, 0.022505760192871094, 0.02616119384765625, 0.029816627502441406, 0.03347206115722656, 0.03712749481201172, 0.040782928466796875, 0.04443836212158203, 0.04809379577636719, 0.051749229431152344, 0.0554046630859375, 0.059060096740722656, 0.06271553039550781, 0.06637096405029297, 0.07002639770507812, 0.07368183135986328, 0.07733726501464844, 0.0809926986694336, 0.08464813232421875, 0.0883035659790039, 0.09195899963378906, 0.09561443328857422, 0.09926986694335938, 0.10292530059814453, 0.10658073425292969, 0.11023616790771484, 0.1138916015625]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 9.0, 7.0, 20.0, 48.0, 77.0, 107.0, 155.0, 182.0, 146.0, 109.0, 71.0, 26.0, 18.0, 9.0, 7.0, 4.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.3378665447235107, -2.2680842876434326, -2.1983020305633545, -2.1285197734832764, -2.0587375164031982, -1.9889552593231201, -1.9191731214523315, -1.8493908643722534, -1.7796086072921753, -1.7098263502120972, -1.640044093132019, -1.570261836051941, -1.5004796981811523, -1.4306974411010742, -1.360915184020996, -1.291132926940918, -1.2213506698608398, -1.1515684127807617, -1.0817861557006836, -1.0120038986206055, -0.9422217011451721, -0.872439444065094, -0.8026572465896606, -0.7328749895095825, -0.6630927324295044, -0.5933104753494263, -0.5235282182693481, -0.4537460207939148, -0.38396376371383667, -0.31418150663375854, -0.2443992793560028, -0.17461705207824707, -0.10483503341674805, -0.035052791237831116, 0.034729450941085815, 0.10451169312000275, 0.17429393529891968, 0.2440761923789978, 0.31385841965675354, 0.3836406469345093, 0.4534229040145874, 0.5232051610946655, 0.5929874181747437, 0.662769615650177, 0.7325518727302551, 0.8023341298103333, 0.8721163272857666, 0.9418985843658447, 1.0116808414459229, 1.081463098526001, 1.151245355606079, 1.2210276126861572, 1.2908098697662354, 1.3605921268463135, 1.430374264717102, 1.5001565217971802, 1.5699387788772583, 1.6397210359573364, 1.7095032930374146, 1.7792855501174927, 1.8490676879882812, 1.9188499450683594, 1.9886322021484375, 2.0584144592285156, 2.1281967163085938]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 2.0, 7.0, 6.0, 1.0, 6.0, 8.0, 8.0, 14.0, 12.0, 9.0, 17.0, 21.0, 11.0, 24.0, 20.0, 20.0, 30.0, 23.0, 34.0, 33.0, 37.0, 48.0, 39.0, 40.0, 29.0, 33.0, 39.0, 35.0, 38.0, 38.0, 31.0, 33.0, 29.0, 22.0, 25.0, 27.0, 22.0, 21.0, 14.0, 14.0, 16.0, 13.0, 11.0, 6.0, 4.0, 7.0, 11.0, 4.0, 6.0, 3.0, 1.0, 6.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.3289316892623901, -1.2862021923065186, -1.2434725761413574, -1.2007430791854858, -1.1580134630203247, -1.1152839660644531, -1.072554349899292, -1.0298248529434204, -0.987095296382904, -0.9443657398223877, -0.9016361832618713, -0.858906626701355, -0.8161771297454834, -0.7734475135803223, -0.7307180166244507, -0.6879884600639343, -0.645258903503418, -0.6025293469429016, -0.5597997903823853, -0.5170702934265137, -0.4743407070636749, -0.43161115050315857, -0.3888816237449646, -0.34615206718444824, -0.3034225106239319, -0.2606929540634155, -0.21796341240406036, -0.1752338707447052, -0.13250431418418884, -0.08977475762367249, -0.047045230865478516, -0.004315674304962158, 0.03841400146484375, 0.08114355057477951, 0.12387309968471527, 0.16660264134407043, 0.2093321979045868, 0.25206175446510315, 0.2947912812232971, 0.3375208377838135, 0.38025039434432983, 0.4229799509048462, 0.46570950746536255, 0.5084390640258789, 0.5511685609817505, 0.5938981771469116, 0.6366276741027832, 0.6793572306632996, 0.7220867872238159, 0.7648163437843323, 0.8075459003448486, 0.8502753973007202, 0.8930050134658813, 0.9357345104217529, 0.9784640669822693, 1.0211936235427856, 1.0639231204986572, 1.1066526174545288, 1.14938223361969, 1.1921117305755615, 1.2348413467407227, 1.2775708436965942, 1.3203003406524658, 1.363029956817627, 1.405759572982788]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 5.0, 7.0, 8.0, 14.0, 9.0, 12.0, 21.0, 31.0, 34.0, 46.0, 46.0, 78.0, 150.0, 282.0, 611.0, 1880.0, 9566.0, 231104.0, 3881260.0, 60608.0, 5878.0, 1471.0, 483.0, 232.0, 120.0, 75.0, 58.0, 38.0, 34.0, 32.0, 21.0, 22.0, 8.0, 8.0, 6.0, 6.0, 8.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.908203125, -1.840911865234375, -1.77362060546875, -1.706329345703125, -1.6390380859375, -1.571746826171875, -1.50445556640625, -1.437164306640625, -1.369873046875, -1.302581787109375, -1.23529052734375, -1.167999267578125, -1.1007080078125, -1.033416748046875, -0.96612548828125, -0.898834228515625, -0.83154296875, -0.764251708984375, -0.69696044921875, -0.629669189453125, -0.5623779296875, -0.495086669921875, -0.42779541015625, -0.360504150390625, -0.293212890625, -0.225921630859375, -0.15863037109375, -0.091339111328125, -0.0240478515625, 0.043243408203125, 0.11053466796875, 0.177825927734375, 0.2451171875, 0.312408447265625, 0.37969970703125, 0.446990966796875, 0.5142822265625, 0.581573486328125, 0.64886474609375, 0.716156005859375, 0.783447265625, 0.850738525390625, 0.91802978515625, 0.985321044921875, 1.0526123046875, 1.119903564453125, 1.18719482421875, 1.254486083984375, 1.32177734375, 1.389068603515625, 1.45635986328125, 1.523651123046875, 1.5909423828125, 1.658233642578125, 1.72552490234375, 1.792816162109375, 1.860107421875, 1.927398681640625, 1.99468994140625, 2.061981201171875, 2.1292724609375, 2.196563720703125, 2.26385498046875, 2.331146240234375, 2.3984375]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 3.0, 4.0, 6.0, 11.0, 12.0, 15.0, 19.0, 21.0, 43.0, 48.0, 43.0, 64.0, 60.0, 67.0, 57.0, 82.0, 66.0, 67.0, 48.0, 55.0, 42.0, 30.0, 38.0, 23.0, 17.0, 13.0, 12.0, 13.0, 5.0, 3.0, 3.0, 6.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.435546875, -0.4159393310546875, -0.396331787109375, -0.3767242431640625, -0.35711669921875, -0.3375091552734375, -0.317901611328125, -0.2982940673828125, -0.2786865234375, -0.2590789794921875, -0.239471435546875, -0.2198638916015625, -0.20025634765625, -0.1806488037109375, -0.161041259765625, -0.1414337158203125, -0.121826171875, -0.1022186279296875, -0.082611083984375, -0.0630035400390625, -0.04339599609375, -0.0237884521484375, -0.004180908203125, 0.0154266357421875, 0.0350341796875, 0.0546417236328125, 0.074249267578125, 0.0938568115234375, 0.11346435546875, 0.1330718994140625, 0.152679443359375, 0.1722869873046875, 0.19189453125, 0.2115020751953125, 0.231109619140625, 0.2507171630859375, 0.27032470703125, 0.2899322509765625, 0.309539794921875, 0.3291473388671875, 0.3487548828125, 0.3683624267578125, 0.387969970703125, 0.4075775146484375, 0.42718505859375, 0.4467926025390625, 0.466400146484375, 0.4860076904296875, 0.505615234375, 0.5252227783203125, 0.544830322265625, 0.5644378662109375, 0.58404541015625, 0.6036529541015625, 0.623260498046875, 0.6428680419921875, 0.6624755859375, 0.6820831298828125, 0.701690673828125, 0.7212982177734375, 0.74090576171875, 0.7605133056640625, 0.780120849609375, 0.7997283935546875, 0.8193359375]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 14.0, 15.0, 27.0, 33.0, 71.0, 168.0, 370.0, 1044.0, 3779.0, 26110.0, 1513100.0, 2610685.0, 32485.0, 4428.0, 1186.0, 386.0, 189.0, 81.0, 53.0, 25.0, 10.0, 6.0, 3.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2978515625, -1.2438812255859375, -1.189910888671875, -1.1359405517578125, -1.08197021484375, -1.0279998779296875, -0.974029541015625, -0.9200592041015625, -0.8660888671875, -0.8121185302734375, -0.758148193359375, -0.7041778564453125, -0.65020751953125, -0.5962371826171875, -0.542266845703125, -0.4882965087890625, -0.434326171875, -0.3803558349609375, -0.326385498046875, -0.2724151611328125, -0.21844482421875, -0.1644744873046875, -0.110504150390625, -0.0565338134765625, -0.0025634765625, 0.0514068603515625, 0.105377197265625, 0.1593475341796875, 0.21331787109375, 0.2672882080078125, 0.321258544921875, 0.3752288818359375, 0.42919921875, 0.4831695556640625, 0.537139892578125, 0.5911102294921875, 0.64508056640625, 0.6990509033203125, 0.753021240234375, 0.8069915771484375, 0.8609619140625, 0.9149322509765625, 0.968902587890625, 1.0228729248046875, 1.07684326171875, 1.1308135986328125, 1.184783935546875, 1.2387542724609375, 1.292724609375, 1.3466949462890625, 1.400665283203125, 1.4546356201171875, 1.50860595703125, 1.5625762939453125, 1.616546630859375, 1.6705169677734375, 1.7244873046875, 1.7784576416015625, 1.832427978515625, 1.8863983154296875, 1.94036865234375, 1.9943389892578125, 2.048309326171875, 2.1022796630859375, 2.15625]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 10.0, 11.0, 15.0, 24.0, 29.0, 31.0, 48.0, 71.0, 97.0, 155.0, 237.0, 350.0, 593.0, 666.0, 550.0, 373.0, 259.0, 165.0, 96.0, 82.0, 46.0, 39.0, 27.0, 19.0, 20.0, 10.0, 8.0, 7.0, 4.0, 3.0, 3.0, 0.0, 3.0, 0.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.28125, -0.2733287811279297, -0.2654075622558594, -0.25748634338378906, -0.24956512451171875, -0.24164390563964844, -0.23372268676757812, -0.2258014678955078, -0.2178802490234375, -0.2099590301513672, -0.20203781127929688, -0.19411659240722656, -0.18619537353515625, -0.17827415466308594, -0.17035293579101562, -0.1624317169189453, -0.154510498046875, -0.1465892791748047, -0.13866806030273438, -0.13074684143066406, -0.12282562255859375, -0.11490440368652344, -0.10698318481445312, -0.09906196594238281, -0.0911407470703125, -0.08321952819824219, -0.07529830932617188, -0.06737709045410156, -0.05945587158203125, -0.05153465270996094, -0.043613433837890625, -0.03569221496582031, -0.02777099609375, -0.019849777221679688, -0.011928558349609375, -0.0040073394775390625, 0.00391387939453125, 0.011835098266601562, 0.019756317138671875, 0.027677536010742188, 0.0355987548828125, 0.04351997375488281, 0.051441192626953125, 0.05936241149902344, 0.06728363037109375, 0.07520484924316406, 0.08312606811523438, 0.09104728698730469, 0.098968505859375, 0.10688972473144531, 0.11481094360351562, 0.12273216247558594, 0.13065338134765625, 0.13857460021972656, 0.14649581909179688, 0.1544170379638672, 0.1623382568359375, 0.1702594757080078, 0.17818069458007812, 0.18610191345214844, 0.19402313232421875, 0.20194435119628906, 0.20986557006835938, 0.2177867889404297, 0.2257080078125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 10.0, 16.0, 14.0, 33.0, 66.0, 80.0, 118.0, 153.0, 141.0, 114.0, 101.0, 67.0, 33.0, 18.0, 17.0, 13.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7533283233642578, -1.7073798179626465, -1.6614311933517456, -1.6154826879501343, -1.569534182548523, -1.5235856771469116, -1.4776370525360107, -1.4316885471343994, -1.385740041732788, -1.3397915363311768, -1.2938429117202759, -1.2478944063186646, -1.2019459009170532, -1.155997395515442, -1.110048770904541, -1.0641002655029297, -1.0181517601013184, -0.9722031950950623, -0.9262546896934509, -0.8803061246871948, -0.8343576192855835, -0.7884090542793274, -0.7424604892730713, -0.69651198387146, -0.6505633592605591, -0.604614794254303, -0.5586662888526917, -0.5127177238464355, -0.4667692184448242, -0.4208206534385681, -0.3748721182346344, -0.3289235830307007, -0.28297507762908936, -0.23702654242515564, -0.19107800722122192, -0.14512945711612701, -0.0991809219121933, -0.05323238670825958, -0.007283836603164673, 0.03866469860076904, 0.08461323380470276, 0.13056176900863647, 0.1765103042125702, 0.2224588543176651, 0.26840740442276, 0.31435590982437134, 0.36030447483062744, 0.40625301003456116, 0.4522015452384949, 0.4981500804424286, 0.5440986156463623, 0.5900471806526184, 0.6359956860542297, 0.6819442510604858, 0.7278927564620972, 0.7738413214683533, 0.8197898864746094, 0.8657384514808655, 0.9116869568824768, 0.9576355218887329, 1.0035840272903442, 1.0495325326919556, 1.0954811573028564, 1.1414296627044678, 1.187378168106079]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 4.0, 5.0, 8.0, 6.0, 12.0, 13.0, 15.0, 23.0, 26.0, 34.0, 32.0, 26.0, 46.0, 29.0, 38.0, 47.0, 46.0, 50.0, 48.0, 56.0, 41.0, 39.0, 57.0, 43.0, 41.0, 30.0, 28.0, 22.0, 23.0, 19.0, 15.0, 24.0, 15.0, 10.0, 7.0, 9.0, 4.0, 6.0, 0.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6250004172325134, -0.6062010526657104, -0.5874016284942627, -0.5686022639274597, -0.5498028993606567, -0.531003475189209, -0.512204110622406, -0.493404746055603, -0.47460535168647766, -0.4558059573173523, -0.4370065927505493, -0.41820719838142395, -0.3994078040122986, -0.3806084394454956, -0.36180904507637024, -0.3430096507072449, -0.3242102861404419, -0.30541089177131653, -0.28661152720451355, -0.2678121328353882, -0.249012753367424, -0.23021337389945984, -0.21141397953033447, -0.1926146000623703, -0.17381522059440613, -0.15501584112644196, -0.13621646165847778, -0.11741706728935242, -0.09861768782138824, -0.07981830835342407, -0.0610189214348793, -0.042219534516334534, -0.023420095443725586, -0.004620712250471115, 0.014178670942783356, 0.03297805413603783, 0.0517774373292923, 0.07057681679725647, 0.08937620371580124, 0.10817559063434601, 0.12697497010231018, 0.14577434957027435, 0.16457372903823853, 0.1833731234073639, 0.20217250287532806, 0.22097188234329224, 0.2397712767124176, 0.25857067108154297, 0.27737003564834595, 0.2961694300174713, 0.3149687945842743, 0.33376818895339966, 0.35256755352020264, 0.371366947889328, 0.39016634225845337, 0.40896570682525635, 0.4277651011943817, 0.4465644955635071, 0.46536386013031006, 0.4841632544994354, 0.5029626488685608, 0.5217620134353638, 0.5405613780021667, 0.5593608021736145, 0.5781601667404175]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 4.0, 10.0, 11.0, 16.0, 35.0, 84.0, 252.0, 905.0, 3455.0, 15006.0, 309679.0, 692597.0, 20265.0, 4537.0, 1139.0, 312.0, 109.0, 48.0, 23.0, 17.0, 10.0, 5.0, 3.0, 5.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.796875, -0.7685089111328125, -0.740142822265625, -0.7117767333984375, -0.68341064453125, -0.6550445556640625, -0.626678466796875, -0.5983123779296875, -0.5699462890625, -0.5415802001953125, -0.513214111328125, -0.4848480224609375, -0.45648193359375, -0.4281158447265625, -0.399749755859375, -0.3713836669921875, -0.343017578125, -0.3146514892578125, -0.286285400390625, -0.2579193115234375, -0.22955322265625, -0.2011871337890625, -0.172821044921875, -0.1444549560546875, -0.1160888671875, -0.0877227783203125, -0.059356689453125, -0.0309906005859375, -0.00262451171875, 0.0257415771484375, 0.054107666015625, 0.0824737548828125, 0.11083984375, 0.1392059326171875, 0.167572021484375, 0.1959381103515625, 0.22430419921875, 0.2526702880859375, 0.281036376953125, 0.3094024658203125, 0.3377685546875, 0.3661346435546875, 0.394500732421875, 0.4228668212890625, 0.45123291015625, 0.4795989990234375, 0.507965087890625, 0.5363311767578125, 0.564697265625, 0.5930633544921875, 0.621429443359375, 0.6497955322265625, 0.67816162109375, 0.7065277099609375, 0.734893798828125, 0.7632598876953125, 0.7916259765625, 0.8199920654296875, 0.848358154296875, 0.8767242431640625, 0.90509033203125, 0.9334564208984375, 0.961822509765625, 0.9901885986328125, 1.0185546875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 7.0, 7.0, 6.0, 8.0, 12.0, 20.0, 17.0, 20.0, 20.0, 31.0, 30.0, 37.0, 34.0, 29.0, 42.0, 40.0, 50.0, 47.0, 55.0, 45.0, 51.0, 48.0, 41.0, 38.0, 42.0, 30.0, 29.0, 17.0, 26.0, 21.0, 19.0, 13.0, 16.0, 14.0, 10.0, 9.0, 5.0, 3.0, 4.0, 7.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.322509765625, -0.3100433349609375, -0.297576904296875, -0.2851104736328125, -0.27264404296875, -0.2601776123046875, -0.247711181640625, -0.2352447509765625, -0.2227783203125, -0.2103118896484375, -0.197845458984375, -0.1853790283203125, -0.17291259765625, -0.1604461669921875, -0.147979736328125, -0.1355133056640625, -0.123046875, -0.1105804443359375, -0.098114013671875, -0.0856475830078125, -0.07318115234375, -0.0607147216796875, -0.048248291015625, -0.0357818603515625, -0.0233154296875, -0.0108489990234375, 0.001617431640625, 0.0140838623046875, 0.02655029296875, 0.0390167236328125, 0.051483154296875, 0.0639495849609375, 0.076416015625, 0.0888824462890625, 0.101348876953125, 0.1138153076171875, 0.12628173828125, 0.1387481689453125, 0.151214599609375, 0.1636810302734375, 0.1761474609375, 0.1886138916015625, 0.201080322265625, 0.2135467529296875, 0.22601318359375, 0.2384796142578125, 0.250946044921875, 0.2634124755859375, 0.27587890625, 0.2883453369140625, 0.300811767578125, 0.3132781982421875, 0.32574462890625, 0.3382110595703125, 0.350677490234375, 0.3631439208984375, 0.3756103515625, 0.3880767822265625, 0.400543212890625, 0.4130096435546875, 0.42547607421875, 0.4379425048828125, 0.450408935546875, 0.4628753662109375, 0.475341796875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 5.0, 7.0, 9.0, 8.0, 15.0, 21.0, 22.0, 28.0, 57.0, 81.0, 102.0, 182.0, 324.0, 634.0, 1139.0, 2628.0, 6604.0, 24736.0, 243566.0, 683734.0, 64583.0, 12261.0, 4203.0, 1723.0, 822.0, 434.0, 223.0, 136.0, 90.0, 61.0, 28.0, 26.0, 15.0, 14.0, 7.0, 6.0, 4.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.3515625, -0.34066009521484375, -0.3297576904296875, -0.31885528564453125, -0.307952880859375, -0.29705047607421875, -0.2861480712890625, -0.27524566650390625, -0.26434326171875, -0.25344085693359375, -0.2425384521484375, -0.23163604736328125, -0.220733642578125, -0.20983123779296875, -0.1989288330078125, -0.18802642822265625, -0.1771240234375, -0.16622161865234375, -0.1553192138671875, -0.14441680908203125, -0.133514404296875, -0.12261199951171875, -0.1117095947265625, -0.10080718994140625, -0.08990478515625, -0.07900238037109375, -0.0680999755859375, -0.05719757080078125, -0.046295166015625, -0.03539276123046875, -0.0244903564453125, -0.01358795166015625, -0.002685546875, 0.00821685791015625, 0.0191192626953125, 0.03002166748046875, 0.040924072265625, 0.05182647705078125, 0.0627288818359375, 0.07363128662109375, 0.08453369140625, 0.09543609619140625, 0.1063385009765625, 0.11724090576171875, 0.128143310546875, 0.13904571533203125, 0.1499481201171875, 0.16085052490234375, 0.1717529296875, 0.18265533447265625, 0.1935577392578125, 0.20446014404296875, 0.215362548828125, 0.22626495361328125, 0.2371673583984375, 0.24806976318359375, 0.25897216796875, 0.26987457275390625, 0.2807769775390625, 0.29167938232421875, 0.302581787109375, 0.31348419189453125, 0.3243865966796875, 0.33528900146484375, 0.34619140625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 7.0, 5.0, 3.0, 6.0, 4.0, 10.0, 11.0, 11.0, 10.0, 10.0, 21.0, 28.0, 25.0, 41.0, 25.0, 31.0, 36.0, 44.0, 50.0, 41.0, 45.0, 46.0, 43.0, 53.0, 44.0, 48.0, 30.0, 34.0, 32.0, 40.0, 38.0, 25.0, 14.0, 15.0, 12.0, 11.0, 8.0, 15.0, 9.0, 6.0, 8.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.810546875, -0.7858963012695312, -0.7612457275390625, -0.7365951538085938, -0.711944580078125, -0.6872940063476562, -0.6626434326171875, -0.6379928588867188, -0.61334228515625, -0.5886917114257812, -0.5640411376953125, -0.5393905639648438, -0.514739990234375, -0.49008941650390625, -0.4654388427734375, -0.44078826904296875, -0.4161376953125, -0.39148712158203125, -0.3668365478515625, -0.34218597412109375, -0.317535400390625, -0.29288482666015625, -0.2682342529296875, -0.24358367919921875, -0.21893310546875, -0.19428253173828125, -0.1696319580078125, -0.14498138427734375, -0.120330810546875, -0.09568023681640625, -0.0710296630859375, -0.04637908935546875, -0.021728515625, 0.00292205810546875, 0.0275726318359375, 0.05222320556640625, 0.076873779296875, 0.10152435302734375, 0.1261749267578125, 0.15082550048828125, 0.17547607421875, 0.20012664794921875, 0.2247772216796875, 0.24942779541015625, 0.274078369140625, 0.29872894287109375, 0.3233795166015625, 0.34803009033203125, 0.3726806640625, 0.39733123779296875, 0.4219818115234375, 0.44663238525390625, 0.471282958984375, 0.49593353271484375, 0.5205841064453125, 0.5452346801757812, 0.56988525390625, 0.5945358276367188, 0.6191864013671875, 0.6438369750976562, 0.668487548828125, 0.6931381225585938, 0.7177886962890625, 0.7424392700195312, 0.76708984375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 6.0, 8.0, 8.0, 4.0, 12.0, 10.0, 29.0, 41.0, 52.0, 110.0, 179.0, 384.0, 796.0, 2176.0, 7415.0, 40576.0, 420014.0, 513937.0, 50168.0, 8479.0, 2408.0, 897.0, 366.0, 196.0, 105.0, 63.0, 32.0, 35.0, 18.0, 6.0, 10.0, 10.0, 4.0, 6.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.093017578125, -0.08970165252685547, -0.08638572692871094, -0.0830698013305664, -0.07975387573242188, -0.07643795013427734, -0.07312202453613281, -0.06980609893798828, -0.06649017333984375, -0.06317424774169922, -0.05985832214355469, -0.056542396545410156, -0.053226470947265625, -0.049910545349121094, -0.04659461975097656, -0.04327869415283203, -0.0399627685546875, -0.03664684295654297, -0.03333091735839844, -0.030014991760253906, -0.026699066162109375, -0.023383140563964844, -0.020067214965820312, -0.01675128936767578, -0.01343536376953125, -0.010119438171386719, -0.0068035125732421875, -0.0034875869750976562, -0.000171661376953125, 0.0031442642211914062, 0.0064601898193359375, 0.009776115417480469, 0.013092041015625, 0.01640796661376953, 0.019723892211914062, 0.023039817810058594, 0.026355743408203125, 0.029671669006347656, 0.03298759460449219, 0.03630352020263672, 0.03961944580078125, 0.04293537139892578, 0.04625129699707031, 0.049567222595214844, 0.052883148193359375, 0.056199073791503906, 0.05951499938964844, 0.06283092498779297, 0.0661468505859375, 0.06946277618408203, 0.07277870178222656, 0.0760946273803711, 0.07941055297851562, 0.08272647857666016, 0.08604240417480469, 0.08935832977294922, 0.09267425537109375, 0.09599018096923828, 0.09930610656738281, 0.10262203216552734, 0.10593795776367188, 0.1092538833618164, 0.11256980895996094, 0.11588573455810547, 0.11920166015625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 10.0, 10.0, 9.0, 11.0, 24.0, 21.0, 29.0, 37.0, 51.0, 66.0, 75.0, 61.0, 96.0, 87.0, 83.0, 61.0, 60.0, 52.0, 28.0, 34.0, 17.0, 14.0, 15.0, 13.0, 7.0, 7.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.3186206817626953e-05, -2.2288411855697632e-05, -2.139061689376831e-05, -2.049282193183899e-05, -1.9595026969909668e-05, -1.8697232007980347e-05, -1.7799437046051025e-05, -1.6901642084121704e-05, -1.6003847122192383e-05, -1.5106052160263062e-05, -1.420825719833374e-05, -1.3310462236404419e-05, -1.2412667274475098e-05, -1.1514872312545776e-05, -1.0617077350616455e-05, -9.719282388687134e-06, -8.821487426757812e-06, -7.923692464828491e-06, -7.02589750289917e-06, -6.128102540969849e-06, -5.230307579040527e-06, -4.332512617111206e-06, -3.4347176551818848e-06, -2.5369226932525635e-06, -1.6391277313232422e-06, -7.413327693939209e-07, 1.564621925354004e-07, 1.0542571544647217e-06, 1.952052116394043e-06, 2.8498470783233643e-06, 3.7476420402526855e-06, 4.645437002182007e-06, 5.543231964111328e-06, 6.441026926040649e-06, 7.338821887969971e-06, 8.236616849899292e-06, 9.134411811828613e-06, 1.0032206773757935e-05, 1.0930001735687256e-05, 1.1827796697616577e-05, 1.2725591659545898e-05, 1.362338662147522e-05, 1.4521181583404541e-05, 1.5418976545333862e-05, 1.6316771507263184e-05, 1.7214566469192505e-05, 1.8112361431121826e-05, 1.9010156393051147e-05, 1.990795135498047e-05, 2.080574631690979e-05, 2.170354127883911e-05, 2.2601336240768433e-05, 2.3499131202697754e-05, 2.4396926164627075e-05, 2.5294721126556396e-05, 2.6192516088485718e-05, 2.709031105041504e-05, 2.798810601234436e-05, 2.888590097427368e-05, 2.9783695936203003e-05, 3.0681490898132324e-05, 3.1579285860061646e-05, 3.247708082199097e-05, 3.337487578392029e-05, 3.427267074584961e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 8.0, 11.0, 11.0, 15.0, 16.0, 23.0, 39.0, 63.0, 109.0, 148.0, 257.0, 468.0, 1144.0, 2658.0, 7464.0, 22705.0, 83493.0, 355188.0, 426325.0, 105947.0, 27645.0, 8928.0, 3261.0, 1276.0, 619.0, 257.0, 173.0, 92.0, 75.0, 34.0, 28.0, 25.0, 13.0, 10.0, 10.0, 8.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0863037109375, -0.08391189575195312, -0.08152008056640625, -0.07912826538085938, -0.0767364501953125, -0.07434463500976562, -0.07195281982421875, -0.06956100463867188, -0.067169189453125, -0.06477737426757812, -0.06238555908203125, -0.059993743896484375, -0.0576019287109375, -0.055210113525390625, -0.05281829833984375, -0.050426483154296875, -0.04803466796875, -0.045642852783203125, -0.04325103759765625, -0.040859222412109375, -0.0384674072265625, -0.036075592041015625, -0.03368377685546875, -0.031291961669921875, -0.028900146484375, -0.026508331298828125, -0.02411651611328125, -0.021724700927734375, -0.0193328857421875, -0.016941070556640625, -0.01454925537109375, -0.012157440185546875, -0.009765625, -0.007373809814453125, -0.00498199462890625, -0.002590179443359375, -0.0001983642578125, 0.002193450927734375, 0.00458526611328125, 0.006977081298828125, 0.009368896484375, 0.011760711669921875, 0.01415252685546875, 0.016544342041015625, 0.0189361572265625, 0.021327972412109375, 0.02371978759765625, 0.026111602783203125, 0.02850341796875, 0.030895233154296875, 0.03328704833984375, 0.035678863525390625, 0.0380706787109375, 0.040462493896484375, 0.04285430908203125, 0.045246124267578125, 0.047637939453125, 0.050029754638671875, 0.05242156982421875, 0.054813385009765625, 0.0572052001953125, 0.059597015380859375, 0.06198883056640625, 0.06438064575195312, 0.0667724609375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 4.0, 4.0, 1.0, 4.0, 9.0, 6.0, 6.0, 10.0, 9.0, 15.0, 28.0, 29.0, 16.0, 36.0, 41.0, 55.0, 73.0, 61.0, 106.0, 106.0, 66.0, 67.0, 50.0, 44.0, 33.0, 25.0, 21.0, 15.0, 10.0, 14.0, 9.0, 8.0, 7.0, 5.0, 0.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0213775634765625, -0.020745038986206055, -0.02011251449584961, -0.019479990005493164, -0.01884746551513672, -0.018214941024780273, -0.017582416534423828, -0.016949892044067383, -0.016317367553710938, -0.015684843063354492, -0.015052318572998047, -0.014419794082641602, -0.013787269592285156, -0.013154745101928711, -0.012522220611572266, -0.01188969612121582, -0.011257171630859375, -0.01062464714050293, -0.009992122650146484, -0.009359598159790039, -0.008727073669433594, -0.008094549179077148, -0.007462024688720703, -0.006829500198364258, -0.0061969757080078125, -0.005564451217651367, -0.004931926727294922, -0.0042994022369384766, -0.0036668777465820312, -0.003034353256225586, -0.0024018287658691406, -0.0017693042755126953, -0.00113677978515625, -0.0005042552947998047, 0.00012826919555664062, 0.0007607936859130859, 0.0013933181762695312, 0.0020258426666259766, 0.002658367156982422, 0.003290891647338867, 0.0039234161376953125, 0.004555940628051758, 0.005188465118408203, 0.0058209896087646484, 0.006453514099121094, 0.007086038589477539, 0.007718563079833984, 0.00835108757019043, 0.008983612060546875, 0.00961613655090332, 0.010248661041259766, 0.010881185531616211, 0.011513710021972656, 0.012146234512329102, 0.012778759002685547, 0.013411283493041992, 0.014043807983398438, 0.014676332473754883, 0.015308856964111328, 0.015941381454467773, 0.01657390594482422, 0.017206430435180664, 0.01783895492553711, 0.018471479415893555, 0.01910400390625]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 4.0, 10.0, 9.0, 17.0, 20.0, 50.0, 51.0, 86.0, 116.0, 132.0, 133.0, 117.0, 89.0, 60.0, 49.0, 14.0, 20.0, 12.0, 8.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5594156384468079, -0.5328251719474792, -0.5062346458435059, -0.47964417934417725, -0.45305368304252625, -0.42646318674087524, -0.39987272024154663, -0.37328222393989563, -0.34669172763824463, -0.32010123133659363, -0.2935107350349426, -0.266920268535614, -0.240329772233963, -0.213739275932312, -0.1871487945318222, -0.1605583131313324, -0.1339678168296814, -0.10737732797861099, -0.08078683912754059, -0.054196350276470184, -0.02760586142539978, -0.0010153651237487793, 0.025575116276741028, 0.052165597677230835, 0.07875609397888184, 0.10534658282995224, 0.13193707168102264, 0.15852755308151245, 0.18511804938316345, 0.21170854568481445, 0.23829902708530426, 0.26488950848579407, 0.2914799451828003, 0.3180704414844513, 0.3446609377861023, 0.3712514042854309, 0.3978419005870819, 0.4244323968887329, 0.4510228633880615, 0.4776133596897125, 0.5042038559913635, 0.5307943224906921, 0.5573848485946655, 0.5839753150939941, 0.6105657815933228, 0.6371563076972961, 0.6637467741966248, 0.6903373003005981, 0.7169277667999268, 0.7435182332992554, 0.7701087594032288, 0.7966992259025574, 0.8232897520065308, 0.8498802185058594, 0.876470685005188, 0.9030611515045166, 0.92965167760849, 0.9562421441078186, 0.982832670211792, 1.0094231367111206, 1.0360136032104492, 1.0626041889190674, 1.089194655418396, 1.1157851219177246, 1.1423755884170532]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 9.0, 13.0, 9.0, 14.0, 11.0, 25.0, 28.0, 22.0, 31.0, 48.0, 30.0, 38.0, 46.0, 47.0, 59.0, 40.0, 44.0, 50.0, 57.0, 45.0, 46.0, 39.0, 38.0, 34.0, 25.0, 25.0, 19.0, 24.0, 14.0, 22.0, 5.0, 13.0, 5.0, 7.0, 5.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39754223823547363, -0.38491347432136536, -0.3722847104072571, -0.3596559464931488, -0.3470271825790405, -0.33439841866493225, -0.321769654750824, -0.3091408908367157, -0.2965121269226074, -0.28388336300849915, -0.27125459909439087, -0.2586258351802826, -0.24599707126617432, -0.23336830735206604, -0.22073954343795776, -0.2081107795238495, -0.19548200070858002, -0.18285323679447174, -0.17022447288036346, -0.1575957089662552, -0.1449669450521469, -0.13233816623687744, -0.11970940977334976, -0.10708064585924149, -0.09445188194513321, -0.08182311803102493, -0.06919435411691666, -0.05656558647751808, -0.043936822563409805, -0.03130805492401123, -0.018679291009902954, -0.006050527095794678, 0.006578236818313599, 0.019207000732421875, 0.03183576464653015, 0.044464532285928726, 0.057093296200037, 0.06972206383943558, 0.08235082775354385, 0.09497959166765213, 0.1076083555817604, 0.12023711949586868, 0.13286589086055756, 0.14549465477466583, 0.1581234186887741, 0.17075218260288239, 0.18338094651699066, 0.19600971043109894, 0.20863847434520721, 0.2212672382593155, 0.23389600217342377, 0.24652476608753204, 0.2591535449028015, 0.2717823088169098, 0.28441107273101807, 0.29703983664512634, 0.3096686005592346, 0.3222973644733429, 0.33492612838745117, 0.34755489230155945, 0.3601836562156677, 0.372812420129776, 0.3854411840438843, 0.39806994795799255, 0.41069871187210083]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 7.0, 13.0, 19.0, 39.0, 65.0, 106.0, 182.0, 381.0, 773.0, 1806.0, 5436.0, 21677.0, 159332.0, 738950.0, 96958.0, 15534.0, 4324.0, 1605.0, 673.0, 312.0, 160.0, 71.0, 53.0, 39.0, 19.0, 7.0, 10.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6806640625, -0.6575088500976562, -0.6343536376953125, -0.6111984252929688, -0.588043212890625, -0.5648880004882812, -0.5417327880859375, -0.5185775756835938, -0.49542236328125, -0.47226715087890625, -0.4491119384765625, -0.42595672607421875, -0.402801513671875, -0.37964630126953125, -0.3564910888671875, -0.33333587646484375, -0.3101806640625, -0.28702545166015625, -0.2638702392578125, -0.24071502685546875, -0.217559814453125, -0.19440460205078125, -0.1712493896484375, -0.14809417724609375, -0.12493896484375, -0.10178375244140625, -0.0786285400390625, -0.05547332763671875, -0.032318115234375, -0.00916290283203125, 0.0139923095703125, 0.03714752197265625, 0.060302734375, 0.08345794677734375, 0.1066131591796875, 0.12976837158203125, 0.152923583984375, 0.17607879638671875, 0.1992340087890625, 0.22238922119140625, 0.24554443359375, 0.26869964599609375, 0.2918548583984375, 0.31501007080078125, 0.338165283203125, 0.36132049560546875, 0.3844757080078125, 0.40763092041015625, 0.4307861328125, 0.45394134521484375, 0.4770965576171875, 0.5002517700195312, 0.523406982421875, 0.5465621948242188, 0.5697174072265625, 0.5928726196289062, 0.61602783203125, 0.6391830444335938, 0.6623382568359375, 0.6854934692382812, 0.708648681640625, 0.7318038940429688, 0.7549591064453125, 0.7781143188476562, 0.80126953125]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 1.0, 6.0, 7.0, 9.0, 18.0, 22.0, 19.0, 42.0, 35.0, 42.0, 49.0, 68.0, 71.0, 77.0, 81.0, 77.0, 50.0, 82.0, 50.0, 40.0, 43.0, 32.0, 19.0, 19.0, 15.0, 12.0, 13.0, 9.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.39453125, -1.3599853515625, -1.325439453125, -1.2908935546875, -1.25634765625, -1.2218017578125, -1.187255859375, -1.1527099609375, -1.1181640625, -1.0836181640625, -1.049072265625, -1.0145263671875, -0.97998046875, -0.9454345703125, -0.910888671875, -0.8763427734375, -0.841796875, -0.8072509765625, -0.772705078125, -0.7381591796875, -0.70361328125, -0.6690673828125, -0.634521484375, -0.5999755859375, -0.5654296875, -0.5308837890625, -0.496337890625, -0.4617919921875, -0.42724609375, -0.3927001953125, -0.358154296875, -0.3236083984375, -0.2890625, -0.2545166015625, -0.219970703125, -0.1854248046875, -0.15087890625, -0.1163330078125, -0.081787109375, -0.0472412109375, -0.0126953125, 0.0218505859375, 0.056396484375, 0.0909423828125, 0.12548828125, 0.1600341796875, 0.194580078125, 0.2291259765625, 0.263671875, 0.2982177734375, 0.332763671875, 0.3673095703125, 0.40185546875, 0.4364013671875, 0.470947265625, 0.5054931640625, 0.5400390625, 0.5745849609375, 0.609130859375, 0.6436767578125, 0.67822265625, 0.7127685546875, 0.747314453125, 0.7818603515625, 0.81640625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 2.0, 5.0, 5.0, 7.0, 6.0, 13.0, 11.0, 10.0, 11.0, 21.0, 28.0, 34.0, 40.0, 60.0, 88.0, 106.0, 191.0, 364.0, 1182.0, 7726.0, 315901.0, 708132.0, 12024.0, 1462.0, 451.0, 208.0, 136.0, 70.0, 62.0, 34.0, 29.0, 23.0, 32.0, 6.0, 12.0, 12.0, 8.0, 11.0, 8.0, 2.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-1.4736328125, -1.4290924072265625, -1.384552001953125, -1.3400115966796875, -1.29547119140625, -1.2509307861328125, -1.206390380859375, -1.1618499755859375, -1.1173095703125, -1.0727691650390625, -1.028228759765625, -0.9836883544921875, -0.93914794921875, -0.8946075439453125, -0.850067138671875, -0.8055267333984375, -0.760986328125, -0.7164459228515625, -0.671905517578125, -0.6273651123046875, -0.58282470703125, -0.5382843017578125, -0.493743896484375, -0.4492034912109375, -0.4046630859375, -0.3601226806640625, -0.315582275390625, -0.2710418701171875, -0.22650146484375, -0.1819610595703125, -0.137420654296875, -0.0928802490234375, -0.04833984375, -0.0037994384765625, 0.040740966796875, 0.0852813720703125, 0.12982177734375, 0.1743621826171875, 0.218902587890625, 0.2634429931640625, 0.3079833984375, 0.3525238037109375, 0.397064208984375, 0.4416046142578125, 0.48614501953125, 0.5306854248046875, 0.575225830078125, 0.6197662353515625, 0.664306640625, 0.7088470458984375, 0.753387451171875, 0.7979278564453125, 0.84246826171875, 0.8870086669921875, 0.931549072265625, 0.9760894775390625, 1.0206298828125, 1.0651702880859375, 1.109710693359375, 1.1542510986328125, 1.19879150390625, 1.2433319091796875, 1.287872314453125, 1.3324127197265625, 1.376953125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 5.0, 7.0, 6.0, 5.0, 3.0, 5.0, 7.0, 10.0, 13.0, 18.0, 22.0, 25.0, 32.0, 25.0, 37.0, 29.0, 37.0, 42.0, 49.0, 33.0, 49.0, 35.0, 55.0, 45.0, 36.0, 44.0, 51.0, 38.0, 35.0, 28.0, 23.0, 24.0, 18.0, 16.0, 9.0, 15.0, 16.0, 7.0, 10.0, 7.0, 16.0, 4.0, 1.0, 7.0, 2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.81982421875, -0.79364013671875, -0.7674560546875, -0.74127197265625, -0.715087890625, -0.68890380859375, -0.6627197265625, -0.63653564453125, -0.6103515625, -0.58416748046875, -0.5579833984375, -0.53179931640625, -0.505615234375, -0.47943115234375, -0.4532470703125, -0.42706298828125, -0.40087890625, -0.37469482421875, -0.3485107421875, -0.32232666015625, -0.296142578125, -0.26995849609375, -0.2437744140625, -0.21759033203125, -0.19140625, -0.16522216796875, -0.1390380859375, -0.11285400390625, -0.086669921875, -0.06048583984375, -0.0343017578125, -0.00811767578125, 0.01806640625, 0.04425048828125, 0.0704345703125, 0.09661865234375, 0.122802734375, 0.14898681640625, 0.1751708984375, 0.20135498046875, 0.2275390625, 0.25372314453125, 0.2799072265625, 0.30609130859375, 0.332275390625, 0.35845947265625, 0.3846435546875, 0.41082763671875, 0.43701171875, 0.46319580078125, 0.4893798828125, 0.51556396484375, 0.541748046875, 0.56793212890625, 0.5941162109375, 0.62030029296875, 0.646484375, 0.67266845703125, 0.6988525390625, 0.72503662109375, 0.751220703125, 0.77740478515625, 0.8035888671875, 0.82977294921875, 0.85595703125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 5.0, 3.0, 5.0, 5.0, 5.0, 12.0, 18.0, 22.0, 29.0, 81.0, 156.0, 316.0, 1023.0, 5595.0, 99131.0, 882490.0, 54159.0, 3977.0, 875.0, 311.0, 147.0, 71.0, 42.0, 33.0, 9.0, 16.0, 4.0, 3.0, 3.0, 6.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.446533203125, -0.4349098205566406, -0.42328643798828125, -0.4116630554199219, -0.4000396728515625, -0.3884162902832031, -0.37679290771484375, -0.3651695251464844, -0.353546142578125, -0.3419227600097656, -0.33029937744140625, -0.3186759948730469, -0.3070526123046875, -0.2954292297363281, -0.28380584716796875, -0.2721824645996094, -0.26055908203125, -0.24893569946289062, -0.23731231689453125, -0.22568893432617188, -0.2140655517578125, -0.20244216918945312, -0.19081878662109375, -0.17919540405273438, -0.167572021484375, -0.15594863891601562, -0.14432525634765625, -0.13270187377929688, -0.1210784912109375, -0.10945510864257812, -0.09783172607421875, -0.08620834350585938, -0.0745849609375, -0.06296157836914062, -0.05133819580078125, -0.039714813232421875, -0.0280914306640625, -0.016468048095703125, -0.00484466552734375, 0.006778717041015625, 0.018402099609375, 0.030025482177734375, 0.04164886474609375, 0.053272247314453125, 0.0648956298828125, 0.07651901245117188, 0.08814239501953125, 0.09976577758789062, 0.11138916015625, 0.12301254272460938, 0.13463592529296875, 0.14625930786132812, 0.1578826904296875, 0.16950607299804688, 0.18112945556640625, 0.19275283813476562, 0.204376220703125, 0.21599960327148438, 0.22762298583984375, 0.23924636840820312, 0.2508697509765625, 0.2624931335449219, 0.27411651611328125, 0.2857398986816406, 0.29736328125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 0.0, 7.0, 7.0, 7.0, 10.0, 26.0, 27.0, 50.0, 58.0, 73.0, 119.0, 185.0, 137.0, 85.0, 68.0, 55.0, 35.0, 18.0, 18.0, 11.0, 6.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4332275390625e-05, -3.287382423877716e-05, -3.141537308692932e-05, -2.9956921935081482e-05, -2.8498470783233643e-05, -2.7040019631385803e-05, -2.5581568479537964e-05, -2.4123117327690125e-05, -2.2664666175842285e-05, -2.1206215023994446e-05, -1.9747763872146606e-05, -1.8289312720298767e-05, -1.6830861568450928e-05, -1.537241041660309e-05, -1.3913959264755249e-05, -1.245550811290741e-05, -1.099705696105957e-05, -9.538605809211731e-06, -8.080154657363892e-06, -6.621703505516052e-06, -5.163252353668213e-06, -3.7048012018203735e-06, -2.246350049972534e-06, -7.878988981246948e-07, 6.705522537231445e-07, 2.129003405570984e-06, 3.5874545574188232e-06, 5.045905709266663e-06, 6.504356861114502e-06, 7.962808012962341e-06, 9.42125916481018e-06, 1.087971031665802e-05, 1.233816146850586e-05, 1.3796612620353699e-05, 1.5255063772201538e-05, 1.6713514924049377e-05, 1.8171966075897217e-05, 1.9630417227745056e-05, 2.1088868379592896e-05, 2.2547319531440735e-05, 2.4005770683288574e-05, 2.5464221835136414e-05, 2.6922672986984253e-05, 2.8381124138832092e-05, 2.983957529067993e-05, 3.129802644252777e-05, 3.275647759437561e-05, 3.421492874622345e-05, 3.567337989807129e-05, 3.713183104991913e-05, 3.859028220176697e-05, 4.004873335361481e-05, 4.1507184505462646e-05, 4.2965635657310486e-05, 4.4424086809158325e-05, 4.5882537961006165e-05, 4.7340989112854004e-05, 4.879944026470184e-05, 5.025789141654968e-05, 5.171634256839752e-05, 5.317479372024536e-05, 5.46332448720932e-05, 5.609169602394104e-05, 5.755014717578888e-05, 5.900859832763672e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 9.0, 6.0, 6.0, 10.0, 13.0, 26.0, 38.0, 59.0, 88.0, 114.0, 194.0, 294.0, 537.0, 881.0, 1629.0, 3675.0, 11291.0, 63831.0, 543557.0, 362766.0, 44045.0, 8917.0, 3101.0, 1456.0, 775.0, 454.0, 281.0, 165.0, 97.0, 80.0, 37.0, 31.0, 28.0, 16.0, 16.0, 11.0, 9.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.246337890625, -0.2390727996826172, -0.23180770874023438, -0.22454261779785156, -0.21727752685546875, -0.21001243591308594, -0.20274734497070312, -0.1954822540283203, -0.1882171630859375, -0.1809520721435547, -0.17368698120117188, -0.16642189025878906, -0.15915679931640625, -0.15189170837402344, -0.14462661743164062, -0.1373615264892578, -0.130096435546875, -0.12283134460449219, -0.11556625366210938, -0.10830116271972656, -0.10103607177734375, -0.09377098083496094, -0.08650588989257812, -0.07924079895019531, -0.0719757080078125, -0.06471061706542969, -0.057445526123046875, -0.05018043518066406, -0.04291534423828125, -0.03565025329589844, -0.028385162353515625, -0.021120071411132812, -0.01385498046875, -0.0065898895263671875, 0.000675201416015625, 0.007940292358398438, 0.01520538330078125, 0.022470474243164062, 0.029735565185546875, 0.03700065612792969, 0.0442657470703125, 0.05153083801269531, 0.058795928955078125, 0.06606101989746094, 0.07332611083984375, 0.08059120178222656, 0.08785629272460938, 0.09512138366699219, 0.102386474609375, 0.10965156555175781, 0.11691665649414062, 0.12418174743652344, 0.13144683837890625, 0.13871192932128906, 0.14597702026367188, 0.1532421112060547, 0.1605072021484375, 0.1677722930908203, 0.17503738403320312, 0.18230247497558594, 0.18956756591796875, 0.19683265686035156, 0.20409774780273438, 0.2113628387451172, 0.2186279296875]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 2.0, 7.0, 4.0, 5.0, 10.0, 7.0, 17.0, 23.0, 28.0, 22.0, 30.0, 26.0, 44.0, 36.0, 47.0, 64.0, 66.0, 82.0, 84.0, 58.0, 37.0, 60.0, 38.0, 33.0, 31.0, 24.0, 24.0, 22.0, 12.0, 13.0, 9.0, 9.0, 10.0, 5.0, 4.0, 2.0, 4.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05426025390625, -0.05242919921875, -0.05059814453125, -0.04876708984375, -0.04693603515625, -0.04510498046875, -0.04327392578125, -0.04144287109375, -0.03961181640625, -0.03778076171875, -0.03594970703125, -0.03411865234375, -0.03228759765625, -0.03045654296875, -0.02862548828125, -0.02679443359375, -0.02496337890625, -0.02313232421875, -0.02130126953125, -0.01947021484375, -0.01763916015625, -0.01580810546875, -0.01397705078125, -0.01214599609375, -0.01031494140625, -0.00848388671875, -0.00665283203125, -0.00482177734375, -0.00299072265625, -0.00115966796875, 0.00067138671875, 0.00250244140625, 0.00433349609375, 0.00616455078125, 0.00799560546875, 0.00982666015625, 0.01165771484375, 0.01348876953125, 0.01531982421875, 0.01715087890625, 0.01898193359375, 0.02081298828125, 0.02264404296875, 0.02447509765625, 0.02630615234375, 0.02813720703125, 0.02996826171875, 0.03179931640625, 0.03363037109375, 0.03546142578125, 0.03729248046875, 0.03912353515625, 0.04095458984375, 0.04278564453125, 0.04461669921875, 0.04644775390625, 0.04827880859375, 0.05010986328125, 0.05194091796875, 0.05377197265625, 0.05560302734375, 0.05743408203125, 0.05926513671875, 0.06109619140625, 0.06292724609375]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 7.0, 8.0, 8.0, 18.0, 27.0, 44.0, 56.0, 57.0, 72.0, 101.0, 116.0, 102.0, 92.0, 71.0, 56.0, 46.0, 40.0, 20.0, 18.0, 13.0, 12.0, 4.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8707438707351685, -0.8307117223739624, -0.7906795740127563, -0.7506474256515503, -0.7106152772903442, -0.6705831289291382, -0.6305510401725769, -0.5905188918113708, -0.5504867434501648, -0.5104545950889587, -0.4704224467277527, -0.430390328168869, -0.39035817980766296, -0.3503260314464569, -0.31029391288757324, -0.2702617645263672, -0.23022961616516113, -0.19019746780395508, -0.15016533434391022, -0.11013319343328476, -0.0701010525226593, -0.030068904161453247, 0.009963229298591614, 0.049995362758636475, 0.09002751111984253, 0.13005965948104858, 0.17009179294109344, 0.2101239264011383, 0.25015607476234436, 0.2901882231235504, 0.3302203416824341, 0.37025249004364014, 0.41028475761413574, 0.4503169059753418, 0.49034905433654785, 0.5303812026977539, 0.57041335105896, 0.610445499420166, 0.6504775881767273, 0.6905097365379333, 0.7305418848991394, 0.7705740332603455, 0.8106061816215515, 0.8506383299827576, 0.8906704187393188, 0.9307025671005249, 0.970734715461731, 1.010766863822937, 1.050799012184143, 1.0908311605453491, 1.1308633089065552, 1.1708954572677612, 1.2109276056289673, 1.2509597539901733, 1.2909919023513794, 1.331023931503296, 1.371056079864502, 1.411088228225708, 1.451120376586914, 1.4911525249481201, 1.5311846733093262, 1.5712168216705322, 1.6112489700317383, 1.6512811183929443, 1.6913132667541504]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 4.0, 8.0, 10.0, 7.0, 8.0, 10.0, 8.0, 21.0, 23.0, 19.0, 24.0, 18.0, 33.0, 23.0, 32.0, 31.0, 32.0, 49.0, 30.0, 33.0, 35.0, 42.0, 32.0, 53.0, 27.0, 45.0, 31.0, 29.0, 29.0, 27.0, 29.0, 26.0, 20.0, 27.0, 22.0, 13.0, 18.0, 11.0, 10.0, 8.0, 12.0, 8.0, 8.0, 3.0, 9.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.230108380317688, -1.19182550907135, -1.1535425186157227, -1.1152596473693848, -1.0769767761230469, -1.038693904876709, -1.000411033630371, -0.9621280431747437, -0.9238451719284058, -0.8855623006820679, -0.8472793698310852, -0.8089964389801025, -0.7707135677337646, -0.7324306964874268, -0.6941477656364441, -0.6558648347854614, -0.6175819635391235, -0.5792990922927856, -0.541016161441803, -0.5027332305908203, -0.4644503593444824, -0.42616745829582214, -0.38788455724716187, -0.3496016561985016, -0.3113187551498413, -0.27303585410118103, -0.23475295305252075, -0.19647005200386047, -0.1581871509552002, -0.11990424990653992, -0.08162134885787964, -0.04333844780921936, -0.005055665969848633, 0.033227235078811646, 0.07151013612747192, 0.1097930371761322, 0.14807593822479248, 0.18635883927345276, 0.22464174032211304, 0.2629246413707733, 0.3012075424194336, 0.33949044346809387, 0.37777334451675415, 0.41605624556541443, 0.4543391466140747, 0.492622047662735, 0.5309049487113953, 0.5691878795623779, 0.6074707508087158, 0.6457536220550537, 0.6840365529060364, 0.722319483757019, 0.7606023550033569, 0.7988852262496948, 0.8371681571006775, 0.8754510879516602, 0.913733959197998, 0.9520168304443359, 0.9902997612953186, 1.0285826921463013, 1.0668655633926392, 1.105148434638977, 1.1434314250946045, 1.1817142963409424, 1.2199971675872803]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 6.0, 7.0, 14.0, 21.0, 49.0, 74.0, 179.0, 334.0, 713.0, 1794.0, 5257.0, 21644.0, 235762.0, 3598250.0, 297679.0, 23542.0, 5732.0, 1841.0, 734.0, 324.0, 158.0, 82.0, 49.0, 19.0, 13.0, 9.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92236328125, -0.8814315795898438, -0.8404998779296875, -0.7995681762695312, -0.758636474609375, -0.7177047729492188, -0.6767730712890625, -0.6358413696289062, -0.59490966796875, -0.5539779663085938, -0.5130462646484375, -0.47211456298828125, -0.431182861328125, -0.39025115966796875, -0.3493194580078125, -0.30838775634765625, -0.2674560546875, -0.22652435302734375, -0.1855926513671875, -0.14466094970703125, -0.103729248046875, -0.06279754638671875, -0.0218658447265625, 0.01906585693359375, 0.05999755859375, 0.10092926025390625, 0.1418609619140625, 0.18279266357421875, 0.223724365234375, 0.26465606689453125, 0.3055877685546875, 0.34651947021484375, 0.387451171875, 0.42838287353515625, 0.4693145751953125, 0.5102462768554688, 0.551177978515625, 0.5921096801757812, 0.6330413818359375, 0.6739730834960938, 0.71490478515625, 0.7558364868164062, 0.7967681884765625, 0.8376998901367188, 0.878631591796875, 0.9195632934570312, 0.9604949951171875, 1.0014266967773438, 1.0423583984375, 1.0832901000976562, 1.1242218017578125, 1.1651535034179688, 1.206085205078125, 1.2470169067382812, 1.2879486083984375, 1.3288803100585938, 1.36981201171875, 1.4107437133789062, 1.4516754150390625, 1.4926071166992188, 1.533538818359375, 1.5744705200195312, 1.6154022216796875, 1.6563339233398438, 1.697265625]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 4.0, 10.0, 13.0, 12.0, 14.0, 16.0, 22.0, 30.0, 17.0, 35.0, 44.0, 43.0, 46.0, 44.0, 47.0, 54.0, 48.0, 46.0, 43.0, 57.0, 51.0, 46.0, 40.0, 35.0, 24.0, 24.0, 32.0, 19.0, 12.0, 11.0, 12.0, 16.0, 7.0, 7.0, 4.0, 7.0, 5.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.369873046875, -0.356689453125, -0.343505859375, -0.330322265625, -0.317138671875, -0.303955078125, -0.290771484375, -0.277587890625, -0.264404296875, -0.251220703125, -0.238037109375, -0.224853515625, -0.211669921875, -0.198486328125, -0.185302734375, -0.172119140625, -0.158935546875, -0.145751953125, -0.132568359375, -0.119384765625, -0.106201171875, -0.093017578125, -0.079833984375, -0.066650390625, -0.053466796875, -0.040283203125, -0.027099609375, -0.013916015625, -0.000732421875, 0.012451171875, 0.025634765625, 0.038818359375, 0.052001953125, 0.065185546875, 0.078369140625, 0.091552734375, 0.104736328125, 0.117919921875, 0.131103515625, 0.144287109375, 0.157470703125, 0.170654296875, 0.183837890625, 0.197021484375, 0.210205078125, 0.223388671875, 0.236572265625, 0.249755859375, 0.262939453125, 0.276123046875, 0.289306640625, 0.302490234375, 0.315673828125, 0.328857421875, 0.342041015625, 0.355224609375, 0.368408203125, 0.381591796875, 0.394775390625, 0.407958984375, 0.421142578125, 0.434326171875, 0.447509765625, 0.460693359375, 0.473876953125]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 6.0, 5.0, 11.0, 27.0, 25.0, 63.0, 111.0, 281.0, 758.0, 2911.0, 19390.0, 545229.0, 3558226.0, 59296.0, 5924.0, 1246.0, 422.0, 166.0, 67.0, 45.0, 17.0, 16.0, 8.0, 3.0, 6.0, 0.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.99609375, -1.9438629150390625, -1.891632080078125, -1.8394012451171875, -1.78717041015625, -1.7349395751953125, -1.682708740234375, -1.6304779052734375, -1.5782470703125, -1.5260162353515625, -1.473785400390625, -1.4215545654296875, -1.36932373046875, -1.3170928955078125, -1.264862060546875, -1.2126312255859375, -1.160400390625, -1.1081695556640625, -1.055938720703125, -1.0037078857421875, -0.95147705078125, -0.8992462158203125, -0.847015380859375, -0.7947845458984375, -0.7425537109375, -0.6903228759765625, -0.638092041015625, -0.5858612060546875, -0.53363037109375, -0.4813995361328125, -0.429168701171875, -0.3769378662109375, -0.32470703125, -0.2724761962890625, -0.220245361328125, -0.1680145263671875, -0.11578369140625, -0.0635528564453125, -0.011322021484375, 0.0409088134765625, 0.0931396484375, 0.1453704833984375, 0.197601318359375, 0.2498321533203125, 0.30206298828125, 0.3542938232421875, 0.406524658203125, 0.4587554931640625, 0.510986328125, 0.5632171630859375, 0.615447998046875, 0.6676788330078125, 0.71990966796875, 0.7721405029296875, 0.824371337890625, 0.8766021728515625, 0.9288330078125, 0.9810638427734375, 1.033294677734375, 1.0855255126953125, 1.13775634765625, 1.1899871826171875, 1.242218017578125, 1.2944488525390625, 1.3466796875]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 9.0, 2.0, 14.0, 13.0, 9.0, 19.0, 23.0, 28.0, 43.0, 70.0, 98.0, 133.0, 180.0, 265.0, 411.0, 470.0, 548.0, 494.0, 357.0, 240.0, 179.0, 113.0, 66.0, 67.0, 62.0, 22.0, 20.0, 15.0, 27.0, 16.0, 10.0, 15.0, 4.0, 7.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.216064453125, -0.20918655395507812, -0.20230865478515625, -0.19543075561523438, -0.1885528564453125, -0.18167495727539062, -0.17479705810546875, -0.16791915893554688, -0.161041259765625, -0.15416336059570312, -0.14728546142578125, -0.14040756225585938, -0.1335296630859375, -0.12665176391601562, -0.11977386474609375, -0.11289596557617188, -0.10601806640625, -0.09914016723632812, -0.09226226806640625, -0.08538436889648438, -0.0785064697265625, -0.07162857055664062, -0.06475067138671875, -0.057872772216796875, -0.050994873046875, -0.044116973876953125, -0.03723907470703125, -0.030361175537109375, -0.0234832763671875, -0.016605377197265625, -0.00972747802734375, -0.002849578857421875, 0.0040283203125, 0.010906219482421875, 0.01778411865234375, 0.024662017822265625, 0.0315399169921875, 0.038417816162109375, 0.04529571533203125, 0.052173614501953125, 0.059051513671875, 0.06592941284179688, 0.07280731201171875, 0.07968521118164062, 0.0865631103515625, 0.09344100952148438, 0.10031890869140625, 0.10719680786132812, 0.11407470703125, 0.12095260620117188, 0.12783050537109375, 0.13470840454101562, 0.1415863037109375, 0.14846420288085938, 0.15534210205078125, 0.16222000122070312, 0.169097900390625, 0.17597579956054688, 0.18285369873046875, 0.18973159790039062, 0.1966094970703125, 0.20348739624023438, 0.21036529541015625, 0.21724319458007812, 0.22412109375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 0.0, 5.0, 2.0, 10.0, 11.0, 6.0, 15.0, 22.0, 22.0, 28.0, 32.0, 47.0, 37.0, 68.0, 76.0, 67.0, 77.0, 62.0, 75.0, 59.0, 52.0, 48.0, 42.0, 39.0, 28.0, 14.0, 11.0, 14.0, 17.0, 8.0, 9.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9504632949829102, -0.927029013633728, -0.9035947322845459, -0.8801605105400085, -0.8567262291908264, -0.8332919478416443, -0.8098576664924622, -0.7864234447479248, -0.7629891633987427, -0.7395548820495605, -0.7161206007003784, -0.6926863789558411, -0.6692520976066589, -0.6458178162574768, -0.6223835349082947, -0.5989493131637573, -0.5755150318145752, -0.5520807504653931, -0.5286464691162109, -0.5052122473716736, -0.48177796602249146, -0.4583436846733093, -0.4349094033241272, -0.41147515177726746, -0.38804084062576294, -0.3646065592765808, -0.34117230772972107, -0.31773802638053894, -0.2943037748336792, -0.27086949348449707, -0.24743522703647614, -0.2240009605884552, -0.20056670904159546, -0.17713244259357452, -0.1536981761455536, -0.13026389479637146, -0.10682963579893112, -0.08339536935091019, -0.059961095452308655, -0.03652682900428772, -0.013092562556266785, 0.0103417057543993, 0.033775974065065384, 0.05721024423837662, 0.08064451068639755, 0.10407877713441849, 0.12751305103302002, 0.15094731748104095, 0.1743815839290619, 0.19781585037708282, 0.22125011682510376, 0.2446843981742859, 0.26811864972114563, 0.29155293107032776, 0.3149871826171875, 0.33842146396636963, 0.36185574531555176, 0.3852900266647339, 0.40872427821159363, 0.43215855956077576, 0.4555928111076355, 0.4790270924568176, 0.5024613738059998, 0.5258955955505371, 0.5493298768997192]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 4.0, 5.0, 10.0, 11.0, 11.0, 18.0, 14.0, 13.0, 18.0, 17.0, 17.0, 29.0, 26.0, 37.0, 26.0, 43.0, 41.0, 42.0, 43.0, 47.0, 44.0, 42.0, 33.0, 30.0, 29.0, 50.0, 35.0, 23.0, 30.0, 34.0, 27.0, 27.0, 16.0, 18.0, 11.0, 17.0, 12.0, 10.0, 10.0, 2.0, 6.0, 6.0, 6.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43962934613227844, -0.4244328439235687, -0.409236341714859, -0.3940398693084717, -0.37884336709976196, -0.36364686489105225, -0.34845036268234253, -0.3332538604736328, -0.3180573582649231, -0.3028608560562134, -0.28766435384750366, -0.27246785163879395, -0.2572713792324066, -0.2420748770236969, -0.22687837481498718, -0.21168187260627747, -0.19648540019989014, -0.18128889799118042, -0.1660924106836319, -0.15089590847492218, -0.13569942116737366, -0.12050291895866394, -0.10530641674995422, -0.0901099219918251, -0.07491342723369598, -0.059716932475566864, -0.044520433992147446, -0.029323935508728027, -0.014127440750598907, 0.0010690540075302124, 0.01626555621623993, 0.03146205097436905, 0.04665857553482056, 0.061855070292949677, 0.0770515650510788, 0.09224806725978851, 0.10744456201791763, 0.12264105677604675, 0.13783755898475647, 0.1530340611934662, 0.1682305485010147, 0.18342705070972443, 0.19862353801727295, 0.21382004022598267, 0.22901654243469238, 0.2442130297422409, 0.2594095468521118, 0.27460601925849915, 0.28980252146720886, 0.3049990236759186, 0.3201955258846283, 0.3353919982910156, 0.35058850049972534, 0.36578500270843506, 0.3809815049171448, 0.3961780071258545, 0.4113745093345642, 0.4265710115432739, 0.44176751375198364, 0.45696401596069336, 0.4721604883670807, 0.4873569905757904, 0.5025534629821777, 0.5177499651908875, 0.5329464673995972]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 8.0, 8.0, 9.0, 10.0, 31.0, 37.0, 48.0, 88.0, 149.0, 242.0, 399.0, 613.0, 1046.0, 1774.0, 3084.0, 6112.0, 14678.0, 47386.0, 289736.0, 550295.0, 92140.0, 22239.0, 8702.0, 4144.0, 2247.0, 1269.0, 782.0, 487.0, 281.0, 191.0, 118.0, 78.0, 35.0, 27.0, 30.0, 13.0, 10.0, 5.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.35400390625, -0.34449005126953125, -0.3349761962890625, -0.32546234130859375, -0.315948486328125, -0.30643463134765625, -0.2969207763671875, -0.28740692138671875, -0.27789306640625, -0.26837921142578125, -0.2588653564453125, -0.24935150146484375, -0.239837646484375, -0.23032379150390625, -0.2208099365234375, -0.21129608154296875, -0.2017822265625, -0.19226837158203125, -0.1827545166015625, -0.17324066162109375, -0.163726806640625, -0.15421295166015625, -0.1446990966796875, -0.13518524169921875, -0.12567138671875, -0.11615753173828125, -0.1066436767578125, -0.09712982177734375, -0.087615966796875, -0.07810211181640625, -0.0685882568359375, -0.05907440185546875, -0.049560546875, -0.04004669189453125, -0.0305328369140625, -0.02101898193359375, -0.011505126953125, -0.00199127197265625, 0.0075225830078125, 0.01703643798828125, 0.02655029296875, 0.03606414794921875, 0.0455780029296875, 0.05509185791015625, 0.064605712890625, 0.07411956787109375, 0.0836334228515625, 0.09314727783203125, 0.1026611328125, 0.11217498779296875, 0.1216888427734375, 0.13120269775390625, 0.140716552734375, 0.15023040771484375, 0.1597442626953125, 0.16925811767578125, 0.17877197265625, 0.18828582763671875, 0.1977996826171875, 0.20731353759765625, 0.216827392578125, 0.22634124755859375, 0.2358551025390625, 0.24536895751953125, 0.2548828125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 2.0, 4.0, 8.0, 4.0, 1.0, 9.0, 12.0, 14.0, 10.0, 16.0, 11.0, 20.0, 25.0, 22.0, 33.0, 33.0, 29.0, 37.0, 53.0, 34.0, 41.0, 44.0, 59.0, 33.0, 47.0, 40.0, 27.0, 32.0, 28.0, 30.0, 35.0, 32.0, 38.0, 20.0, 17.0, 17.0, 9.0, 23.0, 10.0, 6.0, 9.0, 3.0, 6.0, 6.0, 4.0, 4.0, 4.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2685546875, -0.2596549987792969, -0.25075531005859375, -0.24185562133789062, -0.2329559326171875, -0.22405624389648438, -0.21515655517578125, -0.20625686645507812, -0.197357177734375, -0.18845748901367188, -0.17955780029296875, -0.17065811157226562, -0.1617584228515625, -0.15285873413085938, -0.14395904541015625, -0.13505935668945312, -0.12615966796875, -0.11725997924804688, -0.10836029052734375, -0.09946060180664062, -0.0905609130859375, -0.08166122436523438, -0.07276153564453125, -0.06386184692382812, -0.054962158203125, -0.046062469482421875, -0.03716278076171875, -0.028263092041015625, -0.0193634033203125, -0.010463714599609375, -0.00156402587890625, 0.007335662841796875, 0.0162353515625, 0.025135040283203125, 0.03403472900390625, 0.042934417724609375, 0.0518341064453125, 0.060733795166015625, 0.06963348388671875, 0.07853317260742188, 0.087432861328125, 0.09633255004882812, 0.10523223876953125, 0.11413192749023438, 0.1230316162109375, 0.13193130493164062, 0.14083099365234375, 0.14973068237304688, 0.15863037109375, 0.16753005981445312, 0.17642974853515625, 0.18532943725585938, 0.1942291259765625, 0.20312881469726562, 0.21202850341796875, 0.22092819213867188, 0.229827880859375, 0.23872756958007812, 0.24762725830078125, 0.2565269470214844, 0.2654266357421875, 0.2743263244628906, 0.28322601318359375, 0.2921257019042969, 0.301025390625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 10.0, 10.0, 8.0, 13.0, 24.0, 30.0, 36.0, 40.0, 71.0, 93.0, 170.0, 257.0, 456.0, 1034.0, 2475.0, 7346.0, 32189.0, 278488.0, 623358.0, 81181.0, 14162.0, 3967.0, 1514.0, 679.0, 343.0, 183.0, 124.0, 81.0, 35.0, 48.0, 28.0, 19.0, 18.0, 13.0, 13.0, 5.0, 4.0, 6.0, 2.0, 6.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.249267578125, -0.24074172973632812, -0.23221588134765625, -0.22369003295898438, -0.2151641845703125, -0.20663833618164062, -0.19811248779296875, -0.18958663940429688, -0.181060791015625, -0.17253494262695312, -0.16400909423828125, -0.15548324584960938, -0.1469573974609375, -0.13843154907226562, -0.12990570068359375, -0.12137985229492188, -0.11285400390625, -0.10432815551757812, -0.09580230712890625, -0.08727645874023438, -0.0787506103515625, -0.07022476196289062, -0.06169891357421875, -0.053173065185546875, -0.044647216796875, -0.036121368408203125, -0.02759552001953125, -0.019069671630859375, -0.0105438232421875, -0.002017974853515625, 0.00650787353515625, 0.015033721923828125, 0.0235595703125, 0.032085418701171875, 0.04061126708984375, 0.049137115478515625, 0.0576629638671875, 0.06618881225585938, 0.07471466064453125, 0.08324050903320312, 0.091766357421875, 0.10029220581054688, 0.10881805419921875, 0.11734390258789062, 0.1258697509765625, 0.13439559936523438, 0.14292144775390625, 0.15144729614257812, 0.15997314453125, 0.16849899291992188, 0.17702484130859375, 0.18555068969726562, 0.1940765380859375, 0.20260238647460938, 0.21112823486328125, 0.21965408325195312, 0.228179931640625, 0.23670578002929688, 0.24523162841796875, 0.2537574768066406, 0.2622833251953125, 0.2708091735839844, 0.27933502197265625, 0.2878608703613281, 0.29638671875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 5.0, 8.0, 5.0, 6.0, 9.0, 16.0, 15.0, 11.0, 14.0, 24.0, 37.0, 32.0, 31.0, 32.0, 30.0, 29.0, 47.0, 44.0, 57.0, 45.0, 48.0, 48.0, 38.0, 54.0, 45.0, 29.0, 26.0, 25.0, 30.0, 27.0, 24.0, 16.0, 18.0, 13.0, 15.0, 8.0, 9.0, 14.0, 6.0, 2.0, 4.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6181640625, -0.5995330810546875, -0.580902099609375, -0.5622711181640625, -0.54364013671875, -0.5250091552734375, -0.506378173828125, -0.4877471923828125, -0.4691162109375, -0.4504852294921875, -0.431854248046875, -0.4132232666015625, -0.39459228515625, -0.3759613037109375, -0.357330322265625, -0.3386993408203125, -0.320068359375, -0.3014373779296875, -0.282806396484375, -0.2641754150390625, -0.24554443359375, -0.2269134521484375, -0.208282470703125, -0.1896514892578125, -0.1710205078125, -0.1523895263671875, -0.133758544921875, -0.1151275634765625, -0.09649658203125, -0.0778656005859375, -0.059234619140625, -0.0406036376953125, -0.02197265625, -0.0033416748046875, 0.015289306640625, 0.0339202880859375, 0.05255126953125, 0.0711822509765625, 0.089813232421875, 0.1084442138671875, 0.1270751953125, 0.1457061767578125, 0.164337158203125, 0.1829681396484375, 0.20159912109375, 0.2202301025390625, 0.238861083984375, 0.2574920654296875, 0.276123046875, 0.2947540283203125, 0.313385009765625, 0.3320159912109375, 0.35064697265625, 0.3692779541015625, 0.387908935546875, 0.4065399169921875, 0.4251708984375, 0.4438018798828125, 0.462432861328125, 0.4810638427734375, 0.49969482421875, 0.5183258056640625, 0.536956787109375, 0.5555877685546875, 0.57421875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 5.0, 0.0, 3.0, 3.0, 6.0, 7.0, 13.0, 22.0, 27.0, 36.0, 62.0, 91.0, 140.0, 220.0, 388.0, 784.0, 1545.0, 3312.0, 8467.0, 27491.0, 133210.0, 571369.0, 238834.0, 42536.0, 11733.0, 4257.0, 1889.0, 916.0, 445.0, 293.0, 156.0, 93.0, 76.0, 38.0, 32.0, 19.0, 12.0, 7.0, 5.0, 6.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08099365234375, -0.07843494415283203, -0.07587623596191406, -0.0733175277709961, -0.07075881958007812, -0.06820011138916016, -0.06564140319824219, -0.06308269500732422, -0.06052398681640625, -0.05796527862548828, -0.05540657043457031, -0.052847862243652344, -0.050289154052734375, -0.047730445861816406, -0.04517173767089844, -0.04261302947998047, -0.0400543212890625, -0.03749561309814453, -0.03493690490722656, -0.032378196716308594, -0.029819488525390625, -0.027260780334472656, -0.024702072143554688, -0.02214336395263672, -0.01958465576171875, -0.01702594757080078, -0.014467239379882812, -0.011908531188964844, -0.009349822998046875, -0.006791114807128906, -0.0042324066162109375, -0.0016736984252929688, 0.000885009765625, 0.0034437179565429688, 0.0060024261474609375, 0.008561134338378906, 0.011119842529296875, 0.013678550720214844, 0.016237258911132812, 0.01879596710205078, 0.02135467529296875, 0.02391338348388672, 0.026472091674804688, 0.029030799865722656, 0.031589508056640625, 0.034148216247558594, 0.03670692443847656, 0.03926563262939453, 0.0418243408203125, 0.04438304901123047, 0.04694175720214844, 0.049500465393066406, 0.052059173583984375, 0.054617881774902344, 0.05717658996582031, 0.05973529815673828, 0.06229400634765625, 0.06485271453857422, 0.06741142272949219, 0.06997013092041016, 0.07252883911132812, 0.0750875473022461, 0.07764625549316406, 0.08020496368408203, 0.082763671875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 2.0, 4.0, 1.0, 3.0, 7.0, 2.0, 4.0, 11.0, 6.0, 17.0, 24.0, 26.0, 36.0, 34.0, 34.0, 61.0, 57.0, 77.0, 86.0, 66.0, 68.0, 65.0, 70.0, 48.0, 36.0, 38.0, 26.0, 12.0, 14.0, 21.0, 7.0, 5.0, 10.0, 3.0, 3.0, 1.0, 3.0, 4.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.8848648071289062e-05, -2.7970410883426666e-05, -2.709217369556427e-05, -2.6213936507701874e-05, -2.5335699319839478e-05, -2.445746213197708e-05, -2.3579224944114685e-05, -2.270098775625229e-05, -2.1822750568389893e-05, -2.0944513380527496e-05, -2.00662761926651e-05, -1.9188039004802704e-05, -1.8309801816940308e-05, -1.743156462907791e-05, -1.6553327441215515e-05, -1.567509025335312e-05, -1.4796853065490723e-05, -1.3918615877628326e-05, -1.304037868976593e-05, -1.2162141501903534e-05, -1.1283904314041138e-05, -1.0405667126178741e-05, -9.527429938316345e-06, -8.649192750453949e-06, -7.770955562591553e-06, -6.8927183747291565e-06, -6.01448118686676e-06, -5.136243999004364e-06, -4.258006811141968e-06, -3.3797696232795715e-06, -2.5015324354171753e-06, -1.623295247554779e-06, -7.450580596923828e-07, 1.3317912817001343e-07, 1.0114163160324097e-06, 1.889653503894806e-06, 2.767890691757202e-06, 3.6461278796195984e-06, 4.524365067481995e-06, 5.402602255344391e-06, 6.280839443206787e-06, 7.159076631069183e-06, 8.03731381893158e-06, 8.915551006793976e-06, 9.793788194656372e-06, 1.0672025382518768e-05, 1.1550262570381165e-05, 1.242849975824356e-05, 1.3306736946105957e-05, 1.4184974133968353e-05, 1.506321132183075e-05, 1.5941448509693146e-05, 1.6819685697555542e-05, 1.7697922885417938e-05, 1.8576160073280334e-05, 1.945439726114273e-05, 2.0332634449005127e-05, 2.1210871636867523e-05, 2.208910882472992e-05, 2.2967346012592316e-05, 2.3845583200454712e-05, 2.4723820388317108e-05, 2.5602057576179504e-05, 2.64802947640419e-05, 2.7358531951904297e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 1.0, 3.0, 6.0, 6.0, 9.0, 18.0, 26.0, 34.0, 67.0, 113.0, 194.0, 376.0, 741.0, 1601.0, 3836.0, 9588.0, 25338.0, 84474.0, 349981.0, 417479.0, 105223.0, 30404.0, 10924.0, 4419.0, 1921.0, 857.0, 413.0, 185.0, 129.0, 52.0, 47.0, 37.0, 15.0, 14.0, 7.0, 10.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.08453369140625, -0.08189868927001953, -0.07926368713378906, -0.0766286849975586, -0.07399368286132812, -0.07135868072509766, -0.06872367858886719, -0.06608867645263672, -0.06345367431640625, -0.06081867218017578, -0.05818367004394531, -0.055548667907714844, -0.052913665771484375, -0.050278663635253906, -0.04764366149902344, -0.04500865936279297, -0.0423736572265625, -0.03973865509033203, -0.03710365295410156, -0.034468650817871094, -0.031833648681640625, -0.029198646545410156, -0.026563644409179688, -0.02392864227294922, -0.02129364013671875, -0.01865863800048828, -0.016023635864257812, -0.013388633728027344, -0.010753631591796875, -0.008118629455566406, -0.0054836273193359375, -0.0028486251831054688, -0.000213623046875, 0.0024213790893554688, 0.0050563812255859375, 0.007691383361816406, 0.010326385498046875, 0.012961387634277344, 0.015596389770507812, 0.01823139190673828, 0.02086639404296875, 0.02350139617919922, 0.026136398315429688, 0.028771400451660156, 0.031406402587890625, 0.034041404724121094, 0.03667640686035156, 0.03931140899658203, 0.0419464111328125, 0.04458141326904297, 0.04721641540527344, 0.049851417541503906, 0.052486419677734375, 0.055121421813964844, 0.05775642395019531, 0.06039142608642578, 0.06302642822265625, 0.06566143035888672, 0.06829643249511719, 0.07093143463134766, 0.07356643676757812, 0.0762014389038086, 0.07883644104003906, 0.08147144317626953, 0.0841064453125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 1.0, 2.0, 4.0, 5.0, 10.0, 4.0, 15.0, 19.0, 13.0, 30.0, 42.0, 55.0, 75.0, 89.0, 103.0, 119.0, 112.0, 69.0, 53.0, 48.0, 34.0, 22.0, 18.0, 16.0, 8.0, 6.0, 10.0, 8.0, 1.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0279541015625, -0.02718067169189453, -0.026407241821289062, -0.025633811950683594, -0.024860382080078125, -0.024086952209472656, -0.023313522338867188, -0.02254009246826172, -0.02176666259765625, -0.02099323272705078, -0.020219802856445312, -0.019446372985839844, -0.018672943115234375, -0.017899513244628906, -0.017126083374023438, -0.01635265350341797, -0.0155792236328125, -0.014805793762207031, -0.014032363891601562, -0.013258934020996094, -0.012485504150390625, -0.011712074279785156, -0.010938644409179688, -0.010165214538574219, -0.00939178466796875, -0.008618354797363281, -0.007844924926757812, -0.007071495056152344, -0.006298065185546875, -0.005524635314941406, -0.0047512054443359375, -0.003977775573730469, -0.003204345703125, -0.0024309158325195312, -0.0016574859619140625, -0.0008840560913085938, -0.000110626220703125, 0.0006628036499023438, 0.0014362335205078125, 0.0022096633911132812, 0.00298309326171875, 0.0037565231323242188, 0.0045299530029296875, 0.005303382873535156, 0.006076812744140625, 0.006850242614746094, 0.0076236724853515625, 0.008397102355957031, 0.0091705322265625, 0.009943962097167969, 0.010717391967773438, 0.011490821838378906, 0.012264251708984375, 0.013037681579589844, 0.013811111450195312, 0.014584541320800781, 0.01535797119140625, 0.01613140106201172, 0.016904830932617188, 0.017678260803222656, 0.018451690673828125, 0.019225120544433594, 0.019998550415039062, 0.02077198028564453, 0.02154541015625]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 4.0, 5.0, 9.0, 6.0, 15.0, 14.0, 17.0, 19.0, 17.0, 33.0, 27.0, 30.0, 61.0, 46.0, 55.0, 55.0, 70.0, 47.0, 57.0, 63.0, 50.0, 47.0, 34.0, 44.0, 33.0, 32.0, 28.0, 14.0, 15.0, 13.0, 10.0, 4.0, 5.0, 9.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.36110061407089233, -0.350521445274353, -0.3399422764778137, -0.3293631076812744, -0.3187839388847351, -0.3082047998905182, -0.2976256310939789, -0.2870464622974396, -0.27646729350090027, -0.26588812470436096, -0.25530895590782166, -0.24472980201244354, -0.23415063321590424, -0.22357146441936493, -0.21299231052398682, -0.2024131417274475, -0.1918339729309082, -0.1812548041343689, -0.1706756353378296, -0.16009648144245148, -0.14951731264591217, -0.13893814384937286, -0.12835898995399475, -0.11777982115745544, -0.10720065236091614, -0.09662148356437683, -0.08604232221841812, -0.07546316087245941, -0.0648839920759201, -0.0543048270046711, -0.04372566193342209, -0.03314650058746338, -0.02256736159324646, -0.011988196521997452, -0.0014090314507484436, 0.009170133620500565, 0.019749298691749573, 0.03032846376299858, 0.04090762883424759, 0.0514867901802063, 0.062065958976745605, 0.07264512777328491, 0.08322428911924362, 0.09380345046520233, 0.10438261926174164, 0.11496178805828094, 0.12554094195365906, 0.13612011075019836, 0.14669927954673767, 0.15727844834327698, 0.16785761713981628, 0.1784367710351944, 0.1890159398317337, 0.199595108628273, 0.21017426252365112, 0.22075343132019043, 0.23133260011672974, 0.24191176891326904, 0.25249093770980835, 0.26307010650634766, 0.27364927530288696, 0.2842284142971039, 0.2948075830936432, 0.3053867518901825, 0.3159659206867218]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 1.0, 2.0, 6.0, 6.0, 7.0, 5.0, 11.0, 9.0, 18.0, 10.0, 15.0, 17.0, 21.0, 18.0, 32.0, 32.0, 29.0, 26.0, 53.0, 42.0, 45.0, 37.0, 47.0, 46.0, 48.0, 34.0, 39.0, 39.0, 40.0, 30.0, 30.0, 31.0, 25.0, 25.0, 17.0, 24.0, 18.0, 13.0, 19.0, 6.0, 3.0, 10.0, 5.0, 6.0, 3.0, 1.0, 2.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2630304992198944, -0.2541731894016266, -0.24531584978103638, -0.23645852506160736, -0.22760120034217834, -0.21874389052391052, -0.2098865658044815, -0.2010292410850525, -0.19217191636562347, -0.18331459164619446, -0.17445726692676544, -0.16559994220733643, -0.1567426323890686, -0.1478852927684784, -0.13902798295021057, -0.13017065823078156, -0.12131333351135254, -0.11245600879192352, -0.1035986840724945, -0.09474136680364609, -0.08588404208421707, -0.07702671736478806, -0.06816940009593964, -0.05931207537651062, -0.050454750657081604, -0.04159742593765259, -0.03274010494351387, -0.023882782086730003, -0.015025459229946136, -0.00616813451051712, 0.0026891864836215973, 0.011546507477760315, 0.02040386199951172, 0.029261184856295586, 0.03811850771307945, 0.04697582870721817, 0.055833153426647186, 0.0646904781460762, 0.07354779541492462, 0.08240512013435364, 0.09126244485378265, 0.10011976957321167, 0.10897709429264069, 0.1178344115614891, 0.12669172883033752, 0.13554906845092773, 0.14440637826919556, 0.15326370298862457, 0.1621210277080536, 0.1709783524274826, 0.17983567714691162, 0.18869300186634064, 0.19755032658576965, 0.20640763640403748, 0.2152649611234665, 0.2241222858428955, 0.23297961056232452, 0.24183693528175354, 0.25069424510002136, 0.2595515847206116, 0.2684088945388794, 0.2772662341594696, 0.2861235439777374, 0.29498088359832764, 0.30383819341659546]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 0.0, 9.0, 5.0, 13.0, 6.0, 18.0, 25.0, 19.0, 41.0, 26.0, 55.0, 103.0, 162.0, 251.0, 393.0, 597.0, 959.0, 1571.0, 2754.0, 4926.0, 9105.0, 18348.0, 41728.0, 109437.0, 301974.0, 337178.0, 127878.0, 47408.0, 20688.0, 9986.0, 5332.0, 3012.0, 1769.0, 999.0, 599.0, 373.0, 272.0, 181.0, 97.0, 70.0, 38.0, 35.0, 33.0, 21.0, 19.0, 10.0, 8.0, 5.0, 8.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 1.0, 0.0, 2.0], "bins": [-0.384765625, -0.37238311767578125, -0.3600006103515625, -0.34761810302734375, -0.335235595703125, -0.32285308837890625, -0.3104705810546875, -0.29808807373046875, -0.28570556640625, -0.27332305908203125, -0.2609405517578125, -0.24855804443359375, -0.236175537109375, -0.22379302978515625, -0.2114105224609375, -0.19902801513671875, -0.1866455078125, -0.17426300048828125, -0.1618804931640625, -0.14949798583984375, -0.137115478515625, -0.12473297119140625, -0.1123504638671875, -0.09996795654296875, -0.08758544921875, -0.07520294189453125, -0.0628204345703125, -0.05043792724609375, -0.038055419921875, -0.02567291259765625, -0.0132904052734375, -0.00090789794921875, 0.011474609375, 0.02385711669921875, 0.0362396240234375, 0.04862213134765625, 0.061004638671875, 0.07338714599609375, 0.0857696533203125, 0.09815216064453125, 0.11053466796875, 0.12291717529296875, 0.1352996826171875, 0.14768218994140625, 0.160064697265625, 0.17244720458984375, 0.1848297119140625, 0.19721221923828125, 0.2095947265625, 0.22197723388671875, 0.2343597412109375, 0.24674224853515625, 0.259124755859375, 0.27150726318359375, 0.2838897705078125, 0.29627227783203125, 0.30865478515625, 0.32103729248046875, 0.3334197998046875, 0.34580230712890625, 0.358184814453125, 0.37056732177734375, 0.3829498291015625, 0.39533233642578125, 0.40771484375]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 6.0, 6.0, 5.0, 4.0, 7.0, 6.0, 7.0, 10.0, 15.0, 13.0, 19.0, 16.0, 22.0, 23.0, 35.0, 25.0, 41.0, 36.0, 41.0, 42.0, 47.0, 53.0, 44.0, 34.0, 43.0, 39.0, 38.0, 46.0, 37.0, 27.0, 31.0, 25.0, 25.0, 19.0, 14.0, 24.0, 17.0, 14.0, 10.0, 8.0, 7.0, 6.0, 6.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.56201171875, -0.5443649291992188, -0.5267181396484375, -0.5090713500976562, -0.491424560546875, -0.47377777099609375, -0.4561309814453125, -0.43848419189453125, -0.42083740234375, -0.40319061279296875, -0.3855438232421875, -0.36789703369140625, -0.350250244140625, -0.33260345458984375, -0.3149566650390625, -0.29730987548828125, -0.2796630859375, -0.26201629638671875, -0.2443695068359375, -0.22672271728515625, -0.209075927734375, -0.19142913818359375, -0.1737823486328125, -0.15613555908203125, -0.13848876953125, -0.12084197998046875, -0.1031951904296875, -0.08554840087890625, -0.067901611328125, -0.05025482177734375, -0.0326080322265625, -0.01496124267578125, 0.002685546875, 0.02033233642578125, 0.0379791259765625, 0.05562591552734375, 0.073272705078125, 0.09091949462890625, 0.1085662841796875, 0.12621307373046875, 0.14385986328125, 0.16150665283203125, 0.1791534423828125, 0.19680023193359375, 0.214447021484375, 0.23209381103515625, 0.2497406005859375, 0.26738739013671875, 0.2850341796875, 0.30268096923828125, 0.3203277587890625, 0.33797454833984375, 0.355621337890625, 0.37326812744140625, 0.3909149169921875, 0.40856170654296875, 0.42620849609375, 0.44385528564453125, 0.4615020751953125, 0.47914886474609375, 0.496795654296875, 0.5144424438476562, 0.5320892333984375, 0.5497360229492188, 0.5673828125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 3.0, 6.0, 11.0, 23.0, 21.0, 39.0, 59.0, 102.0, 143.0, 262.0, 506.0, 1176.0, 3351.0, 13186.0, 74035.0, 597215.0, 308871.0, 37624.0, 7867.0, 2227.0, 862.0, 394.0, 186.0, 116.0, 76.0, 47.0, 35.0, 34.0, 15.0, 16.0, 16.0, 4.0, 10.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.876953125, -0.8517684936523438, -0.8265838623046875, -0.8013992309570312, -0.776214599609375, -0.7510299682617188, -0.7258453369140625, -0.7006607055664062, -0.67547607421875, -0.6502914428710938, -0.6251068115234375, -0.5999221801757812, -0.574737548828125, -0.5495529174804688, -0.5243682861328125, -0.49918365478515625, -0.4739990234375, -0.44881439208984375, -0.4236297607421875, -0.39844512939453125, -0.373260498046875, -0.34807586669921875, -0.3228912353515625, -0.29770660400390625, -0.27252197265625, -0.24733734130859375, -0.2221527099609375, -0.19696807861328125, -0.171783447265625, -0.14659881591796875, -0.1214141845703125, -0.09622955322265625, -0.071044921875, -0.04586029052734375, -0.0206756591796875, 0.00450897216796875, 0.029693603515625, 0.05487823486328125, 0.0800628662109375, 0.10524749755859375, 0.13043212890625, 0.15561676025390625, 0.1808013916015625, 0.20598602294921875, 0.231170654296875, 0.25635528564453125, 0.2815399169921875, 0.30672454833984375, 0.3319091796875, 0.35709381103515625, 0.3822784423828125, 0.40746307373046875, 0.432647705078125, 0.45783233642578125, 0.4830169677734375, 0.5082015991210938, 0.53338623046875, 0.5585708618164062, 0.5837554931640625, 0.6089401245117188, 0.634124755859375, 0.6593093872070312, 0.6844940185546875, 0.7096786499023438, 0.73486328125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 9.0, 13.0, 7.0, 14.0, 19.0, 14.0, 27.0, 27.0, 30.0, 35.0, 40.0, 40.0, 36.0, 46.0, 50.0, 68.0, 53.0, 54.0, 55.0, 35.0, 41.0, 38.0, 43.0, 33.0, 28.0, 21.0, 15.0, 21.0, 18.0, 14.0, 14.0, 8.0, 8.0, 5.0, 5.0, 0.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.8173828125, -0.7937240600585938, -0.7700653076171875, -0.7464065551757812, -0.722747802734375, -0.6990890502929688, -0.6754302978515625, -0.6517715454101562, -0.62811279296875, -0.6044540405273438, -0.5807952880859375, -0.5571365356445312, -0.533477783203125, -0.5098190307617188, -0.4861602783203125, -0.46250152587890625, -0.4388427734375, -0.41518402099609375, -0.3915252685546875, -0.36786651611328125, -0.344207763671875, -0.32054901123046875, -0.2968902587890625, -0.27323150634765625, -0.24957275390625, -0.22591400146484375, -0.2022552490234375, -0.17859649658203125, -0.154937744140625, -0.13127899169921875, -0.1076202392578125, -0.08396148681640625, -0.060302734375, -0.03664398193359375, -0.0129852294921875, 0.01067352294921875, 0.034332275390625, 0.05799102783203125, 0.0816497802734375, 0.10530853271484375, 0.12896728515625, 0.15262603759765625, 0.1762847900390625, 0.19994354248046875, 0.223602294921875, 0.24726104736328125, 0.2709197998046875, 0.29457855224609375, 0.3182373046875, 0.34189605712890625, 0.3655548095703125, 0.38921356201171875, 0.412872314453125, 0.43653106689453125, 0.4601898193359375, 0.48384857177734375, 0.50750732421875, 0.5311660766601562, 0.5548248291015625, 0.5784835815429688, 0.602142333984375, 0.6258010864257812, 0.6494598388671875, 0.6731185913085938, 0.69677734375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 6.0, 12.0, 12.0, 19.0, 30.0, 92.0, 218.0, 896.0, 6463.0, 286220.0, 740953.0, 11809.0, 1339.0, 303.0, 80.0, 51.0, 15.0, 15.0, 7.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.472900390625, -0.4581756591796875, -0.443450927734375, -0.4287261962890625, -0.41400146484375, -0.3992767333984375, -0.384552001953125, -0.3698272705078125, -0.3551025390625, -0.3403778076171875, -0.325653076171875, -0.3109283447265625, -0.29620361328125, -0.2814788818359375, -0.266754150390625, -0.2520294189453125, -0.2373046875, -0.2225799560546875, -0.207855224609375, -0.1931304931640625, -0.17840576171875, -0.1636810302734375, -0.148956298828125, -0.1342315673828125, -0.1195068359375, -0.1047821044921875, -0.090057373046875, -0.0753326416015625, -0.06060791015625, -0.0458831787109375, -0.031158447265625, -0.0164337158203125, -0.001708984375, 0.0130157470703125, 0.027740478515625, 0.0424652099609375, 0.05718994140625, 0.0719146728515625, 0.086639404296875, 0.1013641357421875, 0.1160888671875, 0.1308135986328125, 0.145538330078125, 0.1602630615234375, 0.17498779296875, 0.1897125244140625, 0.204437255859375, 0.2191619873046875, 0.23388671875, 0.2486114501953125, 0.263336181640625, 0.2780609130859375, 0.29278564453125, 0.3075103759765625, 0.322235107421875, 0.3369598388671875, 0.3516845703125, 0.3664093017578125, 0.381134033203125, 0.3958587646484375, 0.41058349609375, 0.4253082275390625, 0.440032958984375, 0.4547576904296875, 0.469482421875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 3.0, 5.0, 8.0, 10.0, 21.0, 25.0, 33.0, 56.0, 109.0, 115.0, 157.0, 140.0, 115.0, 63.0, 43.0, 31.0, 20.0, 8.0, 11.0, 7.0, 7.0, 4.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.7206878662109375e-05, -4.598498344421387e-05, -4.476308822631836e-05, -4.354119300842285e-05, -4.2319297790527344e-05, -4.1097402572631836e-05, -3.987550735473633e-05, -3.865361213684082e-05, -3.743171691894531e-05, -3.6209821701049805e-05, -3.49879264831543e-05, -3.376603126525879e-05, -3.254413604736328e-05, -3.1322240829467773e-05, -3.0100345611572266e-05, -2.8878450393676758e-05, -2.765655517578125e-05, -2.6434659957885742e-05, -2.5212764739990234e-05, -2.3990869522094727e-05, -2.276897430419922e-05, -2.154707908630371e-05, -2.0325183868408203e-05, -1.9103288650512695e-05, -1.7881393432617188e-05, -1.665949821472168e-05, -1.5437602996826172e-05, -1.4215707778930664e-05, -1.2993812561035156e-05, -1.1771917343139648e-05, -1.055002212524414e-05, -9.328126907348633e-06, -8.106231689453125e-06, -6.884336471557617e-06, -5.662441253662109e-06, -4.4405460357666016e-06, -3.2186508178710938e-06, -1.996755599975586e-06, -7.748603820800781e-07, 4.470348358154297e-07, 1.6689300537109375e-06, 2.8908252716064453e-06, 4.112720489501953e-06, 5.334615707397461e-06, 6.556510925292969e-06, 7.778406143188477e-06, 9.000301361083984e-06, 1.0222196578979492e-05, 1.1444091796875e-05, 1.2665987014770508e-05, 1.3887882232666016e-05, 1.5109777450561523e-05, 1.633167266845703e-05, 1.755356788635254e-05, 1.8775463104248047e-05, 1.9997358322143555e-05, 2.1219253540039062e-05, 2.244114875793457e-05, 2.3663043975830078e-05, 2.4884939193725586e-05, 2.6106834411621094e-05, 2.73287296295166e-05, 2.855062484741211e-05, 2.9772520065307617e-05, 3.0994415283203125e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 10.0, 5.0, 8.0, 9.0, 24.0, 24.0, 51.0, 82.0, 124.0, 221.0, 409.0, 826.0, 1927.0, 4538.0, 14889.0, 77018.0, 490825.0, 383065.0, 55829.0, 11615.0, 3803.0, 1634.0, 743.0, 371.0, 215.0, 114.0, 59.0, 34.0, 22.0, 17.0, 15.0, 6.0, 9.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.218017578125, -0.2113933563232422, -0.20476913452148438, -0.19814491271972656, -0.19152069091796875, -0.18489646911621094, -0.17827224731445312, -0.1716480255126953, -0.1650238037109375, -0.1583995819091797, -0.15177536010742188, -0.14515113830566406, -0.13852691650390625, -0.13190269470214844, -0.12527847290039062, -0.11865425109863281, -0.112030029296875, -0.10540580749511719, -0.09878158569335938, -0.09215736389160156, -0.08553314208984375, -0.07890892028808594, -0.07228469848632812, -0.06566047668457031, -0.0590362548828125, -0.05241203308105469, -0.045787811279296875, -0.03916358947753906, -0.03253936767578125, -0.025915145874023438, -0.019290924072265625, -0.012666702270507812, -0.00604248046875, 0.0005817413330078125, 0.007205963134765625, 0.013830184936523438, 0.02045440673828125, 0.027078628540039062, 0.033702850341796875, 0.04032707214355469, 0.0469512939453125, 0.05357551574707031, 0.060199737548828125, 0.06682395935058594, 0.07344818115234375, 0.08007240295410156, 0.08669662475585938, 0.09332084655761719, 0.099945068359375, 0.10656929016113281, 0.11319351196289062, 0.11981773376464844, 0.12644195556640625, 0.13306617736816406, 0.13969039916992188, 0.1463146209716797, 0.1529388427734375, 0.1595630645751953, 0.16618728637695312, 0.17281150817871094, 0.17943572998046875, 0.18605995178222656, 0.19268417358398438, 0.1993083953857422, 0.2059326171875]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 5.0, 13.0, 12.0, 22.0, 25.0, 21.0, 35.0, 48.0, 63.0, 81.0, 99.0, 110.0, 106.0, 91.0, 68.0, 52.0, 42.0, 33.0, 16.0, 16.0, 10.0, 14.0, 5.0, 3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10223388671875, -0.09908008575439453, -0.09592628479003906, -0.0927724838256836, -0.08961868286132812, -0.08646488189697266, -0.08331108093261719, -0.08015727996826172, -0.07700347900390625, -0.07384967803955078, -0.07069587707519531, -0.06754207611083984, -0.06438827514648438, -0.061234474182128906, -0.05808067321777344, -0.05492687225341797, -0.0517730712890625, -0.04861927032470703, -0.04546546936035156, -0.042311668395996094, -0.039157867431640625, -0.036004066467285156, -0.03285026550292969, -0.02969646453857422, -0.02654266357421875, -0.02338886260986328, -0.020235061645507812, -0.017081260681152344, -0.013927459716796875, -0.010773658752441406, -0.0076198577880859375, -0.004466056823730469, -0.001312255859375, 0.0018415451049804688, 0.0049953460693359375, 0.008149147033691406, 0.011302947998046875, 0.014456748962402344, 0.017610549926757812, 0.02076435089111328, 0.02391815185546875, 0.02707195281982422, 0.030225753784179688, 0.033379554748535156, 0.036533355712890625, 0.039687156677246094, 0.04284095764160156, 0.04599475860595703, 0.0491485595703125, 0.05230236053466797, 0.05545616149902344, 0.058609962463378906, 0.061763763427734375, 0.06491756439208984, 0.06807136535644531, 0.07122516632080078, 0.07437896728515625, 0.07753276824951172, 0.08068656921386719, 0.08384037017822266, 0.08699417114257812, 0.0901479721069336, 0.09330177307128906, 0.09645557403564453, 0.099609375]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 6.0, 15.0, 24.0, 45.0, 61.0, 101.0, 143.0, 167.0, 139.0, 127.0, 72.0, 54.0, 27.0, 14.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6877877712249756, -1.6309486627578735, -1.5741095542907715, -1.5172704458236694, -1.4604313373565674, -1.4035923480987549, -1.3467532396316528, -1.2899141311645508, -1.2330750226974487, -1.1762359142303467, -1.1193968057632446, -1.0625576972961426, -1.00571870803833, -0.9488795399665833, -0.892040491104126, -0.8352013826370239, -0.7783622741699219, -0.7215231657028198, -0.6646840572357178, -0.6078450083732605, -0.5510058999061584, -0.4941667914390564, -0.43732771277427673, -0.38048863410949707, -0.323649525642395, -0.26681041717529297, -0.2099713385105133, -0.15313224494457245, -0.09629315137863159, -0.03945404291152954, 0.017385035753250122, 0.07422411441802979, 0.1310633420944214, 0.18790243566036224, 0.2447415292263031, 0.30158060789108276, 0.3584197163581848, 0.41525882482528687, 0.47209790349006653, 0.5289369821548462, 0.5857760906219482, 0.6426151990890503, 0.6994543075561523, 0.7562933564186096, 0.8131324648857117, 0.8699715733528137, 0.926810622215271, 0.983649730682373, 1.040488839149475, 1.0973279476165771, 1.1541670560836792, 1.2110061645507812, 1.2678451538085938, 1.3246843814849854, 1.3815233707427979, 1.4383624792099, 1.495201587677002, 1.552040696144104, 1.608879804611206, 1.665718913078308, 1.7225580215454102, 1.7793970108032227, 1.8362361192703247, 1.8930752277374268, 1.9499143362045288]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 3.0, 3.0, 2.0, 6.0, 3.0, 3.0, 4.0, 10.0, 9.0, 11.0, 14.0, 12.0, 15.0, 20.0, 19.0, 27.0, 31.0, 26.0, 35.0, 30.0, 34.0, 34.0, 47.0, 33.0, 34.0, 35.0, 41.0, 27.0, 34.0, 44.0, 33.0, 42.0, 28.0, 26.0, 24.0, 23.0, 21.0, 28.0, 19.0, 14.0, 21.0, 15.0, 13.0, 11.0, 12.0, 7.0, 10.0, 3.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.832724928855896, -0.803977370262146, -0.7752298712730408, -0.7464823126792908, -0.7177348136901855, -0.6889872550964355, -0.6602396965026855, -0.6314921975135803, -0.6027446985244751, -0.5739971399307251, -0.5452496409416199, -0.5165020823478699, -0.48775458335876465, -0.45900702476501465, -0.43025949597358704, -0.4015119671821594, -0.3727644085884094, -0.3440168797969818, -0.3152693510055542, -0.2865217924118042, -0.257774293422699, -0.22902674973011017, -0.20027920603752136, -0.17153167724609375, -0.14278414845466614, -0.11403661966323853, -0.08528908342123032, -0.05654154717922211, -0.027794018387794495, 0.0009535104036331177, 0.029701054096221924, 0.058448582887649536, 0.08719611167907715, 0.11594364047050476, 0.14469116926193237, 0.17343871295452118, 0.2021862417459488, 0.2309337705373764, 0.2596813142299652, 0.2884288430213928, 0.31717637181282043, 0.34592390060424805, 0.37467142939567566, 0.40341895818710327, 0.43216651678085327, 0.4609140157699585, 0.4896615743637085, 0.5184091329574585, 0.5471566319465637, 0.5759041905403137, 0.604651689529419, 0.633399248123169, 0.6621467471122742, 0.6908943057060242, 0.7196418046951294, 0.7483893632888794, 0.7771369218826294, 0.8058844804763794, 0.8346319794654846, 0.8633795380592346, 0.8921270370483398, 0.9208745956420898, 0.9496221542358398, 0.9783696532249451, 1.0071171522140503]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 9.0, 3.0, 8.0, 8.0, 17.0, 15.0, 32.0, 22.0, 42.0, 54.0, 98.0, 154.0, 263.0, 406.0, 909.0, 1837.0, 4687.0, 14590.0, 84133.0, 1902418.0, 2073988.0, 86521.0, 15269.0, 4853.0, 1938.0, 914.0, 457.0, 213.0, 124.0, 81.0, 56.0, 43.0, 31.0, 28.0, 21.0, 12.0, 4.0, 4.0, 6.0, 6.0, 6.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7978515625, -0.770355224609375, -0.74285888671875, -0.715362548828125, -0.6878662109375, -0.660369873046875, -0.63287353515625, -0.605377197265625, -0.577880859375, -0.550384521484375, -0.52288818359375, -0.495391845703125, -0.4678955078125, -0.440399169921875, -0.41290283203125, -0.385406494140625, -0.35791015625, -0.330413818359375, -0.30291748046875, -0.275421142578125, -0.2479248046875, -0.220428466796875, -0.19293212890625, -0.165435791015625, -0.137939453125, -0.110443115234375, -0.08294677734375, -0.055450439453125, -0.0279541015625, -0.000457763671875, 0.02703857421875, 0.054534912109375, 0.08203125, 0.109527587890625, 0.13702392578125, 0.164520263671875, 0.1920166015625, 0.219512939453125, 0.24700927734375, 0.274505615234375, 0.302001953125, 0.329498291015625, 0.35699462890625, 0.384490966796875, 0.4119873046875, 0.439483642578125, 0.46697998046875, 0.494476318359375, 0.52197265625, 0.549468994140625, 0.57696533203125, 0.604461669921875, 0.6319580078125, 0.659454345703125, 0.68695068359375, 0.714447021484375, 0.741943359375, 0.769439697265625, 0.79693603515625, 0.824432373046875, 0.8519287109375, 0.879425048828125, 0.90692138671875, 0.934417724609375, 0.9619140625]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 8.0, 5.0, 3.0, 8.0, 12.0, 12.0, 7.0, 20.0, 33.0, 26.0, 24.0, 24.0, 35.0, 43.0, 40.0, 44.0, 43.0, 44.0, 55.0, 57.0, 46.0, 49.0, 51.0, 40.0, 32.0, 41.0, 24.0, 30.0, 25.0, 23.0, 19.0, 11.0, 12.0, 13.0, 12.0, 7.0, 8.0, 6.0, 4.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.31005859375, -0.3001251220703125, -0.290191650390625, -0.2802581787109375, -0.27032470703125, -0.2603912353515625, -0.250457763671875, -0.2405242919921875, -0.2305908203125, -0.2206573486328125, -0.210723876953125, -0.2007904052734375, -0.19085693359375, -0.1809234619140625, -0.170989990234375, -0.1610565185546875, -0.151123046875, -0.1411895751953125, -0.131256103515625, -0.1213226318359375, -0.11138916015625, -0.1014556884765625, -0.091522216796875, -0.0815887451171875, -0.0716552734375, -0.0617218017578125, -0.051788330078125, -0.0418548583984375, -0.03192138671875, -0.0219879150390625, -0.012054443359375, -0.0021209716796875, 0.0078125, 0.0177459716796875, 0.027679443359375, 0.0376129150390625, 0.04754638671875, 0.0574798583984375, 0.067413330078125, 0.0773468017578125, 0.0872802734375, 0.0972137451171875, 0.107147216796875, 0.1170806884765625, 0.12701416015625, 0.1369476318359375, 0.146881103515625, 0.1568145751953125, 0.166748046875, 0.1766815185546875, 0.186614990234375, 0.1965484619140625, 0.20648193359375, 0.2164154052734375, 0.226348876953125, 0.2362823486328125, 0.2462158203125, 0.2561492919921875, 0.266082763671875, 0.2760162353515625, 0.28594970703125, 0.2958831787109375, 0.305816650390625, 0.3157501220703125, 0.32568359375]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 17.0, 19.0, 40.0, 93.0, 266.0, 949.0, 6535.0, 326404.0, 3833368.0, 23867.0, 2011.0, 428.0, 159.0, 47.0, 40.0, 20.0, 9.0, 6.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.134765625, -2.0723876953125, -2.010009765625, -1.9476318359375, -1.88525390625, -1.8228759765625, -1.760498046875, -1.6981201171875, -1.6357421875, -1.5733642578125, -1.510986328125, -1.4486083984375, -1.38623046875, -1.3238525390625, -1.261474609375, -1.1990966796875, -1.13671875, -1.0743408203125, -1.011962890625, -0.9495849609375, -0.88720703125, -0.8248291015625, -0.762451171875, -0.7000732421875, -0.6376953125, -0.5753173828125, -0.512939453125, -0.4505615234375, -0.38818359375, -0.3258056640625, -0.263427734375, -0.2010498046875, -0.138671875, -0.0762939453125, -0.013916015625, 0.0484619140625, 0.11083984375, 0.1732177734375, 0.235595703125, 0.2979736328125, 0.3603515625, 0.4227294921875, 0.485107421875, 0.5474853515625, 0.60986328125, 0.6722412109375, 0.734619140625, 0.7969970703125, 0.859375, 0.9217529296875, 0.984130859375, 1.0465087890625, 1.10888671875, 1.1712646484375, 1.233642578125, 1.2960205078125, 1.3583984375, 1.4207763671875, 1.483154296875, 1.5455322265625, 1.60791015625, 1.6702880859375, 1.732666015625, 1.7950439453125, 1.857421875]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 7.0, 14.0, 15.0, 15.0, 30.0, 43.0, 64.0, 113.0, 229.0, 404.0, 682.0, 868.0, 668.0, 400.0, 224.0, 120.0, 57.0, 43.0, 26.0, 20.0, 13.0, 5.0, 7.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2646484375, -0.2550086975097656, -0.24536895751953125, -0.23572921752929688, -0.2260894775390625, -0.21644973754882812, -0.20680999755859375, -0.19717025756835938, -0.187530517578125, -0.17789077758789062, -0.16825103759765625, -0.15861129760742188, -0.1489715576171875, -0.13933181762695312, -0.12969207763671875, -0.12005233764648438, -0.11041259765625, -0.10077285766601562, -0.09113311767578125, -0.08149337768554688, -0.0718536376953125, -0.062213897705078125, -0.05257415771484375, -0.042934417724609375, -0.033294677734375, -0.023654937744140625, -0.01401519775390625, -0.004375457763671875, 0.0052642822265625, 0.014904022216796875, 0.02454376220703125, 0.034183502197265625, 0.0438232421875, 0.053462982177734375, 0.06310272216796875, 0.07274246215820312, 0.0823822021484375, 0.09202194213867188, 0.10166168212890625, 0.11130142211914062, 0.120941162109375, 0.13058090209960938, 0.14022064208984375, 0.14986038208007812, 0.1595001220703125, 0.16913986206054688, 0.17877960205078125, 0.18841934204101562, 0.19805908203125, 0.20769882202148438, 0.21733856201171875, 0.22697830200195312, 0.2366180419921875, 0.24625778198242188, 0.25589752197265625, 0.2655372619628906, 0.275177001953125, 0.2848167419433594, 0.29445648193359375, 0.3040962219238281, 0.3137359619140625, 0.3233757019042969, 0.33301544189453125, 0.3426551818847656, 0.352294921875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 6.0, 0.0, 12.0, 10.0, 16.0, 23.0, 29.0, 30.0, 40.0, 39.0, 44.0, 37.0, 70.0, 41.0, 53.0, 52.0, 47.0, 52.0, 45.0, 46.0, 44.0, 51.0, 38.0, 33.0, 26.0, 20.0, 26.0, 14.0, 11.0, 9.0, 7.0, 8.0, 4.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45826905965805054, -0.44269654154777527, -0.4271239936351776, -0.41155147552490234, -0.3959789574146271, -0.3804064393043518, -0.36483389139175415, -0.3492613732814789, -0.3336888551712036, -0.31811633706092834, -0.3025437891483307, -0.2869712710380554, -0.27139875292778015, -0.2558262348175049, -0.24025368690490723, -0.22468116879463196, -0.2091086208820343, -0.19353608787059784, -0.17796356976032257, -0.1623910367488861, -0.14681851863861084, -0.13124598562717438, -0.11567345261573792, -0.10010092705488205, -0.08452840149402618, -0.06895587593317032, -0.053383346647024155, -0.03781081736087799, -0.022238291800022125, -0.00666576623916626, 0.008906766772270203, 0.024479292333126068, 0.040051817893981934, 0.0556243434548378, 0.07119686901569366, 0.08676940202713013, 0.10234192758798599, 0.11791445314884186, 0.13348698616027832, 0.1490595042705536, 0.16463203728199005, 0.1802045702934265, 0.19577708840370178, 0.21134962141513824, 0.2269221544265747, 0.24249467253684998, 0.25806719064712524, 0.2736397385597229, 0.28921225666999817, 0.30478477478027344, 0.3203573226928711, 0.33592984080314636, 0.35150235891342163, 0.3670749068260193, 0.38264742493629456, 0.3982199430465698, 0.4137924909591675, 0.42936500906944275, 0.4449375569820404, 0.4605100750923157, 0.47608259320259094, 0.4916551113128662, 0.5072276592254639, 0.5228002071380615, 0.5383726954460144]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 9.0, 7.0, 6.0, 3.0, 6.0, 8.0, 16.0, 21.0, 17.0, 17.0, 14.0, 15.0, 26.0, 28.0, 30.0, 34.0, 23.0, 32.0, 34.0, 43.0, 32.0, 34.0, 31.0, 40.0, 26.0, 38.0, 31.0, 33.0, 32.0, 33.0, 29.0, 38.0, 26.0, 26.0, 24.0, 29.0, 15.0, 17.0, 10.0, 17.0, 9.0, 8.0, 8.0, 9.0, 7.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3586704134941101, -0.3468731641769409, -0.33507591485977173, -0.32327866554260254, -0.31148141622543335, -0.29968416690826416, -0.28788691759109497, -0.2760896682739258, -0.2642924189567566, -0.2524951696395874, -0.2406979203224182, -0.22890067100524902, -0.21710342168807983, -0.20530617237091064, -0.19350892305374146, -0.18171167373657227, -0.16991443932056427, -0.15811719000339508, -0.1463199406862259, -0.1345226913690567, -0.12272544205188751, -0.11092819273471832, -0.09913095086812973, -0.08733370155096054, -0.07553645223379135, -0.06373920291662216, -0.05194195359945297, -0.04014470800757408, -0.028347458690404892, -0.016550209373235703, -0.0047529637813568115, 0.007044285535812378, 0.018841534852981567, 0.030638784170150757, 0.042436033487319946, 0.05423327907919884, 0.06603053212165833, 0.07782778143882751, 0.08962502330541611, 0.1014222726225853, 0.11321952193975449, 0.12501676380634308, 0.13681401312351227, 0.14861126244068146, 0.16040851175785065, 0.17220576107501984, 0.18400301039218903, 0.19580025970935822, 0.2075975090265274, 0.2193947583436966, 0.23119200766086578, 0.24298925697803497, 0.25478649139404297, 0.26658374071121216, 0.27838099002838135, 0.29017823934555054, 0.3019754886627197, 0.3137727379798889, 0.3255699872970581, 0.3373672366142273, 0.3491644859313965, 0.3609617352485657, 0.37275898456573486, 0.38455623388290405, 0.39635348320007324]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 8.0, 4.0, 11.0, 8.0, 24.0, 20.0, 22.0, 37.0, 64.0, 82.0, 111.0, 188.0, 291.0, 428.0, 751.0, 1253.0, 2161.0, 3876.0, 6862.0, 12679.0, 28708.0, 114272.0, 463903.0, 307342.0, 62227.0, 20082.0, 10040.0, 5474.0, 3155.0, 1756.0, 1013.0, 625.0, 375.0, 233.0, 148.0, 76.0, 58.0, 56.0, 32.0, 37.0, 19.0, 13.0, 13.0, 8.0, 6.0, 5.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.1778564453125, -0.1727466583251953, -0.16763687133789062, -0.16252708435058594, -0.15741729736328125, -0.15230751037597656, -0.14719772338867188, -0.1420879364013672, -0.1369781494140625, -0.1318683624267578, -0.12675857543945312, -0.12164878845214844, -0.11653900146484375, -0.11142921447753906, -0.10631942749023438, -0.10120964050292969, -0.096099853515625, -0.09099006652832031, -0.08588027954101562, -0.08077049255371094, -0.07566070556640625, -0.07055091857910156, -0.06544113159179688, -0.06033134460449219, -0.0552215576171875, -0.05011177062988281, -0.045001983642578125, -0.03989219665527344, -0.03478240966796875, -0.029672622680664062, -0.024562835693359375, -0.019453048706054688, -0.01434326171875, -0.009233474731445312, -0.004123687744140625, 0.0009860992431640625, 0.00609588623046875, 0.011205673217773438, 0.016315460205078125, 0.021425247192382812, 0.0265350341796875, 0.03164482116699219, 0.036754608154296875, 0.04186439514160156, 0.04697418212890625, 0.05208396911621094, 0.057193756103515625, 0.06230354309082031, 0.067413330078125, 0.07252311706542969, 0.07763290405273438, 0.08274269104003906, 0.08785247802734375, 0.09296226501464844, 0.09807205200195312, 0.10318183898925781, 0.1082916259765625, 0.11340141296386719, 0.11851119995117188, 0.12362098693847656, 0.12873077392578125, 0.13384056091308594, 0.13895034790039062, 0.1440601348876953, 0.149169921875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 4.0, 8.0, 7.0, 16.0, 9.0, 13.0, 18.0, 17.0, 19.0, 16.0, 27.0, 23.0, 26.0, 24.0, 40.0, 23.0, 37.0, 39.0, 38.0, 33.0, 49.0, 34.0, 43.0, 31.0, 32.0, 29.0, 35.0, 35.0, 37.0, 27.0, 40.0, 26.0, 28.0, 16.0, 17.0, 14.0, 12.0, 17.0, 13.0, 4.0, 11.0, 1.0, 6.0, 6.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.227783203125, -0.21980667114257812, -0.21183013916015625, -0.20385360717773438, -0.1958770751953125, -0.18790054321289062, -0.17992401123046875, -0.17194747924804688, -0.163970947265625, -0.15599441528320312, -0.14801788330078125, -0.14004135131835938, -0.1320648193359375, -0.12408828735351562, -0.11611175537109375, -0.10813522338867188, -0.10015869140625, -0.09218215942382812, -0.08420562744140625, -0.07622909545898438, -0.0682525634765625, -0.060276031494140625, -0.05229949951171875, -0.044322967529296875, -0.036346435546875, -0.028369903564453125, -0.02039337158203125, -0.012416839599609375, -0.0044403076171875, 0.003536224365234375, 0.01151275634765625, 0.019489288330078125, 0.0274658203125, 0.035442352294921875, 0.04341888427734375, 0.051395416259765625, 0.0593719482421875, 0.06734848022460938, 0.07532501220703125, 0.08330154418945312, 0.091278076171875, 0.09925460815429688, 0.10723114013671875, 0.11520767211914062, 0.1231842041015625, 0.13116073608398438, 0.13913726806640625, 0.14711380004882812, 0.15509033203125, 0.16306686401367188, 0.17104339599609375, 0.17901992797851562, 0.1869964599609375, 0.19497299194335938, 0.20294952392578125, 0.21092605590820312, 0.218902587890625, 0.22687911987304688, 0.23485565185546875, 0.24283218383789062, 0.2508087158203125, 0.2587852478027344, 0.26676177978515625, 0.2747383117675781, 0.28271484375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 6.0, 10.0, 7.0, 9.0, 16.0, 24.0, 28.0, 70.0, 92.0, 198.0, 375.0, 901.0, 2729.0, 9298.0, 49122.0, 517444.0, 417500.0, 38785.0, 7969.0, 2234.0, 890.0, 394.0, 166.0, 89.0, 59.0, 36.0, 23.0, 18.0, 17.0, 10.0, 9.0, 8.0, 8.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2783203125, -0.27117347717285156, -0.2640266418457031, -0.2568798065185547, -0.24973297119140625, -0.2425861358642578, -0.23543930053710938, -0.22829246520996094, -0.2211456298828125, -0.21399879455566406, -0.20685195922851562, -0.1997051239013672, -0.19255828857421875, -0.1854114532470703, -0.17826461791992188, -0.17111778259277344, -0.163970947265625, -0.15682411193847656, -0.14967727661132812, -0.1425304412841797, -0.13538360595703125, -0.1282367706298828, -0.12108993530273438, -0.11394309997558594, -0.1067962646484375, -0.09964942932128906, -0.09250259399414062, -0.08535575866699219, -0.07820892333984375, -0.07106208801269531, -0.06391525268554688, -0.05676841735839844, -0.04962158203125, -0.04247474670410156, -0.035327911376953125, -0.028181076049804688, -0.02103424072265625, -0.013887405395507812, -0.006740570068359375, 0.0004062652587890625, 0.0075531005859375, 0.014699935913085938, 0.021846771240234375, 0.028993606567382812, 0.03614044189453125, 0.04328727722167969, 0.050434112548828125, 0.05758094787597656, 0.064727783203125, 0.07187461853027344, 0.07902145385742188, 0.08616828918457031, 0.09331512451171875, 0.10046195983886719, 0.10760879516601562, 0.11475563049316406, 0.1219024658203125, 0.12904930114746094, 0.13619613647460938, 0.1433429718017578, 0.15048980712890625, 0.1576366424560547, 0.16478347778320312, 0.17193031311035156, 0.1790771484375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 5.0, 8.0, 7.0, 5.0, 13.0, 15.0, 17.0, 15.0, 29.0, 20.0, 30.0, 26.0, 35.0, 36.0, 44.0, 39.0, 30.0, 37.0, 39.0, 40.0, 37.0, 56.0, 47.0, 37.0, 35.0, 32.0, 32.0, 28.0, 29.0, 36.0, 22.0, 21.0, 19.0, 18.0, 8.0, 7.0, 10.0, 11.0, 11.0, 6.0, 3.0, 1.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.71923828125, -0.6986541748046875, -0.678070068359375, -0.6574859619140625, -0.63690185546875, -0.6163177490234375, -0.595733642578125, -0.5751495361328125, -0.5545654296875, -0.5339813232421875, -0.513397216796875, -0.4928131103515625, -0.47222900390625, -0.4516448974609375, -0.431060791015625, -0.4104766845703125, -0.389892578125, -0.3693084716796875, -0.348724365234375, -0.3281402587890625, -0.30755615234375, -0.2869720458984375, -0.266387939453125, -0.2458038330078125, -0.2252197265625, -0.2046356201171875, -0.184051513671875, -0.1634674072265625, -0.14288330078125, -0.1222991943359375, -0.101715087890625, -0.0811309814453125, -0.060546875, -0.0399627685546875, -0.019378662109375, 0.0012054443359375, 0.02178955078125, 0.0423736572265625, 0.062957763671875, 0.0835418701171875, 0.1041259765625, 0.1247100830078125, 0.145294189453125, 0.1658782958984375, 0.18646240234375, 0.2070465087890625, 0.227630615234375, 0.2482147216796875, 0.268798828125, 0.2893829345703125, 0.309967041015625, 0.3305511474609375, 0.35113525390625, 0.3717193603515625, 0.392303466796875, 0.4128875732421875, 0.4334716796875, 0.4540557861328125, 0.474639892578125, 0.4952239990234375, 0.51580810546875, 0.5363922119140625, 0.556976318359375, 0.5775604248046875, 0.59814453125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 7.0, 6.0, 8.0, 8.0, 17.0, 21.0, 31.0, 46.0, 59.0, 83.0, 127.0, 230.0, 435.0, 753.0, 1413.0, 2699.0, 6111.0, 15206.0, 62146.0, 614966.0, 293050.0, 31823.0, 10373.0, 4343.0, 2029.0, 1077.0, 550.0, 345.0, 193.0, 128.0, 77.0, 59.0, 43.0, 28.0, 17.0, 17.0, 9.0, 8.0, 5.0, 5.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.10699462890625, -0.10392093658447266, -0.10084724426269531, -0.09777355194091797, -0.09469985961914062, -0.09162616729736328, -0.08855247497558594, -0.0854787826538086, -0.08240509033203125, -0.0793313980102539, -0.07625770568847656, -0.07318401336669922, -0.07011032104492188, -0.06703662872314453, -0.06396293640136719, -0.060889244079589844, -0.0578155517578125, -0.054741859436035156, -0.05166816711425781, -0.04859447479248047, -0.045520782470703125, -0.04244709014892578, -0.03937339782714844, -0.036299705505371094, -0.03322601318359375, -0.030152320861816406, -0.027078628540039062, -0.02400493621826172, -0.020931243896484375, -0.01785755157470703, -0.014783859252929688, -0.011710166931152344, -0.008636474609375, -0.005562782287597656, -0.0024890899658203125, 0.0005846023559570312, 0.003658294677734375, 0.006731986999511719, 0.009805679321289062, 0.012879371643066406, 0.01595306396484375, 0.019026756286621094, 0.022100448608398438, 0.02517414093017578, 0.028247833251953125, 0.03132152557373047, 0.03439521789550781, 0.037468910217285156, 0.0405426025390625, 0.043616294860839844, 0.04668998718261719, 0.04976367950439453, 0.052837371826171875, 0.05591106414794922, 0.05898475646972656, 0.062058448791503906, 0.06513214111328125, 0.0682058334350586, 0.07127952575683594, 0.07435321807861328, 0.07742691040039062, 0.08050060272216797, 0.08357429504394531, 0.08664798736572266, 0.0897216796875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 1.0, 2.0, 2.0, 5.0, 7.0, 7.0, 11.0, 27.0, 64.0, 156.0, 274.0, 220.0, 100.0, 48.0, 28.0, 12.0, 9.0, 6.0, 2.0, 1.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.053945541381836e-05, -8.793827146291733e-05, -8.53370875120163e-05, -8.273590356111526e-05, -8.013471961021423e-05, -7.75335356593132e-05, -7.493235170841217e-05, -7.233116775751114e-05, -6.972998380661011e-05, -6.712879985570908e-05, -6.452761590480804e-05, -6.192643195390701e-05, -5.932524800300598e-05, -5.672406405210495e-05, -5.412288010120392e-05, -5.152169615030289e-05, -4.8920512199401855e-05, -4.6319328248500824e-05, -4.371814429759979e-05, -4.111696034669876e-05, -3.851577639579773e-05, -3.59145924448967e-05, -3.3313408493995667e-05, -3.0712224543094635e-05, -2.8111040592193604e-05, -2.5509856641292572e-05, -2.290867269039154e-05, -2.030748873949051e-05, -1.7706304788589478e-05, -1.5105120837688446e-05, -1.2503936886787415e-05, -9.902752935886383e-06, -7.3015689849853516e-06, -4.70038503408432e-06, -2.0992010831832886e-06, 5.019828677177429e-07, 3.1031668186187744e-06, 5.704350769519806e-06, 8.305534720420837e-06, 1.0906718671321869e-05, 1.35079026222229e-05, 1.6109086573123932e-05, 1.8710270524024963e-05, 2.1311454474925995e-05, 2.3912638425827026e-05, 2.6513822376728058e-05, 2.911500632762909e-05, 3.171619027853012e-05, 3.431737422943115e-05, 3.6918558180332184e-05, 3.9519742131233215e-05, 4.212092608213425e-05, 4.472211003303528e-05, 4.732329398393631e-05, 4.992447793483734e-05, 5.252566188573837e-05, 5.5126845836639404e-05, 5.7728029787540436e-05, 6.032921373844147e-05, 6.29303976893425e-05, 6.553158164024353e-05, 6.813276559114456e-05, 7.07339495420456e-05, 7.333513349294662e-05, 7.593631744384766e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 5.0, 7.0, 6.0, 12.0, 17.0, 17.0, 25.0, 40.0, 65.0, 77.0, 124.0, 203.0, 248.0, 384.0, 585.0, 836.0, 1306.0, 1898.0, 3124.0, 5576.0, 10037.0, 21804.0, 57711.0, 191725.0, 404286.0, 227614.0, 69074.0, 24627.0, 11255.0, 6088.0, 3493.0, 2089.0, 1394.0, 909.0, 612.0, 436.0, 300.0, 179.0, 132.0, 63.0, 66.0, 41.0, 23.0, 15.0, 8.0, 12.0, 8.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05633544921875, -0.054605960845947266, -0.05287647247314453, -0.0511469841003418, -0.04941749572753906, -0.04768800735473633, -0.045958518981933594, -0.04422903060913086, -0.042499542236328125, -0.04077005386352539, -0.039040565490722656, -0.03731107711791992, -0.03558158874511719, -0.03385210037231445, -0.03212261199951172, -0.030393123626708984, -0.02866363525390625, -0.026934146881103516, -0.02520465850830078, -0.023475170135498047, -0.021745681762695312, -0.020016193389892578, -0.018286705017089844, -0.01655721664428711, -0.014827728271484375, -0.01309823989868164, -0.011368751525878906, -0.009639263153076172, -0.007909774780273438, -0.006180286407470703, -0.004450798034667969, -0.0027213096618652344, -0.0009918212890625, 0.0007376670837402344, 0.0024671554565429688, 0.004196643829345703, 0.0059261322021484375, 0.007655620574951172, 0.009385108947753906, 0.01111459732055664, 0.012844085693359375, 0.01457357406616211, 0.016303062438964844, 0.018032550811767578, 0.019762039184570312, 0.021491527557373047, 0.02322101593017578, 0.024950504302978516, 0.02667999267578125, 0.028409481048583984, 0.03013896942138672, 0.03186845779418945, 0.03359794616699219, 0.03532743453979492, 0.037056922912597656, 0.03878641128540039, 0.040515899658203125, 0.04224538803100586, 0.043974876403808594, 0.04570436477661133, 0.04743385314941406, 0.0491633415222168, 0.05089282989501953, 0.052622318267822266, 0.054351806640625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 5.0, 6.0, 5.0, 7.0, 10.0, 16.0, 25.0, 40.0, 58.0, 80.0, 107.0, 137.0, 133.0, 98.0, 94.0, 44.0, 36.0, 17.0, 23.0, 9.0, 8.0, 7.0, 8.0, 8.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0263671875, -0.025513887405395508, -0.024660587310791016, -0.023807287216186523, -0.02295398712158203, -0.02210068702697754, -0.021247386932373047, -0.020394086837768555, -0.019540786743164062, -0.01868748664855957, -0.017834186553955078, -0.016980886459350586, -0.016127586364746094, -0.015274286270141602, -0.01442098617553711, -0.013567686080932617, -0.012714385986328125, -0.011861085891723633, -0.01100778579711914, -0.010154485702514648, -0.009301185607910156, -0.008447885513305664, -0.007594585418701172, -0.00674128532409668, -0.0058879852294921875, -0.005034685134887695, -0.004181385040283203, -0.003328084945678711, -0.0024747848510742188, -0.0016214847564697266, -0.0007681846618652344, 8.511543273925781e-05, 0.00093841552734375, 0.0017917156219482422, 0.0026450157165527344, 0.0034983158111572266, 0.004351615905761719, 0.005204916000366211, 0.006058216094970703, 0.006911516189575195, 0.0077648162841796875, 0.00861811637878418, 0.009471416473388672, 0.010324716567993164, 0.011178016662597656, 0.012031316757202148, 0.01288461685180664, 0.013737916946411133, 0.014591217041015625, 0.015444517135620117, 0.01629781723022461, 0.0171511173248291, 0.018004417419433594, 0.018857717514038086, 0.019711017608642578, 0.02056431770324707, 0.021417617797851562, 0.022270917892456055, 0.023124217987060547, 0.02397751808166504, 0.02483081817626953, 0.025684118270874023, 0.026537418365478516, 0.027390718460083008, 0.0282440185546875]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 8.0, 9.0, 18.0, 13.0, 22.0, 27.0, 47.0, 50.0, 58.0, 61.0, 84.0, 70.0, 71.0, 57.0, 61.0, 64.0, 67.0, 50.0, 48.0, 30.0, 26.0, 15.0, 10.0, 13.0, 10.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2583247721195221, -0.24578982591629028, -0.23325487971305847, -0.22071994841098785, -0.20818500220775604, -0.19565005600452423, -0.1831151247024536, -0.1705801784992218, -0.15804523229599, -0.14551028609275818, -0.13297533988952637, -0.12044040858745575, -0.10790546238422394, -0.09537051618099213, -0.08283557742834091, -0.0703006386756897, -0.057765692472457886, -0.04523074999451637, -0.03269580751657486, -0.020160865038633347, -0.0076259225606918335, 0.004909023642539978, 0.017443962395191193, 0.029978901147842407, 0.04251384735107422, 0.05504878982901573, 0.06758373230695724, 0.08011867105960846, 0.09265361726284027, 0.10518856346607208, 0.1177235022187233, 0.1302584409713745, 0.14279335737228394, 0.15532830357551575, 0.16786324977874756, 0.18039818108081818, 0.19293312728405, 0.2054680734872818, 0.21800300478935242, 0.23053795099258423, 0.24307289719581604, 0.25560784339904785, 0.26814278960227966, 0.2806777358055115, 0.2932126522064209, 0.3057476282119751, 0.3182825446128845, 0.33081749081611633, 0.34335243701934814, 0.35588738322257996, 0.36842232942581177, 0.3809572756290436, 0.3934922218322754, 0.4060271382331848, 0.4185620844364166, 0.43109703063964844, 0.44363197684288025, 0.45616692304611206, 0.46870186924934387, 0.4812368154525757, 0.4937717318534851, 0.5063067078590393, 0.5188416242599487, 0.5313766002655029, 0.5439115166664124]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 3.0, 4.0, 1.0, 4.0, 10.0, 7.0, 6.0, 13.0, 9.0, 14.0, 12.0, 15.0, 14.0, 18.0, 21.0, 21.0, 30.0, 27.0, 30.0, 41.0, 35.0, 31.0, 41.0, 29.0, 38.0, 34.0, 37.0, 35.0, 26.0, 32.0, 35.0, 39.0, 38.0, 26.0, 31.0, 29.0, 20.0, 22.0, 22.0, 17.0, 14.0, 14.0, 16.0, 8.0, 6.0, 6.0, 7.0, 5.0, 7.0, 4.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21297743916511536, -0.2057407796382904, -0.19850412011146545, -0.1912674605846405, -0.18403080105781555, -0.1767941415309906, -0.16955748200416565, -0.1623208224773407, -0.15508416295051575, -0.1478475034236908, -0.14061084389686584, -0.1333741843700409, -0.12613752484321594, -0.11890086531639099, -0.11166421324014664, -0.10442755371332169, -0.09719090163707733, -0.08995424211025238, -0.08271758258342743, -0.07548092305660248, -0.06824426352977753, -0.061007607728242874, -0.05377095192670822, -0.04653429239988327, -0.03929763287305832, -0.03206097334623337, -0.024824315682053566, -0.017587658017873764, -0.010350998491048813, -0.0031143389642238617, 0.004122316837310791, 0.011358976364135742, 0.018595635890960693, 0.025832295417785645, 0.033068954944610596, 0.04030561074614525, 0.0475422702729702, 0.05477892979979515, 0.0620155856013298, 0.06925224512815475, 0.0764889046549797, 0.08372556418180466, 0.09096222370862961, 0.09819887578487396, 0.10543553531169891, 0.11267219483852386, 0.11990885436534882, 0.12714551389217377, 0.13438217341899872, 0.14161883294582367, 0.14885549247264862, 0.15609215199947357, 0.16332881152629852, 0.17056547105312347, 0.17780211567878723, 0.18503877520561218, 0.19227543473243713, 0.19951209425926208, 0.20674875378608704, 0.213985413312912, 0.22122207283973694, 0.2284587323665619, 0.23569539189338684, 0.2429320514202118, 0.25016871094703674]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 5.0, 0.0, 6.0, 5.0, 11.0, 10.0, 18.0, 26.0, 23.0, 41.0, 63.0, 87.0, 108.0, 179.0, 264.0, 418.0, 627.0, 979.0, 1734.0, 2872.0, 4953.0, 8576.0, 15551.0, 28557.0, 54189.0, 108856.0, 209304.0, 262507.0, 169230.0, 84786.0, 42151.0, 22485.0, 12478.0, 6979.0, 4050.0, 2361.0, 1483.0, 891.0, 534.0, 370.0, 273.0, 160.0, 113.0, 73.0, 45.0, 39.0, 25.0, 21.0, 13.0, 9.0, 6.0, 9.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.354736328125, -0.3440895080566406, -0.33344268798828125, -0.3227958679199219, -0.3121490478515625, -0.3015022277832031, -0.29085540771484375, -0.2802085876464844, -0.269561767578125, -0.2589149475097656, -0.24826812744140625, -0.23762130737304688, -0.2269744873046875, -0.21632766723632812, -0.20568084716796875, -0.19503402709960938, -0.18438720703125, -0.17374038696289062, -0.16309356689453125, -0.15244674682617188, -0.1417999267578125, -0.13115310668945312, -0.12050628662109375, -0.10985946655273438, -0.099212646484375, -0.08856582641601562, -0.07791900634765625, -0.06727218627929688, -0.0566253662109375, -0.045978546142578125, -0.03533172607421875, -0.024684906005859375, -0.0140380859375, -0.003391265869140625, 0.00725555419921875, 0.017902374267578125, 0.0285491943359375, 0.039196014404296875, 0.04984283447265625, 0.060489654541015625, 0.071136474609375, 0.08178329467773438, 0.09243011474609375, 0.10307693481445312, 0.1137237548828125, 0.12437057495117188, 0.13501739501953125, 0.14566421508789062, 0.15631103515625, 0.16695785522460938, 0.17760467529296875, 0.18825149536132812, 0.1988983154296875, 0.20954513549804688, 0.22019195556640625, 0.23083877563476562, 0.241485595703125, 0.2521324157714844, 0.26277923583984375, 0.2734260559082031, 0.2840728759765625, 0.2947196960449219, 0.30536651611328125, 0.3160133361816406, 0.32666015625]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 2.0, 6.0, 6.0, 7.0, 7.0, 10.0, 15.0, 7.0, 10.0, 13.0, 15.0, 17.0, 19.0, 34.0, 28.0, 23.0, 28.0, 32.0, 36.0, 40.0, 34.0, 36.0, 38.0, 48.0, 39.0, 47.0, 34.0, 21.0, 29.0, 32.0, 29.0, 28.0, 27.0, 37.0, 20.0, 23.0, 16.0, 18.0, 15.0, 13.0, 11.0, 12.0, 7.0, 6.0, 9.0, 5.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.378173828125, -0.3663368225097656, -0.35449981689453125, -0.3426628112792969, -0.3308258056640625, -0.3189888000488281, -0.30715179443359375, -0.2953147888183594, -0.283477783203125, -0.2716407775878906, -0.25980377197265625, -0.24796676635742188, -0.2361297607421875, -0.22429275512695312, -0.21245574951171875, -0.20061874389648438, -0.18878173828125, -0.17694473266601562, -0.16510772705078125, -0.15327072143554688, -0.1414337158203125, -0.12959671020507812, -0.11775970458984375, -0.10592269897460938, -0.094085693359375, -0.08224868774414062, -0.07041168212890625, -0.058574676513671875, -0.0467376708984375, -0.034900665283203125, -0.02306365966796875, -0.011226654052734375, 0.0006103515625, 0.012447357177734375, 0.02428436279296875, 0.036121368408203125, 0.0479583740234375, 0.059795379638671875, 0.07163238525390625, 0.08346939086914062, 0.095306396484375, 0.10714340209960938, 0.11898040771484375, 0.13081741333007812, 0.1426544189453125, 0.15449142456054688, 0.16632843017578125, 0.17816543579101562, 0.19000244140625, 0.20183944702148438, 0.21367645263671875, 0.22551345825195312, 0.2373504638671875, 0.24918746948242188, 0.26102447509765625, 0.2728614807128906, 0.284698486328125, 0.2965354919433594, 0.30837249755859375, 0.3202095031738281, 0.3320465087890625, 0.3438835144042969, 0.35572052001953125, 0.3675575256347656, 0.37939453125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 0.0, 3.0, 2.0, 3.0, 11.0, 6.0, 13.0, 14.0, 15.0, 18.0, 28.0, 53.0, 85.0, 116.0, 153.0, 276.0, 461.0, 680.0, 1285.0, 2356.0, 4527.0, 9229.0, 19761.0, 45892.0, 113214.0, 273824.0, 321160.0, 148499.0, 58687.0, 24723.0, 11572.0, 5338.0, 2872.0, 1479.0, 806.0, 489.0, 303.0, 187.0, 122.0, 93.0, 53.0, 37.0, 34.0, 15.0, 23.0, 11.0, 12.0, 6.0, 3.0, 4.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.447998046875, -0.4336128234863281, -0.41922760009765625, -0.4048423767089844, -0.3904571533203125, -0.3760719299316406, -0.36168670654296875, -0.3473014831542969, -0.332916259765625, -0.3185310363769531, -0.30414581298828125, -0.2897605895996094, -0.2753753662109375, -0.2609901428222656, -0.24660491943359375, -0.23221969604492188, -0.21783447265625, -0.20344924926757812, -0.18906402587890625, -0.17467880249023438, -0.1602935791015625, -0.14590835571289062, -0.13152313232421875, -0.11713790893554688, -0.102752685546875, -0.08836746215820312, -0.07398223876953125, -0.059597015380859375, -0.0452117919921875, -0.030826568603515625, -0.01644134521484375, -0.002056121826171875, 0.0123291015625, 0.026714324951171875, 0.04109954833984375, 0.055484771728515625, 0.0698699951171875, 0.08425521850585938, 0.09864044189453125, 0.11302566528320312, 0.127410888671875, 0.14179611206054688, 0.15618133544921875, 0.17056655883789062, 0.1849517822265625, 0.19933700561523438, 0.21372222900390625, 0.22810745239257812, 0.24249267578125, 0.2568778991699219, 0.27126312255859375, 0.2856483459472656, 0.3000335693359375, 0.3144187927246094, 0.32880401611328125, 0.3431892395019531, 0.357574462890625, 0.3719596862792969, 0.38634490966796875, 0.4007301330566406, 0.4151153564453125, 0.4295005798339844, 0.44388580322265625, 0.4582710266113281, 0.47265625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 8.0, 6.0, 14.0, 8.0, 8.0, 11.0, 18.0, 24.0, 18.0, 23.0, 22.0, 19.0, 23.0, 36.0, 33.0, 40.0, 45.0, 59.0, 45.0, 51.0, 41.0, 38.0, 42.0, 44.0, 39.0, 42.0, 25.0, 23.0, 22.0, 21.0, 22.0, 25.0, 23.0, 11.0, 13.0, 9.0, 5.0, 7.0, 6.0, 3.0, 8.0, 5.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.435302734375, -0.42096710205078125, -0.4066314697265625, -0.39229583740234375, -0.377960205078125, -0.36362457275390625, -0.3492889404296875, -0.33495330810546875, -0.32061767578125, -0.30628204345703125, -0.2919464111328125, -0.27761077880859375, -0.263275146484375, -0.24893951416015625, -0.2346038818359375, -0.22026824951171875, -0.2059326171875, -0.19159698486328125, -0.1772613525390625, -0.16292572021484375, -0.148590087890625, -0.13425445556640625, -0.1199188232421875, -0.10558319091796875, -0.09124755859375, -0.07691192626953125, -0.0625762939453125, -0.04824066162109375, -0.033905029296875, -0.01956939697265625, -0.0052337646484375, 0.00910186767578125, 0.0234375, 0.03777313232421875, 0.0521087646484375, 0.06644439697265625, 0.080780029296875, 0.09511566162109375, 0.1094512939453125, 0.12378692626953125, 0.13812255859375, 0.15245819091796875, 0.1667938232421875, 0.18112945556640625, 0.195465087890625, 0.20980072021484375, 0.2241363525390625, 0.23847198486328125, 0.2528076171875, 0.26714324951171875, 0.2814788818359375, 0.29581451416015625, 0.310150146484375, 0.32448577880859375, 0.3388214111328125, 0.35315704345703125, 0.36749267578125, 0.38182830810546875, 0.3961639404296875, 0.41049957275390625, 0.424835205078125, 0.43917083740234375, 0.4535064697265625, 0.46784210205078125, 0.482177734375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 8.0, 9.0, 10.0, 15.0, 20.0, 33.0, 51.0, 67.0, 125.0, 212.0, 342.0, 647.0, 1283.0, 2563.0, 5422.0, 12080.0, 28673.0, 71440.0, 169510.0, 352770.0, 226941.0, 103049.0, 41563.0, 17011.0, 7590.0, 3406.0, 1699.0, 883.0, 456.0, 265.0, 150.0, 89.0, 52.0, 43.0, 20.0, 18.0, 13.0, 12.0, 8.0, 4.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.09765625, -0.09492111206054688, -0.09218597412109375, -0.08945083618164062, -0.0867156982421875, -0.08398056030273438, -0.08124542236328125, -0.07851028442382812, -0.075775146484375, -0.07304000854492188, -0.07030487060546875, -0.06756973266601562, -0.0648345947265625, -0.062099456787109375, -0.05936431884765625, -0.056629180908203125, -0.05389404296875, -0.051158905029296875, -0.04842376708984375, -0.045688629150390625, -0.0429534912109375, -0.040218353271484375, -0.03748321533203125, -0.034748077392578125, -0.032012939453125, -0.029277801513671875, -0.02654266357421875, -0.023807525634765625, -0.0210723876953125, -0.018337249755859375, -0.01560211181640625, -0.012866973876953125, -0.0101318359375, -0.007396697998046875, -0.00466156005859375, -0.001926422119140625, 0.0008087158203125, 0.003543853759765625, 0.00627899169921875, 0.009014129638671875, 0.011749267578125, 0.014484405517578125, 0.01721954345703125, 0.019954681396484375, 0.0226898193359375, 0.025424957275390625, 0.02816009521484375, 0.030895233154296875, 0.03363037109375, 0.036365509033203125, 0.03910064697265625, 0.041835784912109375, 0.0445709228515625, 0.047306060791015625, 0.05004119873046875, 0.052776336669921875, 0.055511474609375, 0.058246612548828125, 0.06098175048828125, 0.06371688842773438, 0.0664520263671875, 0.06918716430664062, 0.07192230224609375, 0.07465744018554688, 0.077392578125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 4.0, 2.0, 4.0, 3.0, 9.0, 6.0, 6.0, 13.0, 19.0, 15.0, 7.0, 16.0, 30.0, 32.0, 40.0, 32.0, 29.0, 42.0, 41.0, 54.0, 59.0, 101.0, 68.0, 52.0, 50.0, 46.0, 33.0, 21.0, 19.0, 27.0, 25.0, 19.0, 17.0, 13.0, 11.0, 9.0, 1.0, 4.0, 4.0, 6.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4662742614746094e-05, -1.4180317521095276e-05, -1.3697892427444458e-05, -1.321546733379364e-05, -1.2733042240142822e-05, -1.2250617146492004e-05, -1.1768192052841187e-05, -1.1285766959190369e-05, -1.080334186553955e-05, -1.0320916771888733e-05, -9.838491678237915e-06, -9.356066584587097e-06, -8.87364149093628e-06, -8.391216397285461e-06, -7.908791303634644e-06, -7.426366209983826e-06, -6.943941116333008e-06, -6.46151602268219e-06, -5.979090929031372e-06, -5.496665835380554e-06, -5.014240741729736e-06, -4.5318156480789185e-06, -4.049390554428101e-06, -3.5669654607772827e-06, -3.084540367126465e-06, -2.602115273475647e-06, -2.119690179824829e-06, -1.6372650861740112e-06, -1.1548399925231934e-06, -6.724148988723755e-07, -1.8998980522155762e-07, 2.9243528842926025e-07, 7.748603820800781e-07, 1.257285475730896e-06, 1.7397105693817139e-06, 2.2221356630325317e-06, 2.7045607566833496e-06, 3.1869858503341675e-06, 3.6694109439849854e-06, 4.151836037635803e-06, 4.634261131286621e-06, 5.116686224937439e-06, 5.599111318588257e-06, 6.081536412239075e-06, 6.563961505889893e-06, 7.0463865995407104e-06, 7.528811693191528e-06, 8.011236786842346e-06, 8.493661880493164e-06, 8.976086974143982e-06, 9.4585120677948e-06, 9.940937161445618e-06, 1.0423362255096436e-05, 1.0905787348747253e-05, 1.1388212442398071e-05, 1.187063753604889e-05, 1.2353062629699707e-05, 1.2835487723350525e-05, 1.3317912817001343e-05, 1.380033791065216e-05, 1.4282763004302979e-05, 1.4765188097953796e-05, 1.5247613191604614e-05, 1.5730038285255432e-05, 1.621246337890625e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 8.0, 8.0, 18.0, 39.0, 43.0, 58.0, 92.0, 168.0, 215.0, 368.0, 660.0, 962.0, 1662.0, 3177.0, 6287.0, 14491.0, 39792.0, 121563.0, 350456.0, 326163.0, 116372.0, 38195.0, 14240.0, 6213.0, 3070.0, 1643.0, 973.0, 578.0, 376.0, 223.0, 150.0, 103.0, 69.0, 49.0, 23.0, 19.0, 11.0, 5.0, 8.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.12091064453125, -0.11724472045898438, -0.11357879638671875, -0.10991287231445312, -0.1062469482421875, -0.10258102416992188, -0.09891510009765625, -0.09524917602539062, -0.091583251953125, -0.08791732788085938, -0.08425140380859375, -0.08058547973632812, -0.0769195556640625, -0.07325363159179688, -0.06958770751953125, -0.06592178344726562, -0.062255859375, -0.058589935302734375, -0.05492401123046875, -0.051258087158203125, -0.0475921630859375, -0.043926239013671875, -0.04026031494140625, -0.036594390869140625, -0.032928466796875, -0.029262542724609375, -0.02559661865234375, -0.021930694580078125, -0.0182647705078125, -0.014598846435546875, -0.01093292236328125, -0.007266998291015625, -0.00360107421875, 6.4849853515625e-05, 0.00373077392578125, 0.007396697998046875, 0.0110626220703125, 0.014728546142578125, 0.01839447021484375, 0.022060394287109375, 0.025726318359375, 0.029392242431640625, 0.03305816650390625, 0.036724090576171875, 0.0403900146484375, 0.044055938720703125, 0.04772186279296875, 0.051387786865234375, 0.0550537109375, 0.058719635009765625, 0.06238555908203125, 0.06605148315429688, 0.0697174072265625, 0.07338333129882812, 0.07704925537109375, 0.08071517944335938, 0.084381103515625, 0.08804702758789062, 0.09171295166015625, 0.09537887573242188, 0.0990447998046875, 0.10271072387695312, 0.10637664794921875, 0.11004257202148438, 0.11370849609375]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 2.0, 6.0, 8.0, 7.0, 13.0, 10.0, 19.0, 24.0, 32.0, 46.0, 85.0, 88.0, 92.0, 145.0, 83.0, 79.0, 76.0, 46.0, 40.0, 36.0, 19.0, 16.0, 15.0, 5.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09442138671875, -0.09175491333007812, -0.08908843994140625, -0.08642196655273438, -0.0837554931640625, -0.08108901977539062, -0.07842254638671875, -0.07575607299804688, -0.073089599609375, -0.07042312622070312, -0.06775665283203125, -0.06509017944335938, -0.0624237060546875, -0.059757232666015625, -0.05709075927734375, -0.054424285888671875, -0.0517578125, -0.049091339111328125, -0.04642486572265625, -0.043758392333984375, -0.0410919189453125, -0.038425445556640625, -0.03575897216796875, -0.033092498779296875, -0.030426025390625, -0.027759552001953125, -0.02509307861328125, -0.022426605224609375, -0.0197601318359375, -0.017093658447265625, -0.01442718505859375, -0.011760711669921875, -0.00909423828125, -0.006427764892578125, -0.00376129150390625, -0.001094818115234375, 0.0015716552734375, 0.004238128662109375, 0.00690460205078125, 0.009571075439453125, 0.012237548828125, 0.014904022216796875, 0.01757049560546875, 0.020236968994140625, 0.0229034423828125, 0.025569915771484375, 0.02823638916015625, 0.030902862548828125, 0.0335693359375, 0.036235809326171875, 0.03890228271484375, 0.041568756103515625, 0.0442352294921875, 0.046901702880859375, 0.04956817626953125, 0.052234649658203125, 0.054901123046875, 0.057567596435546875, 0.06023406982421875, 0.06290054321289062, 0.0655670166015625, 0.06823348999023438, 0.07089996337890625, 0.07356643676757812, 0.07623291015625]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 1.0, 16.0, 30.0, 76.0, 119.0, 177.0, 226.0, 184.0, 97.0, 43.0, 21.0, 10.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7090682983398438, -0.6407623887062073, -0.5724564790725708, -0.5041505098342896, -0.4358446002006531, -0.3675386905670166, -0.29923275113105774, -0.23092681169509888, -0.1626209020614624, -0.09431497752666473, -0.026009052991867065, 0.0422968715429306, 0.11060279607772827, 0.17890870571136475, 0.2472146451473236, 0.31552058458328247, 0.38382649421691895, 0.4521324038505554, 0.5204383134841919, 0.5887442827224731, 0.6570501923561096, 0.7253561019897461, 0.7936620712280273, 0.8619679808616638, 0.9302738904953003, 0.9985798001289368, 1.0668857097625732, 1.1351916790008545, 1.2034976482391357, 1.2718034982681274, 1.3401094675064087, 1.4084153175354004, 1.4767210483551025, 1.5450270175933838, 1.6133328676223755, 1.6816388368606567, 1.7499446868896484, 1.8182506561279297, 1.886556625366211, 1.9548625946044922, 2.0231685638427734, 2.0914745330810547, 2.159780502319336, 2.228086233139038, 2.2963922023773193, 2.3646981716156006, 2.433004140853882, 2.501310110092163, 2.5696158409118652, 2.6379218101501465, 2.7062277793884277, 2.77453351020813, 2.842839479446411, 2.9111454486846924, 2.9794514179229736, 3.047757387161255, 3.116063117980957, 3.1843690872192383, 3.2526750564575195, 3.3209807872772217, 3.389286756515503, 3.457592725753784, 3.5258986949920654, 3.5942046642303467, 3.662510633468628]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 6.0, 3.0, 3.0, 8.0, 4.0, 10.0, 12.0, 14.0, 20.0, 17.0, 22.0, 17.0, 34.0, 19.0, 31.0, 28.0, 29.0, 37.0, 38.0, 40.0, 44.0, 47.0, 47.0, 41.0, 44.0, 42.0, 34.0, 36.0, 35.0, 37.0, 21.0, 25.0, 34.0, 21.0, 22.0, 13.0, 12.0, 15.0, 4.0, 10.0, 6.0, 4.0, 5.0, 4.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.8490684032440186, -0.8241899013519287, -0.7993113398551941, -0.7744328379631042, -0.7495542764663696, -0.7246757745742798, -0.6997972726821899, -0.6749187707901001, -0.6500402092933655, -0.6251617074012756, -0.600283145904541, -0.5754046440124512, -0.5505261421203613, -0.5256475806236267, -0.5007690787315369, -0.47589054703712463, -0.4510120153427124, -0.42613348364830017, -0.40125495195388794, -0.3763764500617981, -0.35149791836738586, -0.32661938667297363, -0.3017408847808838, -0.27686235308647156, -0.2519838213920593, -0.2271052896976471, -0.20222677290439606, -0.17734825611114502, -0.1524697244167328, -0.12759119272232056, -0.10271267592906952, -0.07783415913581848, -0.052955687046051025, -0.02807716280221939, -0.0031986385583877563, 0.021679885685443878, 0.04655840992927551, 0.07143693417310715, 0.09631545841693878, 0.12119397521018982, 0.14607250690460205, 0.17095103859901428, 0.19582955539226532, 0.22070807218551636, 0.2455866038799286, 0.2704651355743408, 0.29534363746643066, 0.3202221691608429, 0.3451007008552551, 0.36997923254966736, 0.3948577642440796, 0.41973626613616943, 0.44461479783058167, 0.4694933295249939, 0.49437183141708374, 0.5192503929138184, 0.5441288948059082, 0.569007396697998, 0.5938859581947327, 0.6187644600868225, 0.6436430215835571, 0.668521523475647, 0.6934000253677368, 0.7182785272598267, 0.7431570887565613]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 3.0, 6.0, 5.0, 8.0, 15.0, 20.0, 33.0, 30.0, 42.0, 45.0, 97.0, 83.0, 153.0, 190.0, 310.0, 458.0, 803.0, 1463.0, 3090.0, 7410.0, 1009392.0, 14480.0, 6452.0, 2674.0, 1292.0, 674.0, 407.0, 250.0, 172.0, 136.0, 109.0, 82.0, 52.0, 44.0, 27.0, 21.0, 19.0, 9.0, 13.0, 7.0, 3.0, 6.0, 7.0, 1.0, 6.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.1484733819961548, -1.1146049499511719, -1.0807366371154785, -1.0468682050704956, -1.0129997730255127, -0.9791313409805298, -0.9452629685401917, -0.9113945960998535, -0.8775261640548706, -0.8436577320098877, -0.8097893595695496, -0.7759209871292114, -0.7420525550842285, -0.7081841230392456, -0.6743157505989075, -0.6404473781585693, -0.6065789461135864, -0.5727105140686035, -0.5388421416282654, -0.5049737691879272, -0.47110533714294434, -0.4372369349002838, -0.4033685326576233, -0.36950013041496277, -0.33563172817230225, -0.3017633259296417, -0.2678949236869812, -0.23402652144432068, -0.20015811920166016, -0.16628971695899963, -0.1324213147163391, -0.09855291247367859, -0.06468462944030762, -0.030816227197647095, 0.0030521750450134277, 0.03692057728767395, 0.07078897953033447, 0.104657381772995, 0.13852578401565552, 0.17239418625831604, 0.20626258850097656, 0.24013099074363708, 0.2739993929862976, 0.30786779522895813, 0.34173619747161865, 0.3756045997142792, 0.4094730019569397, 0.4433414041996002, 0.47720980644226074, 0.5110782384872437, 0.5449466109275818, 0.5788149833679199, 0.6126834154129028, 0.6465518474578857, 0.6804202198982239, 0.714288592338562, 0.7481570243835449, 0.7820254564285278, 0.815893828868866, 0.8497622013092041, 0.883630633354187, 0.9174990653991699, 0.9513674378395081, 0.9852358102798462, 1.019104242324829]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 5.0, 11.0, 29.0, 61.0, 105.0, 208.0, 418.0, 874.0, 2020.0, 5420.0, 51447384.0, 9048.0, 2588.0, 1120.0, 514.0, 264.0, 131.0, 62.0, 34.0, 12.0, 8.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.287032127380371, -13.804903030395508, -13.322772979736328, -12.840643882751465, -12.358513832092285, -11.876384735107422, -11.394254684448242, -10.912125587463379, -10.429996490478516, -9.947867393493652, -9.465737342834473, -8.98360824584961, -8.50147819519043, -8.019349098205566, -7.537219524383545, -7.055089950561523, -6.572959899902344, -6.090830326080322, -5.608700752258301, -5.1265716552734375, -4.644441604614258, -4.1623125076293945, -3.680182933807373, -3.1980533599853516, -2.71592378616333, -2.2337942123413086, -1.7516647577285767, -1.2695353031158447, -0.7874057292938232, -0.30527615547180176, 0.17685317993164062, 0.6589827537536621, 1.1411113739013672, 1.6232409477233887, 2.10537052154541, 2.5874998569488525, 3.069629430770874, 3.5517590045928955, 4.033888339996338, 4.516017913818359, 4.998147487640381, 5.480277061462402, 5.962406635284424, 6.444536209106445, 6.926665306091309, 7.408795356750488, 7.890924453735352, 8.373054504394531, 8.855183601379395, 9.337312698364258, 9.819442749023438, 10.3015718460083, 10.78370189666748, 11.265830993652344, 11.747961044311523, 12.230090141296387, 12.71221923828125, 13.194348335266113, 13.676478385925293, 14.158607482910156, 14.640737533569336, 15.1228666305542, 15.604995727539062, 16.087125778198242, 16.569255828857422]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 6.0, 4.0, 8.0, 14.0, 19.0, 30.0, 52.0, 71.0, 114.0, 166.0, 253.0, 405.0, 628.0, 1024.0, 1675.0, 2754.0, 4600.0, 7713.0, 13153.0, 22544.0, 39135.0, 66645.0, 114921.0, 189876.0, 292441.0, 433725.0, 2556657.0, 1453624.0, 397620.0, 270369.0, 173204.0, 103507.0, 59736.0, 34902.0, 20177.0, 11734.0, 7298.0, 4051.0, 2540.0, 1509.0, 925.0, 605.0, 390.0, 230.0, 133.0, 86.0, 49.0, 33.0, 28.0, 15.0, 17.0, 12.0, 4.0, 6.0, 1.0, 3.0, 3.0, 3.0], "bins": [-0.75244140625, -0.7295684814453125, -0.706695556640625, -0.6838226318359375, -0.66094970703125, -0.6380767822265625, -0.615203857421875, -0.5923309326171875, -0.5694580078125, -0.5465850830078125, -0.523712158203125, -0.5008392333984375, -0.47796630859375, -0.4550933837890625, -0.432220458984375, -0.4093475341796875, -0.386474609375, -0.3636016845703125, -0.340728759765625, -0.3178558349609375, -0.29498291015625, -0.2721099853515625, -0.249237060546875, -0.2263641357421875, -0.2034912109375, -0.1806182861328125, -0.157745361328125, -0.1348724365234375, -0.11199951171875, -0.0891265869140625, -0.066253662109375, -0.0433807373046875, -0.0205078125, 0.0023651123046875, 0.025238037109375, 0.0481109619140625, 0.07098388671875, 0.0938568115234375, 0.116729736328125, 0.1396026611328125, 0.1624755859375, 0.1853485107421875, 0.208221435546875, 0.2310943603515625, 0.25396728515625, 0.2768402099609375, 0.299713134765625, 0.3225860595703125, 0.345458984375, 0.3683319091796875, 0.391204833984375, 0.4140777587890625, 0.43695068359375, 0.4598236083984375, 0.482696533203125, 0.5055694580078125, 0.5284423828125, 0.5513153076171875, 0.574188232421875, 0.5970611572265625, 0.61993408203125, 0.6428070068359375, 0.665679931640625, 0.6885528564453125, 0.71142578125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 5.0, 12.0, 18.0, 16.0, 26.0, 21.0, 32.0, 44.0, 47.0, 34.0, 57.0, 58.0, 73.0, 181.0, 842.0, 155.0, 46.0, 56.0, 51.0, 44.0, 43.0, 37.0, 27.0, 24.0, 22.0, 9.0, 16.0, 10.0, 11.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2734375, -6.067626953125, -5.86181640625, -5.656005859375, -5.4501953125, -5.244384765625, -5.03857421875, -4.832763671875, -4.626953125, -4.421142578125, -4.21533203125, -4.009521484375, -3.8037109375, -3.597900390625, -3.39208984375, -3.186279296875, -2.98046875, -2.774658203125, -2.56884765625, -2.363037109375, -2.1572265625, -1.951416015625, -1.74560546875, -1.539794921875, -1.333984375, -1.128173828125, -0.92236328125, -0.716552734375, -0.5107421875, -0.304931640625, -0.09912109375, 0.106689453125, 0.3125, 0.518310546875, 0.72412109375, 0.929931640625, 1.1357421875, 1.341552734375, 1.54736328125, 1.753173828125, 1.958984375, 2.164794921875, 2.37060546875, 2.576416015625, 2.7822265625, 2.988037109375, 3.19384765625, 3.399658203125, 3.60546875, 3.811279296875, 4.01708984375, 4.222900390625, 4.4287109375, 4.634521484375, 4.84033203125, 5.046142578125, 5.251953125, 5.457763671875, 5.66357421875, 5.869384765625, 6.0751953125, 6.281005859375, 6.48681640625, 6.692626953125, 6.8984375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 8.0, 11.0, 14.0, 20.0, 35.0, 40.0, 50.0, 103.0, 164.0, 266.0, 417.0, 704.0, 1176.0, 2016.0, 3382.0, 5499.0, 9739.0, 16588.0, 29018.0, 49187.0, 81849.0, 132435.0, 202653.0, 286933.0, 377619.0, 2510639.0, 1454403.0, 360090.0, 272514.0, 189285.0, 122927.0, 74437.0, 44368.0, 26135.0, 15130.0, 8778.0, 5138.0, 3047.0, 1770.0, 1110.0, 646.0, 429.0, 271.0, 133.0, 89.0, 49.0, 37.0, 28.0, 25.0, 10.0, 9.0, 8.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.5283203125, -0.5117645263671875, -0.495208740234375, -0.4786529541015625, -0.46209716796875, -0.4455413818359375, -0.428985595703125, -0.4124298095703125, -0.3958740234375, -0.3793182373046875, -0.362762451171875, -0.3462066650390625, -0.32965087890625, -0.3130950927734375, -0.296539306640625, -0.2799835205078125, -0.263427734375, -0.2468719482421875, -0.230316162109375, -0.2137603759765625, -0.19720458984375, -0.1806488037109375, -0.164093017578125, -0.1475372314453125, -0.1309814453125, -0.1144256591796875, -0.097869873046875, -0.0813140869140625, -0.06475830078125, -0.0482025146484375, -0.031646728515625, -0.0150909423828125, 0.00146484375, 0.0180206298828125, 0.034576416015625, 0.0511322021484375, 0.06768798828125, 0.0842437744140625, 0.100799560546875, 0.1173553466796875, 0.1339111328125, 0.1504669189453125, 0.167022705078125, 0.1835784912109375, 0.20013427734375, 0.2166900634765625, 0.233245849609375, 0.2498016357421875, 0.266357421875, 0.2829132080078125, 0.299468994140625, 0.3160247802734375, 0.33258056640625, 0.3491363525390625, 0.365692138671875, 0.3822479248046875, 0.3988037109375, 0.4153594970703125, 0.431915283203125, 0.4484710693359375, 0.46502685546875, 0.4815826416015625, 0.498138427734375, 0.5146942138671875, 0.53125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 5.0, 9.0, 6.0, 6.0, 21.0, 10.0, 11.0, 18.0, 21.0, 38.0, 22.0, 29.0, 26.0, 47.0, 37.0, 37.0, 47.0, 65.0, 379.0, 667.0, 107.0, 46.0, 43.0, 41.0, 30.0, 27.0, 37.0, 30.0, 16.0, 28.0, 30.0, 19.0, 12.0, 15.0, 12.0, 9.0, 9.0, 3.0, 3.0, 1.0, 7.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.140625, -4.998626708984375, -4.85662841796875, -4.714630126953125, -4.5726318359375, -4.430633544921875, -4.28863525390625, -4.146636962890625, -4.004638671875, -3.862640380859375, -3.72064208984375, -3.578643798828125, -3.4366455078125, -3.294647216796875, -3.15264892578125, -3.010650634765625, -2.86865234375, -2.726654052734375, -2.58465576171875, -2.442657470703125, -2.3006591796875, -2.158660888671875, -2.01666259765625, -1.874664306640625, -1.732666015625, -1.590667724609375, -1.44866943359375, -1.306671142578125, -1.1646728515625, -1.022674560546875, -0.88067626953125, -0.738677978515625, -0.5966796875, -0.454681396484375, -0.31268310546875, -0.170684814453125, -0.0286865234375, 0.113311767578125, 0.25531005859375, 0.397308349609375, 0.539306640625, 0.681304931640625, 0.82330322265625, 0.965301513671875, 1.1072998046875, 1.249298095703125, 1.39129638671875, 1.533294677734375, 1.67529296875, 1.817291259765625, 1.95928955078125, 2.101287841796875, 2.2432861328125, 2.385284423828125, 2.52728271484375, 2.669281005859375, 2.811279296875, 2.953277587890625, 3.09527587890625, 3.237274169921875, 3.3792724609375, 3.521270751953125, 3.66326904296875, 3.805267333984375, 3.947265625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 11.0, 20.0, 14.0, 25.0, 30.0, 38.0, 50.0, 70.0, 98.0, 122.0, 142.0, 165.0, 221.0, 348.0, 498.0, 664.0, 950.0, 1371.0, 2206.0, 3283.0, 5863.0, 10869.0, 20747.0, 41642.0, 82416.0, 199664.0, 5628422.0, 144634.0, 69916.0, 35027.0, 17762.0, 9602.0, 5236.0, 3121.0, 1923.0, 1268.0, 856.0, 613.0, 391.0, 288.0, 217.0, 156.0, 124.0, 88.0, 66.0, 43.0, 51.0, 32.0, 24.0, 12.0, 13.0, 8.0, 5.0, 2.0, 5.0, 7.0, 2.0], "bins": [-1.46875, -1.42474365234375, -1.3807373046875, -1.33673095703125, -1.292724609375, -1.24871826171875, -1.2047119140625, -1.16070556640625, -1.11669921875, -1.07269287109375, -1.0286865234375, -0.98468017578125, -0.940673828125, -0.89666748046875, -0.8526611328125, -0.80865478515625, -0.7646484375, -0.72064208984375, -0.6766357421875, -0.63262939453125, -0.588623046875, -0.54461669921875, -0.5006103515625, -0.45660400390625, -0.41259765625, -0.36859130859375, -0.3245849609375, -0.28057861328125, -0.236572265625, -0.19256591796875, -0.1485595703125, -0.10455322265625, -0.060546875, -0.01654052734375, 0.0274658203125, 0.07147216796875, 0.115478515625, 0.15948486328125, 0.2034912109375, 0.24749755859375, 0.29150390625, 0.33551025390625, 0.3795166015625, 0.42352294921875, 0.467529296875, 0.51153564453125, 0.5555419921875, 0.59954833984375, 0.6435546875, 0.68756103515625, 0.7315673828125, 0.77557373046875, 0.819580078125, 0.86358642578125, 0.9075927734375, 0.95159912109375, 0.99560546875, 1.03961181640625, 1.0836181640625, 1.12762451171875, 1.171630859375, 1.21563720703125, 1.2596435546875, 1.30364990234375, 1.34765625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 5.0, 6.0, 5.0, 5.0, 12.0, 10.0, 11.0, 21.0, 19.0, 30.0, 29.0, 43.0, 39.0, 41.0, 45.0, 33.0, 44.0, 43.0, 415.0, 693.0, 70.0, 42.0, 53.0, 42.0, 47.0, 41.0, 34.0, 26.0, 27.0, 17.0, 8.0, 28.0, 11.0, 10.0, 5.0, 2.0, 4.0, 4.0, 6.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.58203125, -5.4232177734375, -5.264404296875, -5.1055908203125, -4.94677734375, -4.7879638671875, -4.629150390625, -4.4703369140625, -4.3115234375, -4.1527099609375, -3.993896484375, -3.8350830078125, -3.67626953125, -3.5174560546875, -3.358642578125, -3.1998291015625, -3.041015625, -2.8822021484375, -2.723388671875, -2.5645751953125, -2.40576171875, -2.2469482421875, -2.088134765625, -1.9293212890625, -1.7705078125, -1.6116943359375, -1.452880859375, -1.2940673828125, -1.13525390625, -0.9764404296875, -0.817626953125, -0.6588134765625, -0.5, -0.3411865234375, -0.182373046875, -0.0235595703125, 0.13525390625, 0.2940673828125, 0.452880859375, 0.6116943359375, 0.7705078125, 0.9293212890625, 1.088134765625, 1.2469482421875, 1.40576171875, 1.5645751953125, 1.723388671875, 1.8822021484375, 2.041015625, 2.1998291015625, 2.358642578125, 2.5174560546875, 2.67626953125, 2.8350830078125, 2.993896484375, 3.1527099609375, 3.3115234375, 3.4703369140625, 3.629150390625, 3.7879638671875, 3.94677734375, 4.1055908203125, 4.264404296875, 4.4232177734375, 4.58203125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 0.0, 4.0, 3.0, 7.0, 7.0, 11.0, 22.0, 26.0, 31.0, 63.0, 62.0, 88.0, 248.0, 138.0, 62.0, 65.0, 36.0, 31.0, 23.0, 16.0, 11.0, 13.0, 10.0, 10.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-57.83089065551758, -56.24897766113281, -54.66706848144531, -53.08515548706055, -51.50324249267578, -49.92133331298828, -48.339420318603516, -46.75750732421875, -45.17559814453125, -43.593685150146484, -42.011775970458984, -40.42986297607422, -38.84795379638672, -37.26604080200195, -35.68412780761719, -34.10221862792969, -32.52030563354492, -30.93839454650879, -29.356483459472656, -27.77457046508789, -26.192659378051758, -24.610748291015625, -23.02883529663086, -21.446924209594727, -19.865013122558594, -18.28310203552246, -16.701190948486328, -15.119277954101562, -13.53736686706543, -11.955455780029297, -10.373543739318848, -8.791631698608398, -7.209724426269531, -5.62781286239624, -4.045901298522949, -2.463989734649658, -0.8820781707763672, 0.6998333930969238, 2.281744956970215, 3.863656997680664, 5.445568084716797, 7.027479648590088, 8.609391212463379, 10.191303253173828, 11.773214340209961, 13.355125427246094, 14.937037467956543, 16.518949508666992, 18.100860595703125, 19.682771682739258, 21.26468276977539, 22.846595764160156, 24.42850685119629, 26.010417938232422, 27.592330932617188, 29.17424201965332, 30.756153106689453, 32.33806610107422, 33.91997528076172, 35.501888275146484, 37.08380126953125, 38.66571044921875, 40.247623443603516, 41.82953643798828, 43.41144561767578]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 3.0, 4.0, 6.0, 3.0, 6.0, 7.0, 12.0, 12.0, 12.0, 8.0, 9.0, 24.0, 20.0, 23.0, 34.0, 27.0, 47.0, 83.0, 123.0, 149.0, 99.0, 53.0, 43.0, 29.0, 30.0, 23.0, 22.0, 13.0, 15.0, 12.0, 13.0, 6.0, 5.0, 7.0, 4.0, 4.0, 5.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-94.89051818847656, -91.75249481201172, -88.61446380615234, -85.4764404296875, -82.33841705322266, -79.20039367675781, -76.06236267089844, -72.9243392944336, -69.78631591796875, -66.6482925415039, -63.5102653503418, -60.37223815917969, -57.234214782714844, -54.096187591552734, -50.958160400390625, -47.82013702392578, -44.68210983276367, -41.54408264160156, -38.40605926513672, -35.26803207397461, -32.130008697509766, -28.991981506347656, -25.85395622253418, -22.715930938720703, -19.577905654907227, -16.43988037109375, -13.301855087280273, -10.16382884979248, -7.025803565979004, -3.8877782821655273, -0.7497520446777344, 2.388273239135742, 5.526298522949219, 8.664323806762695, 11.802349090576172, 14.940375328063965, 18.078399658203125, 21.216426849365234, 24.35445213317871, 27.492477416992188, 30.630502700805664, 33.76852798461914, 36.90655517578125, 40.044578552246094, 43.1826057434082, 46.32062911987305, 49.458656311035156, 52.5966796875, 55.73470687866211, 58.87273406982422, 62.01075744628906, 65.1487808227539, 68.28681182861328, 71.42483520507812, 74.56285858154297, 77.70088195800781, 80.83891296386719, 83.97693634033203, 87.1149673461914, 90.25299072265625, 93.3910140991211, 96.52903747558594, 99.66706848144531, 102.80509185791016, 105.943115234375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 9.0, 8.0, 9.0, 18.0, 23.0, 32.0, 75.0, 110.0, 194.0, 379.0, 663.0, 1457.0, 3057.0, 7974.0, 26339.0, 186639.0, 3834828.0, 102666.0, 18885.0, 6062.0, 2477.0, 1140.0, 554.0, 292.0, 157.0, 83.0, 53.0, 39.0, 16.0, 15.0, 9.0, 5.0, 7.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1011962890625, -0.09786605834960938, -0.09453582763671875, -0.09120559692382812, -0.0878753662109375, -0.08454513549804688, -0.08121490478515625, -0.07788467407226562, -0.074554443359375, -0.07122421264648438, -0.06789398193359375, -0.06456375122070312, -0.0612335205078125, -0.057903289794921875, -0.05457305908203125, -0.051242828369140625, -0.04791259765625, -0.044582366943359375, -0.04125213623046875, -0.037921905517578125, -0.0345916748046875, -0.031261444091796875, -0.02793121337890625, -0.024600982666015625, -0.021270751953125, -0.017940521240234375, -0.01461029052734375, -0.011280059814453125, -0.0079498291015625, -0.004619598388671875, -0.00128936767578125, 0.002040863037109375, 0.00537109375, 0.008701324462890625, 0.01203155517578125, 0.015361785888671875, 0.0186920166015625, 0.022022247314453125, 0.02535247802734375, 0.028682708740234375, 0.032012939453125, 0.035343170166015625, 0.03867340087890625, 0.042003631591796875, 0.0453338623046875, 0.048664093017578125, 0.05199432373046875, 0.055324554443359375, 0.05865478515625, 0.061985015869140625, 0.06531524658203125, 0.06864547729492188, 0.0719757080078125, 0.07530593872070312, 0.07863616943359375, 0.08196640014648438, 0.085296630859375, 0.08862686157226562, 0.09195709228515625, 0.09528732299804688, 0.0986175537109375, 0.10194778442382812, 0.10527801513671875, 0.10860824584960938, 0.1119384765625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 4.0, 1.0, 6.0, 5.0, 8.0, 8.0, 2.0, 6.0, 5.0, 5.0, 8.0, 18.0, 13.0, 14.0, 13.0, 14.0, 23.0, 21.0, 26.0, 33.0, 47.0, 336.0, 101.0, 45.0, 27.0, 32.0, 22.0, 22.0, 18.0, 15.0, 17.0, 14.0, 8.0, 12.0, 11.0, 3.0, 5.0, 8.0, 3.0, 3.0, 13.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03265380859375, -0.031659841537475586, -0.030665874481201172, -0.029671907424926758, -0.028677940368652344, -0.02768397331237793, -0.026690006256103516, -0.0256960391998291, -0.024702072143554688, -0.023708105087280273, -0.02271413803100586, -0.021720170974731445, -0.02072620391845703, -0.019732236862182617, -0.018738269805908203, -0.01774430274963379, -0.016750335693359375, -0.01575636863708496, -0.014762401580810547, -0.013768434524536133, -0.012774467468261719, -0.011780500411987305, -0.01078653335571289, -0.009792566299438477, -0.008798599243164062, -0.0078046321868896484, -0.006810665130615234, -0.00581669807434082, -0.004822731018066406, -0.003828763961791992, -0.002834796905517578, -0.001840829849243164, -0.00084686279296875, 0.00014710426330566406, 0.0011410713195800781, 0.002135038375854492, 0.0031290054321289062, 0.00412297248840332, 0.005116939544677734, 0.0061109066009521484, 0.0071048736572265625, 0.008098840713500977, 0.00909280776977539, 0.010086774826049805, 0.011080741882324219, 0.012074708938598633, 0.013068675994873047, 0.014062643051147461, 0.015056610107421875, 0.01605057716369629, 0.017044544219970703, 0.018038511276245117, 0.01903247833251953, 0.020026445388793945, 0.02102041244506836, 0.022014379501342773, 0.023008346557617188, 0.0240023136138916, 0.024996280670166016, 0.02599024772644043, 0.026984214782714844, 0.027978181838989258, 0.028972148895263672, 0.029966115951538086, 0.0309600830078125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 1.0, 4.0, 8.0, 7.0, 6.0, 6.0, 20.0, 24.0, 48.0, 98.0, 184.0, 405.0, 1019.0, 3046.0, 12477.0, 76498.0, 1831257.0, 2170872.0, 80684.0, 12492.0, 3278.0, 1026.0, 407.0, 171.0, 111.0, 53.0, 30.0, 15.0, 14.0, 8.0, 9.0, 5.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10870361328125, -0.10482311248779297, -0.10094261169433594, -0.0970621109008789, -0.09318161010742188, -0.08930110931396484, -0.08542060852050781, -0.08154010772705078, -0.07765960693359375, -0.07377910614013672, -0.06989860534667969, -0.06601810455322266, -0.062137603759765625, -0.058257102966308594, -0.05437660217285156, -0.05049610137939453, -0.0466156005859375, -0.04273509979248047, -0.03885459899902344, -0.034974098205566406, -0.031093597412109375, -0.027213096618652344, -0.023332595825195312, -0.01945209503173828, -0.01557159423828125, -0.011691093444824219, -0.0078105926513671875, -0.003930091857910156, -4.9591064453125e-05, 0.0038309097290039062, 0.0077114105224609375, 0.011591911315917969, 0.015472412109375, 0.01935291290283203, 0.023233413696289062, 0.027113914489746094, 0.030994415283203125, 0.034874916076660156, 0.03875541687011719, 0.04263591766357422, 0.04651641845703125, 0.05039691925048828, 0.05427742004394531, 0.058157920837402344, 0.062038421630859375, 0.0659189224243164, 0.06979942321777344, 0.07367992401123047, 0.0775604248046875, 0.08144092559814453, 0.08532142639160156, 0.0892019271850586, 0.09308242797851562, 0.09696292877197266, 0.10084342956542969, 0.10472393035888672, 0.10860443115234375, 0.11248493194580078, 0.11636543273925781, 0.12024593353271484, 0.12412643432617188, 0.1280069351196289, 0.13188743591308594, 0.13576793670654297, 0.1396484375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 2.0, 1.0, 4.0, 6.0, 2.0, 1.0, 6.0, 4.0, 5.0, 8.0, 7.0, 20.0, 23.0, 28.0, 30.0, 34.0, 48.0, 55.0, 86.0, 136.0, 169.0, 278.0, 465.0, 956.0, 639.0, 333.0, 185.0, 144.0, 97.0, 74.0, 49.0, 43.0, 39.0, 17.0, 27.0, 15.0, 11.0, 8.0, 8.0, 2.0, 3.0, 4.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0282135009765625, -0.027156591415405273, -0.026099681854248047, -0.02504277229309082, -0.023985862731933594, -0.022928953170776367, -0.02187204360961914, -0.020815134048461914, -0.019758224487304688, -0.01870131492614746, -0.017644405364990234, -0.016587495803833008, -0.015530586242675781, -0.014473676681518555, -0.013416767120361328, -0.012359857559204102, -0.011302947998046875, -0.010246038436889648, -0.009189128875732422, -0.008132219314575195, -0.007075309753417969, -0.006018400192260742, -0.004961490631103516, -0.003904581069946289, -0.0028476715087890625, -0.001790761947631836, -0.0007338523864746094, 0.0003230571746826172, 0.0013799667358398438, 0.0024368762969970703, 0.003493785858154297, 0.0045506954193115234, 0.00560760498046875, 0.0066645145416259766, 0.007721424102783203, 0.00877833366394043, 0.009835243225097656, 0.010892152786254883, 0.01194906234741211, 0.013005971908569336, 0.014062881469726562, 0.015119791030883789, 0.016176700592041016, 0.017233610153198242, 0.01829051971435547, 0.019347429275512695, 0.020404338836669922, 0.02146124839782715, 0.022518157958984375, 0.0235750675201416, 0.024631977081298828, 0.025688886642456055, 0.02674579620361328, 0.027802705764770508, 0.028859615325927734, 0.02991652488708496, 0.030973434448242188, 0.032030344009399414, 0.03308725357055664, 0.03414416313171387, 0.035201072692871094, 0.03625798225402832, 0.03731489181518555, 0.03837180137634277, 0.0394287109375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 9.0, 8.0, 35.0, 271.0, 485.0, 175.0, 18.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.792648434638977, -0.7743672728538513, -0.7560861706733704, -0.7378050088882446, -0.7195239067077637, -0.7012427449226379, -0.6829615831375122, -0.6646804809570312, -0.6463993191719055, -0.6281181573867798, -0.6098370552062988, -0.5915558934211731, -0.5732747912406921, -0.5549936294555664, -0.5367125272750854, -0.5184313654899597, -0.500150203704834, -0.48186907172203064, -0.4635879397392273, -0.44530677795410156, -0.4270256459712982, -0.4087445139884949, -0.39046338200569153, -0.3721822500228882, -0.3539011478424072, -0.3356200158596039, -0.31733888387680054, -0.2990577220916748, -0.28077659010887146, -0.2624954581260681, -0.24421432614326477, -0.22593317925930023, -0.20765206217765808, -0.18937093019485474, -0.1710897833108902, -0.15280865132808685, -0.13452750444412231, -0.11624637246131897, -0.09796524047851562, -0.07968409359455109, -0.06140296161174774, -0.0431218221783638, -0.024840686470270157, -0.006559550762176514, 0.011721588671207428, 0.03000272810459137, 0.048283860087394714, 0.06656500697135925, 0.0848461389541626, 0.10312727838754654, 0.12140841782093048, 0.13968954980373383, 0.15797069668769836, 0.1762518286705017, 0.19453296065330505, 0.2128141075372696, 0.23109523952007294, 0.24937637150287628, 0.2676575183868408, 0.28593865036964417, 0.3042197823524475, 0.32250094413757324, 0.3407820463180542, 0.35906320810317993, 0.3773443400859833]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 1.0, 0.0, 6.0, 0.0, 6.0, 7.0, 6.0, 16.0, 5.0, 12.0, 14.0, 28.0, 29.0, 34.0, 31.0, 49.0, 49.0, 43.0, 57.0, 49.0, 58.0, 68.0, 65.0, 55.0, 53.0, 36.0, 30.0, 31.0, 32.0, 21.0, 23.0, 14.0, 26.0, 15.0, 7.0, 8.0, 7.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.16186141967773438, -0.15732398629188538, -0.15278655290603638, -0.14824911952018738, -0.14371168613433838, -0.13917425274848938, -0.13463681936264038, -0.13009938597679138, -0.12556195259094238, -0.12102451920509338, -0.11648708581924438, -0.11194965243339539, -0.10741221904754639, -0.10287478566169739, -0.09833734482526779, -0.09379991143941879, -0.0892624706029892, -0.0847250372171402, -0.0801876038312912, -0.0756501704454422, -0.0711127370595932, -0.0665753036737442, -0.062037862837314606, -0.05750042945146561, -0.05296299606561661, -0.04842556267976761, -0.04388812929391861, -0.03935069218277931, -0.03481325879693031, -0.030275825411081314, -0.025738390162587166, -0.021200954914093018, -0.01666352152824402, -0.012126087211072445, -0.007588652893900871, -0.0030512185767292976, 0.001486215740442276, 0.006023649126291275, 0.010561084374785423, 0.015098519623279572, 0.01963595300912857, 0.02417338639497757, 0.028710821643471718, 0.033248256891965866, 0.037785690277814865, 0.042323123663663864, 0.04686056077480316, 0.05139799416065216, 0.05593542754650116, 0.06047286093235016, 0.06501029431819916, 0.06954772770404816, 0.07408516108989716, 0.07862259447574615, 0.08316003531217575, 0.08769746869802475, 0.09223490208387375, 0.09677233546972275, 0.10130976885557175, 0.10584720224142075, 0.11038464307785034, 0.11492207646369934, 0.11945950984954834, 0.12399694323539734, 0.12853437662124634]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 8.0, 8.0, 14.0, 21.0, 35.0, 59.0, 81.0, 122.0, 151.0, 229.0, 308.0, 493.0, 722.0, 998.0, 1559.0, 2196.0, 3538.0, 5313.0, 8458.0, 14529.0, 26427.0, 53737.0, 137151.0, 602492.0, 94030.0, 41828.0, 21103.0, 12282.0, 7118.0, 4597.0, 2923.0, 1883.0, 1308.0, 916.0, 568.0, 398.0, 311.0, 168.0, 128.0, 105.0, 68.0, 52.0, 33.0, 31.0, 21.0, 13.0, 8.0, 6.0, 4.0, 3.0, 2.0, 3.0, 0.0, 5.0], "bins": [-0.0712890625, -0.06914997100830078, -0.06701087951660156, -0.06487178802490234, -0.06273269653320312, -0.060593605041503906, -0.05845451354980469, -0.05631542205810547, -0.05417633056640625, -0.05203723907470703, -0.04989814758300781, -0.047759056091308594, -0.045619964599609375, -0.043480873107910156, -0.04134178161621094, -0.03920269012451172, -0.0370635986328125, -0.03492450714111328, -0.03278541564941406, -0.030646324157714844, -0.028507232666015625, -0.026368141174316406, -0.024229049682617188, -0.02208995819091797, -0.01995086669921875, -0.01781177520751953, -0.015672683715820312, -0.013533592224121094, -0.011394500732421875, -0.009255409240722656, -0.0071163177490234375, -0.004977226257324219, -0.002838134765625, -0.0006990432739257812, 0.0014400482177734375, 0.0035791397094726562, 0.005718231201171875, 0.007857322692871094, 0.009996414184570312, 0.012135505676269531, 0.01427459716796875, 0.01641368865966797, 0.018552780151367188, 0.020691871643066406, 0.022830963134765625, 0.024970054626464844, 0.027109146118164062, 0.02924823760986328, 0.0313873291015625, 0.03352642059326172, 0.03566551208496094, 0.037804603576660156, 0.039943695068359375, 0.042082786560058594, 0.04422187805175781, 0.04636096954345703, 0.04850006103515625, 0.05063915252685547, 0.05277824401855469, 0.054917335510253906, 0.057056427001953125, 0.059195518493652344, 0.06133460998535156, 0.06347370147705078, 0.06561279296875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 6.0, 4.0, 4.0, 4.0, 7.0, 10.0, 7.0, 4.0, 10.0, 13.0, 7.0, 14.0, 16.0, 18.0, 23.0, 17.0, 25.0, 32.0, 51.0, 263.0, 168.0, 44.0, 25.0, 35.0, 26.0, 20.0, 22.0, 17.0, 14.0, 16.0, 12.0, 13.0, 4.0, 12.0, 4.0, 3.0, 4.0, 8.0, 8.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.03265380859375, -0.031661272048950195, -0.03066873550415039, -0.029676198959350586, -0.02868366241455078, -0.027691125869750977, -0.026698589324951172, -0.025706052780151367, -0.024713516235351562, -0.023720979690551758, -0.022728443145751953, -0.02173590660095215, -0.020743370056152344, -0.01975083351135254, -0.018758296966552734, -0.01776576042175293, -0.016773223876953125, -0.01578068733215332, -0.014788150787353516, -0.013795614242553711, -0.012803077697753906, -0.011810541152954102, -0.010818004608154297, -0.009825468063354492, -0.008832931518554688, -0.007840394973754883, -0.006847858428955078, -0.0058553218841552734, -0.004862785339355469, -0.003870248794555664, -0.0028777122497558594, -0.0018851757049560547, -0.00089263916015625, 9.989738464355469e-05, 0.0010924339294433594, 0.002084970474243164, 0.0030775070190429688, 0.0040700435638427734, 0.005062580108642578, 0.006055116653442383, 0.0070476531982421875, 0.008040189743041992, 0.009032726287841797, 0.010025262832641602, 0.011017799377441406, 0.012010335922241211, 0.013002872467041016, 0.01399540901184082, 0.014987945556640625, 0.01598048210144043, 0.016973018646240234, 0.01796555519104004, 0.018958091735839844, 0.01995062828063965, 0.020943164825439453, 0.021935701370239258, 0.022928237915039062, 0.023920774459838867, 0.024913311004638672, 0.025905847549438477, 0.02689838409423828, 0.027890920639038086, 0.02888345718383789, 0.029875993728637695, 0.0308685302734375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 1.0, 5.0, 3.0, 11.0, 7.0, 15.0, 22.0, 21.0, 25.0, 34.0, 53.0, 54.0, 71.0, 105.0, 144.0, 216.0, 353.0, 540.0, 1073.0, 2387.0, 6576.0, 24680.0, 130477.0, 563688.0, 256496.0, 44345.0, 10339.0, 3396.0, 1424.0, 678.0, 404.0, 241.0, 159.0, 114.0, 103.0, 72.0, 36.0, 40.0, 31.0, 25.0, 19.0, 20.0, 15.0, 9.0, 7.0, 4.0, 3.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0872802734375, -0.0846099853515625, -0.081939697265625, -0.0792694091796875, -0.07659912109375, -0.0739288330078125, -0.071258544921875, -0.0685882568359375, -0.06591796875, -0.0632476806640625, -0.060577392578125, -0.0579071044921875, -0.05523681640625, -0.0525665283203125, -0.049896240234375, -0.0472259521484375, -0.0445556640625, -0.0418853759765625, -0.039215087890625, -0.0365447998046875, -0.03387451171875, -0.0312042236328125, -0.028533935546875, -0.0258636474609375, -0.023193359375, -0.0205230712890625, -0.017852783203125, -0.0151824951171875, -0.01251220703125, -0.0098419189453125, -0.007171630859375, -0.0045013427734375, -0.0018310546875, 0.0008392333984375, 0.003509521484375, 0.0061798095703125, 0.00885009765625, 0.0115203857421875, 0.014190673828125, 0.0168609619140625, 0.01953125, 0.0222015380859375, 0.024871826171875, 0.0275421142578125, 0.03021240234375, 0.0328826904296875, 0.035552978515625, 0.0382232666015625, 0.0408935546875, 0.0435638427734375, 0.046234130859375, 0.0489044189453125, 0.05157470703125, 0.0542449951171875, 0.056915283203125, 0.0595855712890625, 0.062255859375, 0.0649261474609375, 0.067596435546875, 0.0702667236328125, 0.07293701171875, 0.0756072998046875, 0.078277587890625, 0.0809478759765625, 0.0836181640625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 1.0, 4.0, 8.0, 8.0, 5.0, 6.0, 13.0, 9.0, 11.0, 16.0, 11.0, 26.0, 11.0, 21.0, 19.0, 26.0, 38.0, 35.0, 27.0, 31.0, 38.0, 38.0, 41.0, 49.0, 34.0, 43.0, 50.0, 35.0, 21.0, 37.0, 33.0, 32.0, 28.0, 26.0, 24.0, 27.0, 18.0, 15.0, 17.0, 17.0, 9.0, 7.0, 11.0, 10.0, 2.0, 5.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.11456298828125, -0.11097145080566406, -0.10737991333007812, -0.10378837585449219, -0.10019683837890625, -0.09660530090332031, -0.09301376342773438, -0.08942222595214844, -0.0858306884765625, -0.08223915100097656, -0.07864761352539062, -0.07505607604980469, -0.07146453857421875, -0.06787300109863281, -0.06428146362304688, -0.06068992614746094, -0.057098388671875, -0.05350685119628906, -0.049915313720703125, -0.04632377624511719, -0.04273223876953125, -0.03914070129394531, -0.035549163818359375, -0.03195762634277344, -0.0283660888671875, -0.024774551391601562, -0.021183013916015625, -0.017591476440429688, -0.01399993896484375, -0.010408401489257812, -0.006816864013671875, -0.0032253265380859375, 0.0003662109375, 0.0039577484130859375, 0.007549285888671875, 0.011140823364257812, 0.01473236083984375, 0.018323898315429688, 0.021915435791015625, 0.025506973266601562, 0.0290985107421875, 0.03269004821777344, 0.036281585693359375, 0.03987312316894531, 0.04346466064453125, 0.04705619812011719, 0.050647735595703125, 0.05423927307128906, 0.057830810546875, 0.06142234802246094, 0.06501388549804688, 0.06860542297363281, 0.07219696044921875, 0.07578849792480469, 0.07938003540039062, 0.08297157287597656, 0.0865631103515625, 0.09015464782714844, 0.09374618530273438, 0.09733772277832031, 0.10092926025390625, 0.10452079772949219, 0.10811233520507812, 0.11170387268066406, 0.11529541015625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 7.0, 7.0, 16.0, 21.0, 24.0, 52.0, 88.0, 146.0, 323.0, 799.0, 2557.0, 16050.0, 769785.0, 246859.0, 8825.0, 1795.0, 589.0, 261.0, 152.0, 77.0, 47.0, 27.0, 16.0, 14.0, 4.0, 10.0, 0.0, 2.0, 0.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09674072265625, -0.09388446807861328, -0.09102821350097656, -0.08817195892333984, -0.08531570434570312, -0.0824594497680664, -0.07960319519042969, -0.07674694061279297, -0.07389068603515625, -0.07103443145751953, -0.06817817687988281, -0.0653219223022461, -0.062465667724609375, -0.059609413146972656, -0.05675315856933594, -0.05389690399169922, -0.0510406494140625, -0.04818439483642578, -0.04532814025878906, -0.042471885681152344, -0.039615631103515625, -0.036759376525878906, -0.03390312194824219, -0.03104686737060547, -0.02819061279296875, -0.02533435821533203, -0.022478103637695312, -0.019621849060058594, -0.016765594482421875, -0.013909339904785156, -0.011053085327148438, -0.008196830749511719, -0.005340576171875, -0.0024843215942382812, 0.0003719329833984375, 0.0032281875610351562, 0.006084442138671875, 0.008940696716308594, 0.011796951293945312, 0.014653205871582031, 0.01750946044921875, 0.02036571502685547, 0.023221969604492188, 0.026078224182128906, 0.028934478759765625, 0.031790733337402344, 0.03464698791503906, 0.03750324249267578, 0.0403594970703125, 0.04321575164794922, 0.04607200622558594, 0.048928260803222656, 0.051784515380859375, 0.054640769958496094, 0.05749702453613281, 0.06035327911376953, 0.06320953369140625, 0.06606578826904297, 0.06892204284667969, 0.0717782974243164, 0.07463455200195312, 0.07749080657958984, 0.08034706115722656, 0.08320331573486328, 0.0860595703125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 11.0, 12.0, 9.0, 20.0, 20.0, 25.0, 39.0, 40.0, 49.0, 60.0, 67.0, 86.0, 103.0, 105.0, 77.0, 70.0, 51.0, 42.0, 31.0, 26.0, 13.0, 4.0, 10.0, 10.0, 7.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.673004150390625e-05, -4.541035741567612e-05, -4.4090673327445984e-05, -4.277098923921585e-05, -4.145130515098572e-05, -4.0131621062755585e-05, -3.881193697452545e-05, -3.749225288629532e-05, -3.6172568798065186e-05, -3.485288470983505e-05, -3.353320062160492e-05, -3.2213516533374786e-05, -3.089383244514465e-05, -2.957414835691452e-05, -2.8254464268684387e-05, -2.6934780180454254e-05, -2.561509609222412e-05, -2.4295412003993988e-05, -2.2975727915763855e-05, -2.1656043827533722e-05, -2.033635973930359e-05, -1.9016675651073456e-05, -1.7696991562843323e-05, -1.637730747461319e-05, -1.5057623386383057e-05, -1.3737939298152924e-05, -1.241825520992279e-05, -1.1098571121692657e-05, -9.778887033462524e-06, -8.459202945232391e-06, -7.139518857002258e-06, -5.819834768772125e-06, -4.500150680541992e-06, -3.180466592311859e-06, -1.860782504081726e-06, -5.41098415851593e-07, 7.7858567237854e-07, 2.098269760608673e-06, 3.417953848838806e-06, 4.737637937068939e-06, 6.057322025299072e-06, 7.377006113529205e-06, 8.696690201759338e-06, 1.0016374289989471e-05, 1.1336058378219604e-05, 1.2655742466449738e-05, 1.397542655467987e-05, 1.5295110642910004e-05, 1.6614794731140137e-05, 1.793447881937027e-05, 1.9254162907600403e-05, 2.0573846995830536e-05, 2.189353108406067e-05, 2.3213215172290802e-05, 2.4532899260520935e-05, 2.5852583348751068e-05, 2.71722674369812e-05, 2.8491951525211334e-05, 2.9811635613441467e-05, 3.11313197016716e-05, 3.2451003789901733e-05, 3.3770687878131866e-05, 3.5090371966362e-05, 3.641005605459213e-05, 3.7729740142822266e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 12.0, 11.0, 19.0, 12.0, 18.0, 32.0, 43.0, 74.0, 117.0, 206.0, 374.0, 729.0, 1596.0, 4131.0, 13474.0, 75468.0, 602233.0, 300400.0, 36354.0, 8168.0, 2611.0, 1135.0, 588.0, 291.0, 161.0, 95.0, 64.0, 43.0, 16.0, 26.0, 16.0, 12.0, 11.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03662109375, -0.03530406951904297, -0.03398704528808594, -0.032670021057128906, -0.031352996826171875, -0.030035972595214844, -0.028718948364257812, -0.02740192413330078, -0.02608489990234375, -0.02476787567138672, -0.023450851440429688, -0.022133827209472656, -0.020816802978515625, -0.019499778747558594, -0.018182754516601562, -0.01686573028564453, -0.0155487060546875, -0.014231681823730469, -0.012914657592773438, -0.011597633361816406, -0.010280609130859375, -0.008963584899902344, -0.0076465606689453125, -0.006329536437988281, -0.00501251220703125, -0.0036954879760742188, -0.0023784637451171875, -0.0010614395141601562, 0.000255584716796875, 0.0015726089477539062, 0.0028896331787109375, 0.004206657409667969, 0.005523681640625, 0.006840705871582031, 0.008157730102539062, 0.009474754333496094, 0.010791778564453125, 0.012108802795410156, 0.013425827026367188, 0.014742851257324219, 0.01605987548828125, 0.01737689971923828, 0.018693923950195312, 0.020010948181152344, 0.021327972412109375, 0.022644996643066406, 0.023962020874023438, 0.02527904510498047, 0.0265960693359375, 0.02791309356689453, 0.029230117797851562, 0.030547142028808594, 0.031864166259765625, 0.033181190490722656, 0.03449821472167969, 0.03581523895263672, 0.03713226318359375, 0.03844928741455078, 0.03976631164550781, 0.041083335876464844, 0.042400360107421875, 0.043717384338378906, 0.04503440856933594, 0.04635143280029297, 0.04766845703125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 10.0, 1.0, 6.0, 8.0, 7.0, 8.0, 15.0, 20.0, 17.0, 24.0, 35.0, 42.0, 51.0, 72.0, 101.0, 89.0, 89.0, 92.0, 73.0, 62.0, 45.0, 26.0, 24.0, 25.0, 10.0, 11.0, 9.0, 8.0, 5.0, 5.0, 6.0, 7.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.03594970703125, -0.0346064567565918, -0.033263206481933594, -0.03191995620727539, -0.030576705932617188, -0.029233455657958984, -0.02789020538330078, -0.026546955108642578, -0.025203704833984375, -0.023860454559326172, -0.02251720428466797, -0.021173954010009766, -0.019830703735351562, -0.01848745346069336, -0.017144203186035156, -0.015800952911376953, -0.01445770263671875, -0.013114452362060547, -0.011771202087402344, -0.01042795181274414, -0.009084701538085938, -0.007741451263427734, -0.006398200988769531, -0.005054950714111328, -0.003711700439453125, -0.002368450164794922, -0.0010251998901367188, 0.0003180503845214844, 0.0016613006591796875, 0.0030045509338378906, 0.004347801208496094, 0.005691051483154297, 0.0070343017578125, 0.008377552032470703, 0.009720802307128906, 0.01106405258178711, 0.012407302856445312, 0.013750553131103516, 0.015093803405761719, 0.016437053680419922, 0.017780303955078125, 0.019123554229736328, 0.02046680450439453, 0.021810054779052734, 0.023153305053710938, 0.02449655532836914, 0.025839805603027344, 0.027183055877685547, 0.02852630615234375, 0.029869556427001953, 0.031212806701660156, 0.03255605697631836, 0.03389930725097656, 0.035242557525634766, 0.03658580780029297, 0.03792905807495117, 0.039272308349609375, 0.04061555862426758, 0.04195880889892578, 0.043302059173583984, 0.04464530944824219, 0.04598855972290039, 0.047331809997558594, 0.0486750602722168, 0.050018310546875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 8.0, 26.0, 65.0, 350.0, 469.0, 65.0, 15.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9441184997558594, -2.885402202606201, -2.826685905456543, -2.7679696083068848, -2.7092533111572266, -2.6505370140075684, -2.59182071685791, -2.533104419708252, -2.4743881225585938, -2.4156718254089355, -2.3569555282592773, -2.298239231109619, -2.239522933959961, -2.1808066368103027, -2.1220903396606445, -2.0633740425109863, -2.004657745361328, -1.94594144821167, -1.8872251510620117, -1.8285088539123535, -1.7697925567626953, -1.711076259613037, -1.652359962463379, -1.5936436653137207, -1.5349271297454834, -1.4762108325958252, -1.417494535446167, -1.3587782382965088, -1.3000619411468506, -1.2413456439971924, -1.1826293468475342, -1.123913049697876, -1.0651967525482178, -1.0064804553985596, -0.9477641582489014, -0.8890478610992432, -0.830331563949585, -0.7716152667999268, -0.7128989100456238, -0.6541826128959656, -0.5954663753509521, -0.536750078201294, -0.47803378105163574, -0.41931745409965515, -0.36060115694999695, -0.30188485980033875, -0.24316853284835815, -0.18445223569869995, -0.12573593854904175, -0.06701963394880295, -0.008303329348564148, 0.05041298270225525, 0.10912927985191345, 0.16784557700157166, 0.22656190395355225, 0.28527820110321045, 0.34399449825286865, 0.40271079540252686, 0.46142709255218506, 0.5201433897018433, 0.5788596868515015, 0.6375759840011597, 0.6962923407554626, 0.7550086379051208, 0.813724935054779]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 8.0, 6.0, 5.0, 5.0, 19.0, 22.0, 34.0, 63.0, 83.0, 137.0, 161.0, 133.0, 93.0, 62.0, 34.0, 24.0, 20.0, 11.0, 10.0, 10.0, 5.0, 7.0, 4.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8981820344924927, -1.8322393894195557, -1.7662968635559082, -1.7003542184829712, -1.6344115734100342, -1.5684689283370972, -1.5025262832641602, -1.4365837574005127, -1.3706411123275757, -1.3046984672546387, -1.2387559413909912, -1.1728132963180542, -1.1068706512451172, -1.0409280061721802, -0.9749854207038879, -0.9090428352355957, -0.8431001901626587, -0.7771575450897217, -0.7112149596214294, -0.6452723741531372, -0.5793297290802002, -0.5133870840072632, -0.44744449853897095, -0.3815018832683563, -0.3155592679977417, -0.24961665272712708, -0.18367403745651245, -0.11773142218589783, -0.0517888069152832, 0.014153808355331421, 0.08009642362594604, 0.14603903889656067, 0.21198177337646484, 0.27792438864707947, 0.3438670039176941, 0.4098096191883087, 0.47575223445892334, 0.5416948795318604, 0.6076374650001526, 0.6735800504684448, 0.7395226955413818, 0.8054653406143188, 0.8714079260826111, 0.9373505115509033, 1.0032931566238403, 1.0692358016967773, 1.1351783275604248, 1.2011209726333618, 1.2670636177062988, 1.3330062627792358, 1.3989489078521729, 1.4648914337158203, 1.5308340787887573, 1.5967767238616943, 1.6627192497253418, 1.7286618947982788, 1.7946045398712158, 1.8605471849441528, 1.9264898300170898, 1.9924323558807373, 2.0583748817443848, 2.1243176460266113, 2.190260171890259, 2.2562029361724854, 2.322145462036133]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 10.0, 9.0, 14.0, 15.0, 18.0, 27.0, 33.0, 68.0, 125.0, 172.0, 293.0, 508.0, 911.0, 1669.0, 3482.0, 7065.0, 16481.0, 50495.0, 368016.0, 3596709.0, 99269.0, 27041.0, 10945.0, 5085.0, 2526.0, 1384.0, 755.0, 414.0, 228.0, 166.0, 113.0, 65.0, 37.0, 45.0, 15.0, 21.0, 15.0, 9.0, 11.0, 8.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.26123046875, -0.25258636474609375, -0.2439422607421875, -0.23529815673828125, -0.226654052734375, -0.21800994873046875, -0.2093658447265625, -0.20072174072265625, -0.19207763671875, -0.18343353271484375, -0.1747894287109375, -0.16614532470703125, -0.157501220703125, -0.14885711669921875, -0.1402130126953125, -0.13156890869140625, -0.1229248046875, -0.11428070068359375, -0.1056365966796875, -0.09699249267578125, -0.088348388671875, -0.07970428466796875, -0.0710601806640625, -0.06241607666015625, -0.05377197265625, -0.04512786865234375, -0.0364837646484375, -0.02783966064453125, -0.019195556640625, -0.01055145263671875, -0.0019073486328125, 0.00673675537109375, 0.015380859375, 0.02402496337890625, 0.0326690673828125, 0.04131317138671875, 0.049957275390625, 0.05860137939453125, 0.0672454833984375, 0.07588958740234375, 0.08453369140625, 0.09317779541015625, 0.1018218994140625, 0.11046600341796875, 0.119110107421875, 0.12775421142578125, 0.1363983154296875, 0.14504241943359375, 0.1536865234375, 0.16233062744140625, 0.1709747314453125, 0.17961883544921875, 0.188262939453125, 0.19690704345703125, 0.2055511474609375, 0.21419525146484375, 0.22283935546875, 0.23148345947265625, 0.2401275634765625, 0.24877166748046875, 0.257415771484375, 0.26605987548828125, 0.2747039794921875, 0.28334808349609375, 0.2919921875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 4.0, 4.0, 6.0, 5.0, 3.0, 9.0, 8.0, 11.0, 12.0, 17.0, 18.0, 16.0, 19.0, 29.0, 26.0, 44.0, 76.0, 204.0, 152.0, 64.0, 53.0, 28.0, 31.0, 22.0, 20.0, 20.0, 14.0, 10.0, 13.0, 11.0, 12.0, 6.0, 6.0, 4.0, 8.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.034332275390625, -0.033356428146362305, -0.03238058090209961, -0.031404733657836914, -0.03042888641357422, -0.029453039169311523, -0.028477191925048828, -0.027501344680786133, -0.026525497436523438, -0.025549650192260742, -0.024573802947998047, -0.02359795570373535, -0.022622108459472656, -0.02164626121520996, -0.020670413970947266, -0.01969456672668457, -0.018718719482421875, -0.01774287223815918, -0.016767024993896484, -0.01579117774963379, -0.014815330505371094, -0.013839483261108398, -0.012863636016845703, -0.011887788772583008, -0.010911941528320312, -0.009936094284057617, -0.008960247039794922, -0.007984399795532227, -0.007008552551269531, -0.006032705307006836, -0.005056858062744141, -0.004081010818481445, -0.00310516357421875, -0.0021293163299560547, -0.0011534690856933594, -0.00017762184143066406, 0.0007982254028320312, 0.0017740726470947266, 0.002749919891357422, 0.003725767135620117, 0.0047016143798828125, 0.005677461624145508, 0.006653308868408203, 0.0076291561126708984, 0.008605003356933594, 0.009580850601196289, 0.010556697845458984, 0.01153254508972168, 0.012508392333984375, 0.01348423957824707, 0.014460086822509766, 0.015435934066772461, 0.016411781311035156, 0.01738762855529785, 0.018363475799560547, 0.019339323043823242, 0.020315170288085938, 0.021291017532348633, 0.022266864776611328, 0.023242712020874023, 0.02421855926513672, 0.025194406509399414, 0.02617025375366211, 0.027146100997924805, 0.0281219482421875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 6.0, 8.0, 13.0, 14.0, 20.0, 27.0, 39.0, 80.0, 97.0, 164.0, 340.0, 574.0, 1146.0, 2431.0, 5842.0, 15621.0, 51855.0, 274627.0, 3381587.0, 366278.0, 62975.0, 18111.0, 6748.0, 2790.0, 1290.0, 677.0, 376.0, 200.0, 118.0, 69.0, 42.0, 36.0, 24.0, 14.0, 8.0, 11.0, 8.0, 1.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1934814453125, -0.1867084503173828, -0.17993545532226562, -0.17316246032714844, -0.16638946533203125, -0.15961647033691406, -0.15284347534179688, -0.1460704803466797, -0.1392974853515625, -0.1325244903564453, -0.12575149536132812, -0.11897850036621094, -0.11220550537109375, -0.10543251037597656, -0.09865951538085938, -0.09188652038574219, -0.085113525390625, -0.07834053039550781, -0.07156753540039062, -0.06479454040527344, -0.05802154541015625, -0.05124855041503906, -0.044475555419921875, -0.03770256042480469, -0.0309295654296875, -0.024156570434570312, -0.017383575439453125, -0.010610580444335938, -0.00383758544921875, 0.0029354095458984375, 0.009708404541015625, 0.016481399536132812, 0.02325439453125, 0.030027389526367188, 0.036800384521484375, 0.04357337951660156, 0.05034637451171875, 0.05711936950683594, 0.06389236450195312, 0.07066535949707031, 0.0774383544921875, 0.08421134948730469, 0.09098434448242188, 0.09775733947753906, 0.10453033447265625, 0.11130332946777344, 0.11807632446289062, 0.12484931945800781, 0.131622314453125, 0.1383953094482422, 0.14516830444335938, 0.15194129943847656, 0.15871429443359375, 0.16548728942871094, 0.17226028442382812, 0.1790332794189453, 0.1858062744140625, 0.1925792694091797, 0.19935226440429688, 0.20612525939941406, 0.21289825439453125, 0.21967124938964844, 0.22644424438476562, 0.2332172393798828, 0.239990234375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 6.0, 2.0, 8.0, 9.0, 11.0, 22.0, 24.0, 30.0, 46.0, 62.0, 73.0, 129.0, 213.0, 359.0, 1373.0, 813.0, 299.0, 175.0, 133.0, 68.0, 44.0, 41.0, 24.0, 23.0, 11.0, 10.0, 5.0, 15.0, 8.0, 2.0, 6.0, 5.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.043365478515625, -0.04204750061035156, -0.040729522705078125, -0.03941154479980469, -0.03809356689453125, -0.03677558898925781, -0.035457611083984375, -0.03413963317871094, -0.0328216552734375, -0.03150367736816406, -0.030185699462890625, -0.028867721557617188, -0.02754974365234375, -0.026231765747070312, -0.024913787841796875, -0.023595809936523438, -0.02227783203125, -0.020959854125976562, -0.019641876220703125, -0.018323898315429688, -0.01700592041015625, -0.015687942504882812, -0.014369964599609375, -0.013051986694335938, -0.0117340087890625, -0.010416030883789062, -0.009098052978515625, -0.0077800750732421875, -0.00646209716796875, -0.0051441192626953125, -0.003826141357421875, -0.0025081634521484375, -0.001190185546875, 0.0001277923583984375, 0.001445770263671875, 0.0027637481689453125, 0.00408172607421875, 0.0053997039794921875, 0.006717681884765625, 0.008035659790039062, 0.0093536376953125, 0.010671615600585938, 0.011989593505859375, 0.013307571411132812, 0.01462554931640625, 0.015943527221679688, 0.017261505126953125, 0.018579483032226562, 0.0198974609375, 0.021215438842773438, 0.022533416748046875, 0.023851394653320312, 0.02516937255859375, 0.026487350463867188, 0.027805328369140625, 0.029123306274414062, 0.0304412841796875, 0.03175926208496094, 0.033077239990234375, 0.03439521789550781, 0.03571319580078125, 0.03703117370605469, 0.038349151611328125, 0.03966712951660156, 0.040985107421875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 10.0, 222.0, 709.0, 53.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.150829792022705, -2.1112453937530518, -2.0716609954833984, -2.032076597213745, -1.9924921989440918, -1.9529078006744385, -1.9133234024047852, -1.8737390041351318, -1.8341546058654785, -1.7945702075958252, -1.7549858093261719, -1.7154014110565186, -1.6758170127868652, -1.636232614517212, -1.5966482162475586, -1.5570638179779053, -1.517479419708252, -1.4778950214385986, -1.4383106231689453, -1.398726224899292, -1.3591418266296387, -1.3195574283599854, -1.279973030090332, -1.2403886318206787, -1.2008042335510254, -1.161219835281372, -1.1216354370117188, -1.0820510387420654, -1.042466640472412, -1.0028822422027588, -0.9632978439331055, -0.9237134456634521, -0.8841291666030884, -0.8445447683334351, -0.8049603700637817, -0.7653759717941284, -0.7257915735244751, -0.6862071752548218, -0.6466227769851685, -0.6070383787155151, -0.5674539804458618, -0.5278695821762085, -0.4882851839065552, -0.44870078563690186, -0.40911638736724854, -0.3695319890975952, -0.3299475908279419, -0.2903631925582886, -0.25077876448631287, -0.21119436621665955, -0.17160996794700623, -0.1320255696773529, -0.09244117140769958, -0.052856773138046265, -0.013272374868392944, 0.026312023401260376, 0.0658964216709137, 0.10548081994056702, 0.14506521821022034, 0.18464961647987366, 0.22423401474952698, 0.2638184130191803, 0.3034028112888336, 0.34298720955848694, 0.38257160782814026]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 0.0, 4.0, 6.0, 8.0, 2.0, 4.0, 15.0, 24.0, 29.0, 33.0, 34.0, 50.0, 57.0, 59.0, 79.0, 79.0, 83.0, 79.0, 62.0, 55.0, 51.0, 55.0, 38.0, 25.0, 18.0, 17.0, 11.0, 10.0, 8.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2359585165977478, -0.22905640304088593, -0.22215430438518524, -0.21525219082832336, -0.20835009217262268, -0.2014479786157608, -0.19454586505889893, -0.18764376640319824, -0.18074166774749756, -0.17383955419063568, -0.166937455534935, -0.16003534197807312, -0.15313324332237244, -0.14623112976551056, -0.13932901620864868, -0.132426917552948, -0.12552480399608612, -0.11862269788980484, -0.11172059178352356, -0.10481847822666168, -0.097916379570961, -0.09101426601409912, -0.08411215990781784, -0.07721005380153656, -0.07030794769525528, -0.063405841588974, -0.05650373548269272, -0.04960162565112114, -0.04269951954483986, -0.03579741343855858, -0.028895303606987, -0.02199319750070572, -0.015091091394424438, -0.008188984356820583, -0.0012868773192167282, 0.0056152306497097015, 0.012517336755990982, 0.019419442862272263, 0.02632155269384384, 0.03322365880012512, 0.0401257649064064, 0.04702787101268768, 0.053929977118968964, 0.06083208695054054, 0.06773419678211212, 0.0746362954378128, 0.08153840899467468, 0.08844051510095596, 0.09534262120723724, 0.10224472731351852, 0.1091468334197998, 0.11604894697666168, 0.12295104563236237, 0.12985315918922424, 0.13675525784492493, 0.1436573714017868, 0.15055948495864868, 0.15746159851551056, 0.16436369717121124, 0.17126581072807312, 0.1781679093837738, 0.18507002294063568, 0.19197213649749756, 0.19887423515319824, 0.20577633380889893]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 2.0, 2.0, 5.0, 10.0, 15.0, 23.0, 36.0, 73.0, 77.0, 123.0, 198.0, 355.0, 625.0, 1104.0, 2329.0, 5389.0, 13717.0, 42924.0, 212370.0, 655559.0, 77179.0, 21786.0, 7893.0, 3285.0, 1541.0, 809.0, 432.0, 255.0, 171.0, 89.0, 59.0, 33.0, 29.0, 14.0, 12.0, 9.0, 8.0, 8.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.269775390625, -0.2616539001464844, -0.25353240966796875, -0.24541091918945312, -0.2372894287109375, -0.22916793823242188, -0.22104644775390625, -0.21292495727539062, -0.204803466796875, -0.19668197631835938, -0.18856048583984375, -0.18043899536132812, -0.1723175048828125, -0.16419601440429688, -0.15607452392578125, -0.14795303344726562, -0.13983154296875, -0.13171005249023438, -0.12358856201171875, -0.11546707153320312, -0.1073455810546875, -0.09922409057617188, -0.09110260009765625, -0.08298110961914062, -0.074859619140625, -0.06673812866210938, -0.05861663818359375, -0.050495147705078125, -0.0423736572265625, -0.034252166748046875, -0.02613067626953125, -0.018009185791015625, -0.0098876953125, -0.001766204833984375, 0.00635528564453125, 0.014476776123046875, 0.0225982666015625, 0.030719757080078125, 0.03884124755859375, 0.046962738037109375, 0.055084228515625, 0.06320571899414062, 0.07132720947265625, 0.07944869995117188, 0.0875701904296875, 0.09569168090820312, 0.10381317138671875, 0.11193466186523438, 0.12005615234375, 0.12817764282226562, 0.13629913330078125, 0.14442062377929688, 0.1525421142578125, 0.16066360473632812, 0.16878509521484375, 0.17690658569335938, 0.185028076171875, 0.19314956665039062, 0.20127105712890625, 0.20939254760742188, 0.2175140380859375, 0.22563552856445312, 0.23375701904296875, 0.24187850952148438, 0.25]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 6.0, 1.0, 4.0, 4.0, 6.0, 8.0, 12.0, 12.0, 12.0, 27.0, 19.0, 19.0, 35.0, 39.0, 73.0, 157.0, 174.0, 97.0, 76.0, 43.0, 24.0, 19.0, 26.0, 23.0, 10.0, 17.0, 13.0, 9.0, 9.0, 5.0, 8.0, 5.0, 7.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03857421875, -0.037457942962646484, -0.03634166717529297, -0.03522539138793945, -0.03410911560058594, -0.03299283981323242, -0.031876564025878906, -0.03076028823852539, -0.029644012451171875, -0.02852773666381836, -0.027411460876464844, -0.026295185089111328, -0.025178909301757812, -0.024062633514404297, -0.02294635772705078, -0.021830081939697266, -0.02071380615234375, -0.019597530364990234, -0.01848125457763672, -0.017364978790283203, -0.016248703002929688, -0.015132427215576172, -0.014016151428222656, -0.01289987564086914, -0.011783599853515625, -0.01066732406616211, -0.009551048278808594, -0.008434772491455078, -0.0073184967041015625, -0.006202220916748047, -0.005085945129394531, -0.003969669342041016, -0.0028533935546875, -0.0017371177673339844, -0.0006208419799804688, 0.0004954338073730469, 0.0016117095947265625, 0.002727985382080078, 0.0038442611694335938, 0.004960536956787109, 0.006076812744140625, 0.007193088531494141, 0.008309364318847656, 0.009425640106201172, 0.010541915893554688, 0.011658191680908203, 0.012774467468261719, 0.013890743255615234, 0.01500701904296875, 0.016123294830322266, 0.01723957061767578, 0.018355846405029297, 0.019472122192382812, 0.020588397979736328, 0.021704673767089844, 0.02282094955444336, 0.023937225341796875, 0.02505350112915039, 0.026169776916503906, 0.027286052703857422, 0.028402328491210938, 0.029518604278564453, 0.03063488006591797, 0.031751155853271484, 0.032867431640625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 9.0, 13.0, 45.0, 73.0, 230.0, 1343.0, 49408.0, 988399.0, 8194.0, 587.0, 147.0, 48.0, 20.0, 8.0, 4.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.468017578125, -0.4479408264160156, -0.42786407470703125, -0.4077873229980469, -0.3877105712890625, -0.3676338195800781, -0.34755706787109375, -0.3274803161621094, -0.307403564453125, -0.2873268127441406, -0.26725006103515625, -0.24717330932617188, -0.2270965576171875, -0.20701980590820312, -0.18694305419921875, -0.16686630249023438, -0.14678955078125, -0.12671279907226562, -0.10663604736328125, -0.08655929565429688, -0.0664825439453125, -0.046405792236328125, -0.02632904052734375, -0.006252288818359375, 0.013824462890625, 0.033901214599609375, 0.05397796630859375, 0.07405471801757812, 0.0941314697265625, 0.11420822143554688, 0.13428497314453125, 0.15436172485351562, 0.1744384765625, 0.19451522827148438, 0.21459197998046875, 0.23466873168945312, 0.2547454833984375, 0.2748222351074219, 0.29489898681640625, 0.3149757385253906, 0.335052490234375, 0.3551292419433594, 0.37520599365234375, 0.3952827453613281, 0.4153594970703125, 0.4354362487792969, 0.45551300048828125, 0.4755897521972656, 0.49566650390625, 0.5157432556152344, 0.5358200073242188, 0.5558967590332031, 0.5759735107421875, 0.5960502624511719, 0.6161270141601562, 0.6362037658691406, 0.656280517578125, 0.6763572692871094, 0.6964340209960938, 0.7165107727050781, 0.7365875244140625, 0.7566642761230469, 0.7767410278320312, 0.7968177795410156, 0.81689453125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 6.0, 8.0, 10.0, 5.0, 9.0, 18.0, 17.0, 38.0, 23.0, 26.0, 38.0, 46.0, 42.0, 38.0, 56.0, 51.0, 57.0, 61.0, 54.0, 57.0, 38.0, 44.0, 37.0, 38.0, 38.0, 34.0, 25.0, 20.0, 22.0, 15.0, 10.0, 1.0, 7.0, 6.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.130615234375, -0.12667560577392578, -0.12273597717285156, -0.11879634857177734, -0.11485671997070312, -0.1109170913696289, -0.10697746276855469, -0.10303783416748047, -0.09909820556640625, -0.09515857696533203, -0.09121894836425781, -0.0872793197631836, -0.08333969116210938, -0.07940006256103516, -0.07546043395996094, -0.07152080535888672, -0.0675811767578125, -0.06364154815673828, -0.05970191955566406, -0.055762290954589844, -0.051822662353515625, -0.047883033752441406, -0.04394340515136719, -0.04000377655029297, -0.03606414794921875, -0.03212451934814453, -0.028184890747070312, -0.024245262145996094, -0.020305633544921875, -0.016366004943847656, -0.012426376342773438, -0.008486747741699219, -0.004547119140625, -0.0006074905395507812, 0.0033321380615234375, 0.007271766662597656, 0.011211395263671875, 0.015151023864746094, 0.019090652465820312, 0.02303028106689453, 0.02696990966796875, 0.03090953826904297, 0.03484916687011719, 0.038788795471191406, 0.042728424072265625, 0.046668052673339844, 0.05060768127441406, 0.05454730987548828, 0.0584869384765625, 0.06242656707763672, 0.06636619567871094, 0.07030582427978516, 0.07424545288085938, 0.0781850814819336, 0.08212471008300781, 0.08606433868408203, 0.09000396728515625, 0.09394359588623047, 0.09788322448730469, 0.1018228530883789, 0.10576248168945312, 0.10970211029052734, 0.11364173889160156, 0.11758136749267578, 0.12152099609375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 7.0, 1.0, 3.0, 9.0, 2.0, 12.0, 19.0, 27.0, 44.0, 140.0, 388.0, 1691.0, 13488.0, 638405.0, 383067.0, 9402.0, 1309.0, 325.0, 119.0, 34.0, 24.0, 13.0, 11.0, 6.0, 2.0, 0.0, 2.0, 4.0, 2.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2939453125, -0.28598594665527344, -0.2780265808105469, -0.2700672149658203, -0.26210784912109375, -0.2541484832763672, -0.24618911743164062, -0.23822975158691406, -0.2302703857421875, -0.22231101989746094, -0.21435165405273438, -0.2063922882080078, -0.19843292236328125, -0.1904735565185547, -0.18251419067382812, -0.17455482482910156, -0.166595458984375, -0.15863609313964844, -0.15067672729492188, -0.1427173614501953, -0.13475799560546875, -0.1267986297607422, -0.11883926391601562, -0.11087989807128906, -0.1029205322265625, -0.09496116638183594, -0.08700180053710938, -0.07904243469238281, -0.07108306884765625, -0.06312370300292969, -0.055164337158203125, -0.04720497131347656, -0.03924560546875, -0.03128623962402344, -0.023326873779296875, -0.015367507934570312, -0.00740814208984375, 0.0005512237548828125, 0.008510589599609375, 0.016469955444335938, 0.0244293212890625, 0.03238868713378906, 0.040348052978515625, 0.04830741882324219, 0.05626678466796875, 0.06422615051269531, 0.07218551635742188, 0.08014488220214844, 0.088104248046875, 0.09606361389160156, 0.10402297973632812, 0.11198234558105469, 0.11994171142578125, 0.1279010772705078, 0.13586044311523438, 0.14381980895996094, 0.1517791748046875, 0.15973854064941406, 0.16769790649414062, 0.1756572723388672, 0.18361663818359375, 0.1915760040283203, 0.19953536987304688, 0.20749473571777344, 0.2154541015625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 3.0, 4.0, 2.0, 5.0, 8.0, 3.0, 1.0, 5.0, 10.0, 12.0, 13.0, 12.0, 23.0, 24.0, 62.0, 93.0, 128.0, 158.0, 153.0, 96.0, 49.0, 41.0, 27.0, 10.0, 15.0, 6.0, 10.0, 6.0, 10.0, 3.0, 5.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.167194366455078e-05, -8.834246546030045e-05, -8.501298725605011e-05, -8.168350905179977e-05, -7.835403084754944e-05, -7.50245526432991e-05, -7.169507443904877e-05, -6.836559623479843e-05, -6.50361180305481e-05, -6.170663982629776e-05, -5.8377161622047424e-05, -5.504768341779709e-05, -5.171820521354675e-05, -4.838872700929642e-05, -4.505924880504608e-05, -4.1729770600795746e-05, -3.840029239654541e-05, -3.5070814192295074e-05, -3.174133598804474e-05, -2.8411857783794403e-05, -2.5082379579544067e-05, -2.175290137529373e-05, -1.8423423171043396e-05, -1.509394496679306e-05, -1.1764466762542725e-05, -8.434988558292389e-06, -5.105510354042053e-06, -1.7760321497917175e-06, 1.5534460544586182e-06, 4.882924258708954e-06, 8.21240246295929e-06, 1.1541880667209625e-05, 1.4871358871459961e-05, 1.8200837075710297e-05, 2.1530315279960632e-05, 2.4859793484210968e-05, 2.8189271688461304e-05, 3.151874989271164e-05, 3.4848228096961975e-05, 3.817770630121231e-05, 4.1507184505462646e-05, 4.483666270971298e-05, 4.816614091396332e-05, 5.1495619118213654e-05, 5.482509732246399e-05, 5.8154575526714325e-05, 6.148405373096466e-05, 6.4813531935215e-05, 6.814301013946533e-05, 7.147248834371567e-05, 7.4801966547966e-05, 7.813144475221634e-05, 8.146092295646667e-05, 8.479040116071701e-05, 8.811987936496735e-05, 9.144935756921768e-05, 9.477883577346802e-05, 9.810831397771835e-05, 0.00010143779218196869, 0.00010476727038621902, 0.00010809674859046936, 0.0001114262267947197, 0.00011475570499897003, 0.00011808518320322037, 0.0001214146614074707]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 4.0, 4.0, 6.0, 9.0, 11.0, 12.0, 20.0, 26.0, 49.0, 76.0, 152.0, 234.0, 475.0, 1036.0, 2361.0, 5845.0, 17071.0, 64548.0, 331375.0, 479752.0, 106848.0, 24988.0, 8118.0, 2961.0, 1260.0, 590.0, 308.0, 154.0, 78.0, 67.0, 48.0, 25.0, 12.0, 9.0, 9.0, 3.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.10113525390625, -0.09808540344238281, -0.09503555297851562, -0.09198570251464844, -0.08893585205078125, -0.08588600158691406, -0.08283615112304688, -0.07978630065917969, -0.0767364501953125, -0.07368659973144531, -0.07063674926757812, -0.06758689880371094, -0.06453704833984375, -0.06148719787597656, -0.058437347412109375, -0.05538749694824219, -0.052337646484375, -0.04928779602050781, -0.046237945556640625, -0.04318809509277344, -0.04013824462890625, -0.03708839416503906, -0.034038543701171875, -0.030988693237304688, -0.0279388427734375, -0.024888992309570312, -0.021839141845703125, -0.018789291381835938, -0.01573944091796875, -0.012689590454101562, -0.009639739990234375, -0.0065898895263671875, -0.0035400390625, -0.0004901885986328125, 0.002559661865234375, 0.0056095123291015625, 0.00865936279296875, 0.011709213256835938, 0.014759063720703125, 0.017808914184570312, 0.0208587646484375, 0.023908615112304688, 0.026958465576171875, 0.030008316040039062, 0.03305816650390625, 0.03610801696777344, 0.039157867431640625, 0.04220771789550781, 0.045257568359375, 0.04830741882324219, 0.051357269287109375, 0.05440711975097656, 0.05745697021484375, 0.06050682067871094, 0.06355667114257812, 0.06660652160644531, 0.0696563720703125, 0.07270622253417969, 0.07575607299804688, 0.07880592346191406, 0.08185577392578125, 0.08490562438964844, 0.08795547485351562, 0.09100532531738281, 0.09405517578125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 8.0, 6.0, 2.0, 2.0, 5.0, 7.0, 11.0, 19.0, 26.0, 26.0, 32.0, 29.0, 43.0, 62.0, 69.0, 72.0, 108.0, 78.0, 59.0, 68.0, 64.0, 55.0, 29.0, 27.0, 27.0, 10.0, 17.0, 11.0, 6.0, 8.0, 5.0, 4.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06451416015625, -0.062491416931152344, -0.06046867370605469, -0.05844593048095703, -0.056423187255859375, -0.05440044403076172, -0.05237770080566406, -0.050354957580566406, -0.04833221435546875, -0.046309471130371094, -0.04428672790527344, -0.04226398468017578, -0.040241241455078125, -0.03821849822998047, -0.03619575500488281, -0.034173011779785156, -0.0321502685546875, -0.030127525329589844, -0.028104782104492188, -0.02608203887939453, -0.024059295654296875, -0.02203655242919922, -0.020013809204101562, -0.017991065979003906, -0.01596832275390625, -0.013945579528808594, -0.011922836303710938, -0.009900093078613281, -0.007877349853515625, -0.005854606628417969, -0.0038318634033203125, -0.0018091201782226562, 0.000213623046875, 0.0022363662719726562, 0.0042591094970703125, 0.006281852722167969, 0.008304595947265625, 0.010327339172363281, 0.012350082397460938, 0.014372825622558594, 0.01639556884765625, 0.018418312072753906, 0.020441055297851562, 0.02246379852294922, 0.024486541748046875, 0.02650928497314453, 0.028532028198242188, 0.030554771423339844, 0.0325775146484375, 0.034600257873535156, 0.03662300109863281, 0.03864574432373047, 0.040668487548828125, 0.04269123077392578, 0.04471397399902344, 0.046736717224121094, 0.04875946044921875, 0.050782203674316406, 0.05280494689941406, 0.05482769012451172, 0.056850433349609375, 0.05887317657470703, 0.06089591979980469, 0.06291866302490234, 0.06494140625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 28.0, 101.0, 500.0, 321.0, 33.0, 8.0, 8.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7726354598999023, -1.6914583444595337, -1.610281229019165, -1.529104232788086, -1.4479271173477173, -1.3667500019073486, -1.2855730056762695, -1.2043958902359009, -1.1232187747955322, -1.0420416593551636, -0.9608646035194397, -0.8796875476837158, -0.7985104322433472, -0.7173333168029785, -0.6361562609672546, -0.5549792051315308, -0.4738020896911621, -0.39262500405311584, -0.3114479184150696, -0.23027083277702332, -0.14909374713897705, -0.06791666150093079, 0.013260424137115479, 0.09443747997283936, 0.175614595413208, 0.2567916810512543, 0.33796876668930054, 0.4191458523273468, 0.5003229379653931, 0.5815000534057617, 0.6626771092414856, 0.7438541650772095, 0.825031042098999, 0.9062081575393677, 0.9873852133750916, 1.0685622692108154, 1.149739384651184, 1.2309165000915527, 1.3120934963226318, 1.3932706117630005, 1.4744477272033691, 1.5556248426437378, 1.6368019580841064, 1.7179789543151855, 1.7991560697555542, 1.8803331851959229, 1.961510181427002, 2.04268741607666, 2.1238644123077393, 2.2050414085388184, 2.2862186431884766, 2.3673956394195557, 2.4485726356506348, 2.529749870300293, 2.610926866531372, 2.692103862762451, 2.7732810974121094, 2.8544580936431885, 2.9356353282928467, 3.016812324523926, 3.097989559173584, 3.179166555404663, 3.260343551635742, 3.3415207862854004, 3.4226977825164795]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 5.0, 3.0, 5.0, 7.0, 9.0, 12.0, 24.0, 24.0, 28.0, 34.0, 40.0, 51.0, 66.0, 92.0, 72.0, 82.0, 91.0, 56.0, 71.0, 44.0, 46.0, 34.0, 24.0, 22.0, 17.0, 9.0, 9.0, 1.0, 8.0, 4.0, 4.0, 3.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4258710145950317, -1.3880832195281982, -1.3502955436706543, -1.3125077486038208, -1.2747199535369873, -1.2369321584701538, -1.1991443634033203, -1.1613566875457764, -1.1235688924789429, -1.0857810974121094, -1.0479934215545654, -1.010205626487732, -0.9724178314208984, -0.9346300363540649, -0.8968423008918762, -0.8590545654296875, -0.821266770362854, -0.7834789752960205, -0.7456912398338318, -0.7079035043716431, -0.6701157093048096, -0.6323279142379761, -0.5945401787757874, -0.5567524433135986, -0.5189646482467651, -0.48117688298225403, -0.4433891177177429, -0.4056013524532318, -0.3678135871887207, -0.3300258219242096, -0.2922380566596985, -0.2544502913951874, -0.2166624665260315, -0.17887470126152039, -0.14108693599700928, -0.10329917073249817, -0.06551140546798706, -0.027723640203475952, 0.010064125061035156, 0.047851890325546265, 0.08563965559005737, 0.12342742085456848, 0.1612151861190796, 0.1990029513835907, 0.2367907166481018, 0.2745784819126129, 0.312366247177124, 0.35015401244163513, 0.38794177770614624, 0.42572954297065735, 0.46351730823516846, 0.501305103302002, 0.5390928387641907, 0.5768805742263794, 0.6146683692932129, 0.6524561643600464, 0.6902438998222351, 0.7280316352844238, 0.7658194303512573, 0.8036072254180908, 0.8413949608802795, 0.8791826963424683, 0.9169704914093018, 0.9547582864761353, 0.992546021938324]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 8.0, 9.0, 15.0, 31.0, 42.0, 51.0, 96.0, 124.0, 228.0, 398.0, 667.0, 1121.0, 1875.0, 3510.0, 7814.0, 23668.0, 183661.0, 3860688.0, 79647.0, 16573.0, 6373.0, 3193.0, 1764.0, 1059.0, 631.0, 391.0, 244.0, 130.0, 93.0, 55.0, 34.0, 33.0, 19.0, 10.0, 10.0, 6.0, 6.0, 6.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.400634765625, -0.3865013122558594, -0.37236785888671875, -0.3582344055175781, -0.3441009521484375, -0.3299674987792969, -0.31583404541015625, -0.3017005920410156, -0.287567138671875, -0.2734336853027344, -0.25930023193359375, -0.24516677856445312, -0.2310333251953125, -0.21689987182617188, -0.20276641845703125, -0.18863296508789062, -0.17449951171875, -0.16036605834960938, -0.14623260498046875, -0.13209915161132812, -0.1179656982421875, -0.10383224487304688, -0.08969879150390625, -0.07556533813476562, -0.061431884765625, -0.047298431396484375, -0.03316497802734375, -0.019031524658203125, -0.0048980712890625, 0.009235382080078125, 0.02336883544921875, 0.037502288818359375, 0.0516357421875, 0.06576919555664062, 0.07990264892578125, 0.09403610229492188, 0.1081695556640625, 0.12230300903320312, 0.13643646240234375, 0.15056991577148438, 0.164703369140625, 0.17883682250976562, 0.19297027587890625, 0.20710372924804688, 0.2212371826171875, 0.23537063598632812, 0.24950408935546875, 0.2636375427246094, 0.27777099609375, 0.2919044494628906, 0.30603790283203125, 0.3201713562011719, 0.3343048095703125, 0.3484382629394531, 0.36257171630859375, 0.3767051696777344, 0.390838623046875, 0.4049720764160156, 0.41910552978515625, 0.4332389831542969, 0.4473724365234375, 0.4615058898925781, 0.47563934326171875, 0.4897727966308594, 0.50390625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 6.0, 6.0, 3.0, 6.0, 4.0, 6.0, 11.0, 9.0, 16.0, 14.0, 17.0, 22.0, 20.0, 30.0, 38.0, 86.0, 113.0, 140.0, 103.0, 74.0, 53.0, 42.0, 31.0, 33.0, 21.0, 18.0, 22.0, 12.0, 10.0, 14.0, 2.0, 4.0, 8.0, 3.0, 3.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0364990234375, -0.035454511642456055, -0.03440999984741211, -0.033365488052368164, -0.03232097625732422, -0.03127646446228027, -0.030231952667236328, -0.029187440872192383, -0.028142929077148438, -0.027098417282104492, -0.026053905487060547, -0.0250093936920166, -0.023964881896972656, -0.02292037010192871, -0.021875858306884766, -0.02083134651184082, -0.019786834716796875, -0.01874232292175293, -0.017697811126708984, -0.01665329933166504, -0.015608787536621094, -0.014564275741577148, -0.013519763946533203, -0.012475252151489258, -0.011430740356445312, -0.010386228561401367, -0.009341716766357422, -0.008297204971313477, -0.007252693176269531, -0.006208181381225586, -0.005163669586181641, -0.004119157791137695, -0.00307464599609375, -0.0020301342010498047, -0.0009856224060058594, 5.888938903808594e-05, 0.0011034011840820312, 0.0021479129791259766, 0.003192424774169922, 0.004236936569213867, 0.0052814483642578125, 0.006325960159301758, 0.007370471954345703, 0.008414983749389648, 0.009459495544433594, 0.010504007339477539, 0.011548519134521484, 0.01259303092956543, 0.013637542724609375, 0.01468205451965332, 0.015726566314697266, 0.01677107810974121, 0.017815589904785156, 0.0188601016998291, 0.019904613494873047, 0.020949125289916992, 0.021993637084960938, 0.023038148880004883, 0.024082660675048828, 0.025127172470092773, 0.02617168426513672, 0.027216196060180664, 0.02826070785522461, 0.029305219650268555, 0.0303497314453125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 8.0, 5.0, 17.0, 17.0, 33.0, 43.0, 81.0, 171.0, 444.0, 1149.0, 3862.0, 13942.0, 80055.0, 3413584.0, 626739.0, 41163.0, 9015.0, 2511.0, 820.0, 290.0, 131.0, 73.0, 43.0, 29.0, 21.0, 11.0, 8.0, 6.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.391845703125, -0.3787117004394531, -0.36557769775390625, -0.3524436950683594, -0.3393096923828125, -0.3261756896972656, -0.31304168701171875, -0.2999076843261719, -0.286773681640625, -0.2736396789550781, -0.26050567626953125, -0.24737167358398438, -0.2342376708984375, -0.22110366821289062, -0.20796966552734375, -0.19483566284179688, -0.18170166015625, -0.16856765747070312, -0.15543365478515625, -0.14229965209960938, -0.1291656494140625, -0.11603164672851562, -0.10289764404296875, -0.08976364135742188, -0.076629638671875, -0.06349563598632812, -0.05036163330078125, -0.037227630615234375, -0.0240936279296875, -0.010959625244140625, 0.00217437744140625, 0.015308380126953125, 0.0284423828125, 0.041576385498046875, 0.05471038818359375, 0.06784439086914062, 0.0809783935546875, 0.09411239624023438, 0.10724639892578125, 0.12038040161132812, 0.133514404296875, 0.14664840698242188, 0.15978240966796875, 0.17291641235351562, 0.1860504150390625, 0.19918441772460938, 0.21231842041015625, 0.22545242309570312, 0.23858642578125, 0.2517204284667969, 0.26485443115234375, 0.2779884338378906, 0.2911224365234375, 0.3042564392089844, 0.31739044189453125, 0.3305244445800781, 0.343658447265625, 0.3567924499511719, 0.36992645263671875, 0.3830604553222656, 0.3961944580078125, 0.4093284606933594, 0.42246246337890625, 0.4355964660644531, 0.44873046875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 3.0, 6.0, 9.0, 6.0, 14.0, 22.0, 35.0, 53.0, 75.0, 135.0, 270.0, 515.0, 1781.0, 506.0, 228.0, 135.0, 80.0, 67.0, 36.0, 19.0, 14.0, 12.0, 10.0, 5.0, 5.0, 5.0, 6.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.075439453125, -0.07357549667358398, -0.07171154022216797, -0.06984758377075195, -0.06798362731933594, -0.06611967086791992, -0.0642557144165039, -0.06239175796508789, -0.060527801513671875, -0.05866384506225586, -0.056799888610839844, -0.05493593215942383, -0.05307197570800781, -0.0512080192565918, -0.04934406280517578, -0.047480106353759766, -0.04561614990234375, -0.043752193450927734, -0.04188823699951172, -0.0400242805480957, -0.03816032409667969, -0.03629636764526367, -0.034432411193847656, -0.03256845474243164, -0.030704498291015625, -0.02884054183959961, -0.026976585388183594, -0.025112628936767578, -0.023248672485351562, -0.021384716033935547, -0.01952075958251953, -0.017656803131103516, -0.0157928466796875, -0.013928890228271484, -0.012064933776855469, -0.010200977325439453, -0.008337020874023438, -0.006473064422607422, -0.004609107971191406, -0.0027451515197753906, -0.000881195068359375, 0.0009827613830566406, 0.0028467178344726562, 0.004710674285888672, 0.0065746307373046875, 0.008438587188720703, 0.010302543640136719, 0.012166500091552734, 0.01403045654296875, 0.015894412994384766, 0.01775836944580078, 0.019622325897216797, 0.021486282348632812, 0.023350238800048828, 0.025214195251464844, 0.02707815170288086, 0.028942108154296875, 0.03080606460571289, 0.032670021057128906, 0.03453397750854492, 0.03639793395996094, 0.03826189041137695, 0.04012584686279297, 0.041989803314208984, 0.043853759765625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 8.0, 35.0, 186.0, 455.0, 262.0, 46.0, 10.0, 6.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.4559972286224365, -1.4298144578933716, -1.4036316871643066, -1.3774490356445312, -1.3512662649154663, -1.3250834941864014, -1.298900842666626, -1.272718071937561, -1.246535301208496, -1.2203525304794312, -1.1941697597503662, -1.1679871082305908, -1.1418043375015259, -1.115621566772461, -1.0894389152526855, -1.0632561445236206, -1.0370733737945557, -1.0108906030654907, -0.9847078919410706, -0.9585251808166504, -0.9323424100875854, -0.9061596393585205, -0.8799769282341003, -0.8537942171096802, -0.8276114463806152, -0.8014286756515503, -0.7752459645271301, -0.74906325340271, -0.722880482673645, -0.6966977119445801, -0.6705150008201599, -0.6443322896957397, -0.6181495785713196, -0.5919668674468994, -0.5657840967178345, -0.5396013259887695, -0.5134186148643494, -0.4872358739376068, -0.46105313301086426, -0.4348703920841217, -0.40868765115737915, -0.3825049102306366, -0.35632216930389404, -0.3301394283771515, -0.30395668745040894, -0.2777739465236664, -0.25159120559692383, -0.22540846467018127, -0.19922572374343872, -0.17304298281669617, -0.1468602418899536, -0.12067750096321106, -0.0944947600364685, -0.06831201910972595, -0.0421292781829834, -0.015946537256240845, 0.010236203670501709, 0.03641894459724426, 0.06260168552398682, 0.08878442645072937, 0.11496716737747192, 0.14114990830421448, 0.16733264923095703, 0.19351539015769958, 0.21969813108444214]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 6.0, 4.0, 1.0, 6.0, 6.0, 15.0, 11.0, 21.0, 22.0, 28.0, 39.0, 36.0, 41.0, 50.0, 55.0, 65.0, 67.0, 59.0, 52.0, 63.0, 56.0, 42.0, 36.0, 43.0, 26.0, 35.0, 24.0, 27.0, 14.0, 14.0, 9.0, 9.0, 7.0, 2.0, 5.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.25167882442474365, -0.24537360668182373, -0.2390683889389038, -0.2327631562948227, -0.22645793855190277, -0.22015272080898285, -0.21384748816490173, -0.2075422704219818, -0.2012370526790619, -0.19493183493614197, -0.18862661719322205, -0.18232138454914093, -0.176016166806221, -0.1697109490633011, -0.16340571641921997, -0.15710049867630005, -0.15079528093338013, -0.1444900631904602, -0.13818484544754028, -0.13187961280345917, -0.12557439506053925, -0.11926917731761932, -0.1129639521241188, -0.10665872693061829, -0.10035350918769836, -0.09404829144477844, -0.08774306625127792, -0.0814378410577774, -0.07513262331485748, -0.06882740557193756, -0.06252218037843704, -0.05621695891022682, -0.0499117374420166, -0.04360651597380638, -0.03730129450559616, -0.03099607303738594, -0.02469085156917572, -0.0183856301009655, -0.01208040863275528, -0.005775187164545059, 0.0005300343036651611, 0.0068352557718753815, 0.013140477240085602, 0.019445698708295822, 0.025750920176506042, 0.03205614164471626, 0.03836136311292648, 0.044666584581136703, 0.050971806049346924, 0.057277027517557144, 0.06358224898576736, 0.06988747417926788, 0.0761926919221878, 0.08249790966510773, 0.08880313485860825, 0.09510836005210876, 0.10141357779502869, 0.10771879553794861, 0.11402402073144913, 0.12032924592494965, 0.12663446366786957, 0.1329396814107895, 0.1392449140548706, 0.14555013179779053, 0.15185534954071045]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 5.0, 4.0, 3.0, 10.0, 13.0, 22.0, 31.0, 45.0, 56.0, 69.0, 114.0, 187.0, 350.0, 564.0, 1033.0, 1921.0, 3755.0, 8068.0, 18293.0, 45053.0, 145047.0, 538826.0, 190676.0, 54544.0, 21123.0, 9347.0, 4359.0, 2256.0, 1139.0, 629.0, 386.0, 204.0, 152.0, 94.0, 59.0, 33.0, 21.0, 20.0, 17.0, 9.0, 5.0, 6.0, 1.0, 2.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.263916015625, -0.25628662109375, -0.2486572265625, -0.24102783203125, -0.2333984375, -0.22576904296875, -0.2181396484375, -0.21051025390625, -0.202880859375, -0.19525146484375, -0.1876220703125, -0.17999267578125, -0.17236328125, -0.16473388671875, -0.1571044921875, -0.14947509765625, -0.141845703125, -0.13421630859375, -0.1265869140625, -0.11895751953125, -0.111328125, -0.10369873046875, -0.0960693359375, -0.08843994140625, -0.080810546875, -0.07318115234375, -0.0655517578125, -0.05792236328125, -0.05029296875, -0.04266357421875, -0.0350341796875, -0.02740478515625, -0.019775390625, -0.01214599609375, -0.0045166015625, 0.00311279296875, 0.0107421875, 0.01837158203125, 0.0260009765625, 0.03363037109375, 0.041259765625, 0.04888916015625, 0.0565185546875, 0.06414794921875, 0.07177734375, 0.07940673828125, 0.0870361328125, 0.09466552734375, 0.102294921875, 0.10992431640625, 0.1175537109375, 0.12518310546875, 0.1328125, 0.14044189453125, 0.1480712890625, 0.15570068359375, 0.163330078125, 0.17095947265625, 0.1785888671875, 0.18621826171875, 0.19384765625, 0.20147705078125, 0.2091064453125, 0.21673583984375, 0.224365234375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 2.0, 3.0, 2.0, 6.0, 6.0, 9.0, 12.0, 17.0, 16.0, 30.0, 24.0, 36.0, 55.0, 74.0, 102.0, 148.0, 87.0, 81.0, 72.0, 42.0, 32.0, 24.0, 18.0, 15.0, 27.0, 16.0, 7.0, 8.0, 8.0, 8.0, 2.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.035491943359375, -0.03441476821899414, -0.03333759307861328, -0.03226041793823242, -0.031183242797851562, -0.030106067657470703, -0.029028892517089844, -0.027951717376708984, -0.026874542236328125, -0.025797367095947266, -0.024720191955566406, -0.023643016815185547, -0.022565841674804688, -0.021488666534423828, -0.02041149139404297, -0.01933431625366211, -0.01825714111328125, -0.01717996597290039, -0.01610279083251953, -0.015025615692138672, -0.013948440551757812, -0.012871265411376953, -0.011794090270996094, -0.010716915130615234, -0.009639739990234375, -0.008562564849853516, -0.007485389709472656, -0.006408214569091797, -0.0053310394287109375, -0.004253864288330078, -0.0031766891479492188, -0.0020995140075683594, -0.0010223388671875, 5.4836273193359375e-05, 0.0011320114135742188, 0.002209186553955078, 0.0032863616943359375, 0.004363536834716797, 0.005440711975097656, 0.006517887115478516, 0.007595062255859375, 0.008672237396240234, 0.009749412536621094, 0.010826587677001953, 0.011903762817382812, 0.012980937957763672, 0.014058113098144531, 0.01513528823852539, 0.01621246337890625, 0.01728963851928711, 0.01836681365966797, 0.019443988800048828, 0.020521163940429688, 0.021598339080810547, 0.022675514221191406, 0.023752689361572266, 0.024829864501953125, 0.025907039642333984, 0.026984214782714844, 0.028061389923095703, 0.029138565063476562, 0.030215740203857422, 0.03129291534423828, 0.03237009048461914, 0.033447265625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 9.0, 12.0, 19.0, 15.0, 26.0, 43.0, 49.0, 69.0, 81.0, 113.0, 159.0, 196.0, 258.0, 417.0, 612.0, 846.0, 1582.0, 3490.0, 9197.0, 33126.0, 137628.0, 444916.0, 309023.0, 75267.0, 19141.0, 5978.0, 2458.0, 1247.0, 785.0, 464.0, 345.0, 236.0, 192.0, 143.0, 102.0, 88.0, 49.0, 39.0, 30.0, 22.0, 24.0, 8.0, 10.0, 13.0, 11.0, 4.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.2276611328125, -0.2200183868408203, -0.21237564086914062, -0.20473289489746094, -0.19709014892578125, -0.18944740295410156, -0.18180465698242188, -0.1741619110107422, -0.1665191650390625, -0.1588764190673828, -0.15123367309570312, -0.14359092712402344, -0.13594818115234375, -0.12830543518066406, -0.12066268920898438, -0.11301994323730469, -0.105377197265625, -0.09773445129394531, -0.09009170532226562, -0.08244895935058594, -0.07480621337890625, -0.06716346740722656, -0.059520721435546875, -0.05187797546386719, -0.0442352294921875, -0.03659248352050781, -0.028949737548828125, -0.021306991577148438, -0.01366424560546875, -0.0060214996337890625, 0.001621246337890625, 0.009263992309570312, 0.01690673828125, 0.024549484252929688, 0.032192230224609375, 0.03983497619628906, 0.04747772216796875, 0.05512046813964844, 0.06276321411132812, 0.07040596008300781, 0.0780487060546875, 0.08569145202636719, 0.09333419799804688, 0.10097694396972656, 0.10861968994140625, 0.11626243591308594, 0.12390518188476562, 0.1315479278564453, 0.139190673828125, 0.1468334197998047, 0.15447616577148438, 0.16211891174316406, 0.16976165771484375, 0.17740440368652344, 0.18504714965820312, 0.1926898956298828, 0.2003326416015625, 0.2079753875732422, 0.21561813354492188, 0.22326087951660156, 0.23090362548828125, 0.23854637145996094, 0.24618911743164062, 0.2538318634033203, 0.261474609375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 9.0, 10.0, 6.0, 6.0, 19.0, 12.0, 24.0, 22.0, 16.0, 23.0, 21.0, 35.0, 40.0, 33.0, 50.0, 35.0, 37.0, 40.0, 34.0, 39.0, 39.0, 44.0, 42.0, 46.0, 35.0, 35.0, 30.0, 31.0, 25.0, 22.0, 20.0, 24.0, 21.0, 9.0, 11.0, 13.0, 8.0, 7.0, 12.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.12164306640625, -0.11767864227294922, -0.11371421813964844, -0.10974979400634766, -0.10578536987304688, -0.1018209457397461, -0.09785652160644531, -0.09389209747314453, -0.08992767333984375, -0.08596324920654297, -0.08199882507324219, -0.0780344009399414, -0.07406997680664062, -0.07010555267333984, -0.06614112854003906, -0.06217670440673828, -0.0582122802734375, -0.05424785614013672, -0.05028343200683594, -0.046319007873535156, -0.042354583740234375, -0.038390159606933594, -0.03442573547363281, -0.03046131134033203, -0.02649688720703125, -0.02253246307373047, -0.018568038940429688, -0.014603614807128906, -0.010639190673828125, -0.006674766540527344, -0.0027103424072265625, 0.0012540817260742188, 0.005218505859375, 0.009182929992675781, 0.013147354125976562, 0.017111778259277344, 0.021076202392578125, 0.025040626525878906, 0.029005050659179688, 0.03296947479248047, 0.03693389892578125, 0.04089832305908203, 0.04486274719238281, 0.048827171325683594, 0.052791595458984375, 0.056756019592285156, 0.06072044372558594, 0.06468486785888672, 0.0686492919921875, 0.07261371612548828, 0.07657814025878906, 0.08054256439208984, 0.08450698852539062, 0.0884714126586914, 0.09243583679199219, 0.09640026092529297, 0.10036468505859375, 0.10432910919189453, 0.10829353332519531, 0.1122579574584961, 0.11622238159179688, 0.12018680572509766, 0.12415122985839844, 0.12811565399169922, 0.132080078125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 6.0, 8.0, 12.0, 6.0, 21.0, 15.0, 18.0, 32.0, 38.0, 55.0, 83.0, 139.0, 195.0, 347.0, 553.0, 942.0, 1629.0, 2970.0, 6160.0, 12663.0, 28585.0, 67776.0, 165723.0, 309765.0, 252868.0, 112264.0, 46192.0, 20240.0, 9190.0, 4517.0, 2325.0, 1227.0, 741.0, 440.0, 245.0, 185.0, 107.0, 71.0, 58.0, 46.0, 24.0, 19.0, 13.0, 11.0, 9.0, 6.0, 2.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0888671875, -0.08607101440429688, -0.08327484130859375, -0.08047866821289062, -0.0776824951171875, -0.07488632202148438, -0.07209014892578125, -0.06929397583007812, -0.066497802734375, -0.06370162963867188, -0.06090545654296875, -0.058109283447265625, -0.0553131103515625, -0.052516937255859375, -0.04972076416015625, -0.046924591064453125, -0.04412841796875, -0.041332244873046875, -0.03853607177734375, -0.035739898681640625, -0.0329437255859375, -0.030147552490234375, -0.02735137939453125, -0.024555206298828125, -0.021759033203125, -0.018962860107421875, -0.01616668701171875, -0.013370513916015625, -0.0105743408203125, -0.007778167724609375, -0.00498199462890625, -0.002185821533203125, 0.0006103515625, 0.003406524658203125, 0.00620269775390625, 0.008998870849609375, 0.0117950439453125, 0.014591217041015625, 0.01738739013671875, 0.020183563232421875, 0.022979736328125, 0.025775909423828125, 0.02857208251953125, 0.031368255615234375, 0.0341644287109375, 0.036960601806640625, 0.03975677490234375, 0.042552947998046875, 0.04534912109375, 0.048145294189453125, 0.05094146728515625, 0.053737640380859375, 0.0565338134765625, 0.059329986572265625, 0.06212615966796875, 0.06492233276367188, 0.067718505859375, 0.07051467895507812, 0.07331085205078125, 0.07610702514648438, 0.0789031982421875, 0.08169937133789062, 0.08449554443359375, 0.08729171752929688, 0.090087890625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 5.0, 3.0, 6.0, 6.0, 15.0, 16.0, 24.0, 24.0, 38.0, 54.0, 64.0, 80.0, 88.0, 89.0, 90.0, 80.0, 76.0, 51.0, 53.0, 50.0, 30.0, 19.0, 12.0, 9.0, 8.0, 4.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.167194366455078e-05, -8.811615407466888e-05, -8.456036448478699e-05, -8.100457489490509e-05, -7.74487853050232e-05, -7.38929957151413e-05, -7.03372061252594e-05, -6.67814165353775e-05, -6.32256269454956e-05, -5.966983735561371e-05, -5.611404776573181e-05, -5.2558258175849915e-05, -4.900246858596802e-05, -4.544667899608612e-05, -4.1890889406204224e-05, -3.833509981632233e-05, -3.477931022644043e-05, -3.122352063655853e-05, -2.7667731046676636e-05, -2.411194145679474e-05, -2.0556151866912842e-05, -1.7000362277030945e-05, -1.3444572687149048e-05, -9.888783097267151e-06, -6.332993507385254e-06, -2.777203917503357e-06, 7.7858567237854e-07, 4.334375262260437e-06, 7.890164852142334e-06, 1.1445954442024231e-05, 1.5001744031906128e-05, 1.8557533621788025e-05, 2.2113323211669922e-05, 2.566911280155182e-05, 2.9224902391433716e-05, 3.278069198131561e-05, 3.633648157119751e-05, 3.989227116107941e-05, 4.3448060750961304e-05, 4.70038503408432e-05, 5.05596399307251e-05, 5.4115429520606995e-05, 5.767121911048889e-05, 6.122700870037079e-05, 6.478279829025269e-05, 6.833858788013458e-05, 7.189437747001648e-05, 7.545016705989838e-05, 7.900595664978027e-05, 8.256174623966217e-05, 8.611753582954407e-05, 8.967332541942596e-05, 9.322911500930786e-05, 9.678490459918976e-05, 0.00010034069418907166, 0.00010389648377895355, 0.00010745227336883545, 0.00011100806295871735, 0.00011456385254859924, 0.00011811964213848114, 0.00012167543172836304, 0.00012523122131824493, 0.00012878701090812683, 0.00013234280049800873, 0.00013589859008789062]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 7.0, 16.0, 19.0, 17.0, 41.0, 59.0, 77.0, 141.0, 248.0, 427.0, 857.0, 2044.0, 6385.0, 31503.0, 260237.0, 626421.0, 98503.0, 15000.0, 3650.0, 1356.0, 672.0, 307.0, 178.0, 127.0, 90.0, 51.0, 31.0, 15.0, 25.0, 14.0, 4.0, 11.0, 6.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1915283203125, -0.18540573120117188, -0.17928314208984375, -0.17316055297851562, -0.1670379638671875, -0.16091537475585938, -0.15479278564453125, -0.14867019653320312, -0.142547607421875, -0.13642501831054688, -0.13030242919921875, -0.12417984008789062, -0.1180572509765625, -0.11193466186523438, -0.10581207275390625, -0.09968948364257812, -0.09356689453125, -0.08744430541992188, -0.08132171630859375, -0.07519912719726562, -0.0690765380859375, -0.06295394897460938, -0.05683135986328125, -0.050708770751953125, -0.044586181640625, -0.038463592529296875, -0.03234100341796875, -0.026218414306640625, -0.0200958251953125, -0.013973236083984375, -0.00785064697265625, -0.001728057861328125, 0.00439453125, 0.010517120361328125, 0.01663970947265625, 0.022762298583984375, 0.0288848876953125, 0.035007476806640625, 0.04113006591796875, 0.047252655029296875, 0.053375244140625, 0.059497833251953125, 0.06562042236328125, 0.07174301147460938, 0.0778656005859375, 0.08398818969726562, 0.09011077880859375, 0.09623336791992188, 0.10235595703125, 0.10847854614257812, 0.11460113525390625, 0.12072372436523438, 0.1268463134765625, 0.13296890258789062, 0.13909149169921875, 0.14521408081054688, 0.151336669921875, 0.15745925903320312, 0.16358184814453125, 0.16970443725585938, 0.1758270263671875, 0.18194961547851562, 0.18807220458984375, 0.19419479370117188, 0.2003173828125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 7.0, 3.0, 9.0, 12.0, 14.0, 13.0, 18.0, 27.0, 30.0, 39.0, 47.0, 63.0, 56.0, 81.0, 71.0, 84.0, 71.0, 64.0, 33.0, 60.0, 32.0, 23.0, 20.0, 19.0, 21.0, 19.0, 7.0, 13.0, 11.0, 5.0, 7.0, 2.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.0860595703125, -0.08367633819580078, -0.08129310607910156, -0.07890987396240234, -0.07652664184570312, -0.0741434097290039, -0.07176017761230469, -0.06937694549560547, -0.06699371337890625, -0.06461048126220703, -0.06222724914550781, -0.059844017028808594, -0.057460784912109375, -0.055077552795410156, -0.05269432067871094, -0.05031108856201172, -0.0479278564453125, -0.04554462432861328, -0.04316139221191406, -0.040778160095214844, -0.038394927978515625, -0.036011695861816406, -0.03362846374511719, -0.03124523162841797, -0.02886199951171875, -0.02647876739501953, -0.024095535278320312, -0.021712303161621094, -0.019329071044921875, -0.016945838928222656, -0.014562606811523438, -0.012179374694824219, -0.009796142578125, -0.007412910461425781, -0.0050296783447265625, -0.0026464462280273438, -0.000263214111328125, 0.0021200180053710938, 0.0045032501220703125, 0.006886482238769531, 0.00926971435546875, 0.011652946472167969, 0.014036178588867188, 0.016419410705566406, 0.018802642822265625, 0.021185874938964844, 0.023569107055664062, 0.02595233917236328, 0.0283355712890625, 0.03071880340576172, 0.03310203552246094, 0.035485267639160156, 0.037868499755859375, 0.040251731872558594, 0.04263496398925781, 0.04501819610595703, 0.04740142822265625, 0.04978466033935547, 0.05216789245605469, 0.054551124572753906, 0.056934356689453125, 0.059317588806152344, 0.06170082092285156, 0.06408405303955078, 0.06646728515625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 22.0, 62.0, 152.0, 301.0, 264.0, 118.0, 44.0, 19.0, 9.0, 3.0, 7.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.604045033454895, -1.5090916156768799, -1.4141383171081543, -1.3191848993301392, -1.224231481552124, -1.1292780637741089, -1.0343246459960938, -0.9393713474273682, -0.844417929649353, -0.7494645118713379, -0.6545111536979675, -0.5595577955245972, -0.46460437774658203, -0.3696509897708893, -0.27469760179519653, -0.17974424362182617, -0.08479082584381104, 0.010162562131881714, 0.10511595010757446, 0.2000693380832672, 0.29502272605895996, 0.3899761140346527, 0.48492950201034546, 0.5798828601837158, 0.674836277961731, 0.7697896957397461, 0.8647430539131165, 0.9596964120864868, 1.054649829864502, 1.149603247642517, 1.2445566654205322, 1.3395099639892578, 1.4344635009765625, 1.5294169187545776, 1.6243703365325928, 1.7193236351013184, 1.8142770528793335, 1.9092304706573486, 2.004183769226074, 2.099137306213379, 2.1940906047821045, 2.28904390335083, 2.3839974403381348, 2.4789507389068604, 2.573904037475586, 2.6688575744628906, 2.763810873031616, 2.858764171600342, 2.9537177085876465, 3.048671007156372, 3.1436245441436768, 3.2385778427124023, 3.333531379699707, 3.4284846782684326, 3.523437976837158, 3.618391513824463, 3.7133448123931885, 3.808298110961914, 3.9032516479492188, 3.9982049465179443, 4.09315824508667, 4.188111782073975, 4.283065319061279, 4.378018379211426, 4.4729719161987305]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 7.0, 4.0, 13.0, 14.0, 14.0, 19.0, 25.0, 38.0, 34.0, 52.0, 57.0, 73.0, 77.0, 67.0, 74.0, 68.0, 52.0, 60.0, 57.0, 45.0, 43.0, 27.0, 30.0, 15.0, 8.0, 15.0, 5.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2541041374206543, -1.2053381204605103, -1.1565721035003662, -1.1078060865402222, -1.0590400695800781, -1.0102741718292236, -0.9615081548690796, -0.9127421379089355, -0.8639761209487915, -0.8152101039886475, -0.7664440870285034, -0.7176781296730042, -0.6689121127128601, -0.6201460957527161, -0.5713801383972168, -0.5226141214370728, -0.4738481044769287, -0.42508208751678467, -0.376316100358963, -0.32755011320114136, -0.2787840962409973, -0.23001809418201447, -0.18125209212303162, -0.13248610496520996, -0.08372008800506592, -0.03495408594608307, 0.01381191611289978, 0.06257791817188263, 0.11134392023086548, 0.16010992228984833, 0.20887592434883118, 0.25764191150665283, 0.3064079284667969, 0.3551739454269409, 0.4039399325847626, 0.45270591974258423, 0.5014719367027283, 0.5502379536628723, 0.5990039110183716, 0.6477699279785156, 0.6965359449386597, 0.7453019618988037, 0.7940679788589478, 0.842833936214447, 0.8915999531745911, 0.9403659701347351, 0.9891319274902344, 1.0378979444503784, 1.0866639614105225, 1.1354299783706665, 1.1841959953308105, 1.2329620122909546, 1.2817280292510986, 1.3304939270019531, 1.3792599439620972, 1.4280259609222412, 1.4767919778823853, 1.5255579948425293, 1.5743240118026733, 1.6230900287628174, 1.6718559265136719, 1.720621943473816, 1.76938796043396, 1.818153977394104, 1.866919994354248]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 7.0, 14.0, 11.0, 20.0, 36.0, 47.0, 57.0, 140.0, 260.0, 550.0, 1707.0, 8108.0, 106396.0, 4008247.0, 59247.0, 6593.0, 1550.0, 590.0, 290.0, 144.0, 99.0, 53.0, 26.0, 22.0, 23.0, 11.0, 8.0, 3.0, 6.0, 3.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6884765625, -0.665069580078125, -0.64166259765625, -0.618255615234375, -0.5948486328125, -0.571441650390625, -0.54803466796875, -0.524627685546875, -0.501220703125, -0.477813720703125, -0.45440673828125, -0.430999755859375, -0.4075927734375, -0.384185791015625, -0.36077880859375, -0.337371826171875, -0.31396484375, -0.290557861328125, -0.26715087890625, -0.243743896484375, -0.2203369140625, -0.196929931640625, -0.17352294921875, -0.150115966796875, -0.126708984375, -0.103302001953125, -0.07989501953125, -0.056488037109375, -0.0330810546875, -0.009674072265625, 0.01373291015625, 0.037139892578125, 0.060546875, 0.083953857421875, 0.10736083984375, 0.130767822265625, 0.1541748046875, 0.177581787109375, 0.20098876953125, 0.224395751953125, 0.247802734375, 0.271209716796875, 0.29461669921875, 0.318023681640625, 0.3414306640625, 0.364837646484375, 0.38824462890625, 0.411651611328125, 0.43505859375, 0.458465576171875, 0.48187255859375, 0.505279541015625, 0.5286865234375, 0.552093505859375, 0.57550048828125, 0.598907470703125, 0.622314453125, 0.645721435546875, 0.66912841796875, 0.692535400390625, 0.7159423828125, 0.739349365234375, 0.76275634765625, 0.786163330078125, 0.8095703125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 8.0, 12.0, 14.0, 23.0, 23.0, 30.0, 38.0, 53.0, 68.0, 76.0, 104.0, 90.0, 80.0, 79.0, 54.0, 48.0, 38.0, 28.0, 28.0, 23.0, 13.0, 13.0, 10.0, 12.0, 11.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.039337158203125, -0.03809165954589844, -0.036846160888671875, -0.03560066223144531, -0.03435516357421875, -0.03310966491699219, -0.031864166259765625, -0.030618667602539062, -0.0293731689453125, -0.028127670288085938, -0.026882171630859375, -0.025636672973632812, -0.02439117431640625, -0.023145675659179688, -0.021900177001953125, -0.020654678344726562, -0.0194091796875, -0.018163681030273438, -0.016918182373046875, -0.015672683715820312, -0.01442718505859375, -0.013181686401367188, -0.011936187744140625, -0.010690689086914062, -0.0094451904296875, -0.008199691772460938, -0.006954193115234375, -0.0057086944580078125, -0.00446319580078125, -0.0032176971435546875, -0.001972198486328125, -0.0007266998291015625, 0.000518798828125, 0.0017642974853515625, 0.003009796142578125, 0.0042552947998046875, 0.00550079345703125, 0.0067462921142578125, 0.007991790771484375, 0.009237289428710938, 0.0104827880859375, 0.011728286743164062, 0.012973785400390625, 0.014219284057617188, 0.01546478271484375, 0.016710281372070312, 0.017955780029296875, 0.019201278686523438, 0.02044677734375, 0.021692276000976562, 0.022937774658203125, 0.024183273315429688, 0.02542877197265625, 0.026674270629882812, 0.027919769287109375, 0.029165267944335938, 0.0304107666015625, 0.03165626525878906, 0.032901763916015625, 0.03414726257324219, 0.03539276123046875, 0.03663825988769531, 0.037883758544921875, 0.03912925720214844, 0.040374755859375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 1.0, 7.0, 5.0, 8.0, 20.0, 15.0, 34.0, 55.0, 90.0, 170.0, 302.0, 588.0, 1251.0, 2670.0, 6267.0, 17390.0, 63956.0, 392150.0, 3313394.0, 316358.0, 54626.0, 15331.0, 5276.0, 2241.0, 964.0, 497.0, 275.0, 129.0, 81.0, 48.0, 25.0, 20.0, 13.0, 8.0, 6.0, 2.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.329833984375, -0.3210277557373047, -0.3122215270996094, -0.30341529846191406, -0.29460906982421875, -0.28580284118652344, -0.2769966125488281, -0.2681903839111328, -0.2593841552734375, -0.2505779266357422, -0.24177169799804688, -0.23296546936035156, -0.22415924072265625, -0.21535301208496094, -0.20654678344726562, -0.1977405548095703, -0.188934326171875, -0.1801280975341797, -0.17132186889648438, -0.16251564025878906, -0.15370941162109375, -0.14490318298339844, -0.13609695434570312, -0.1272907257080078, -0.1184844970703125, -0.10967826843261719, -0.10087203979492188, -0.09206581115722656, -0.08325958251953125, -0.07445335388183594, -0.06564712524414062, -0.05684089660644531, -0.04803466796875, -0.03922843933105469, -0.030422210693359375, -0.021615982055664062, -0.01280975341796875, -0.0040035247802734375, 0.004802703857421875, 0.013608932495117188, 0.0224151611328125, 0.031221389770507812, 0.040027618408203125, 0.04883384704589844, 0.05764007568359375, 0.06644630432128906, 0.07525253295898438, 0.08405876159667969, 0.092864990234375, 0.10167121887207031, 0.11047744750976562, 0.11928367614746094, 0.12808990478515625, 0.13689613342285156, 0.14570236206054688, 0.1545085906982422, 0.1633148193359375, 0.1721210479736328, 0.18092727661132812, 0.18973350524902344, 0.19853973388671875, 0.20734596252441406, 0.21615219116210938, 0.2249584197998047, 0.2337646484375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 3.0, 5.0, 2.0, 2.0, 4.0, 8.0, 10.0, 3.0, 21.0, 16.0, 22.0, 33.0, 42.0, 47.0, 82.0, 114.0, 147.0, 249.0, 446.0, 1363.0, 583.0, 273.0, 175.0, 130.0, 76.0, 50.0, 48.0, 30.0, 22.0, 18.0, 14.0, 9.0, 8.0, 2.0, 5.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.061920166015625, -0.060184478759765625, -0.05844879150390625, -0.056713104248046875, -0.0549774169921875, -0.053241729736328125, -0.05150604248046875, -0.049770355224609375, -0.04803466796875, -0.046298980712890625, -0.04456329345703125, -0.042827606201171875, -0.0410919189453125, -0.039356231689453125, -0.03762054443359375, -0.035884857177734375, -0.034149169921875, -0.032413482666015625, -0.03067779541015625, -0.028942108154296875, -0.0272064208984375, -0.025470733642578125, -0.02373504638671875, -0.021999359130859375, -0.020263671875, -0.018527984619140625, -0.01679229736328125, -0.015056610107421875, -0.0133209228515625, -0.011585235595703125, -0.00984954833984375, -0.008113861083984375, -0.006378173828125, -0.004642486572265625, -0.00290679931640625, -0.001171112060546875, 0.0005645751953125, 0.002300262451171875, 0.00403594970703125, 0.005771636962890625, 0.00750732421875, 0.009243011474609375, 0.01097869873046875, 0.012714385986328125, 0.0144500732421875, 0.016185760498046875, 0.01792144775390625, 0.019657135009765625, 0.021392822265625, 0.023128509521484375, 0.02486419677734375, 0.026599884033203125, 0.0283355712890625, 0.030071258544921875, 0.03180694580078125, 0.033542633056640625, 0.0352783203125, 0.037014007568359375, 0.03874969482421875, 0.040485382080078125, 0.0422210693359375, 0.043956756591796875, 0.04569244384765625, 0.047428131103515625, 0.049163818359375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 12.0, 32.0, 62.0, 123.0, 179.0, 174.0, 159.0, 118.0, 67.0, 43.0, 14.0, 12.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5787186622619629, -0.5629356503486633, -0.5471526384353638, -0.5313695669174194, -0.5155865550041199, -0.4998035430908203, -0.48402053117752075, -0.4682375192642212, -0.45245447754859924, -0.4366714656352997, -0.42088842391967773, -0.4051054120063782, -0.3893224000930786, -0.37353935837745667, -0.3577563464641571, -0.34197330474853516, -0.3261902928352356, -0.31040728092193604, -0.2946242392063141, -0.2788412272930145, -0.2630581855773926, -0.24727517366409302, -0.23149216175079346, -0.2157091349363327, -0.19992610812187195, -0.1841430813074112, -0.16836005449295044, -0.15257704257965088, -0.13679401576519012, -0.12101098895072937, -0.10522796958684921, -0.08944495022296906, -0.07366189360618591, -0.05787887051701546, -0.042095847427845, -0.026312824338674545, -0.01052980124950409, 0.005253225564956665, 0.021036244928836823, 0.03681926429271698, 0.052602291107177734, 0.06838531792163849, 0.08416833728551865, 0.0999513566493988, 0.11573438346385956, 0.1315174102783203, 0.14730042219161987, 0.16308344900608063, 0.17886647582054138, 0.19464950263500214, 0.2104325294494629, 0.22621554136276245, 0.2419985681772232, 0.25778159499168396, 0.2735646069049835, 0.28934764862060547, 0.30513066053390503, 0.3209136724472046, 0.33669671416282654, 0.3524797260761261, 0.36826276779174805, 0.3840457797050476, 0.39982879161834717, 0.41561180353164673, 0.4313948452472687]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 3.0, 5.0, 6.0, 9.0, 5.0, 12.0, 8.0, 14.0, 20.0, 15.0, 19.0, 29.0, 29.0, 32.0, 36.0, 37.0, 37.0, 30.0, 34.0, 43.0, 37.0, 50.0, 34.0, 33.0, 38.0, 46.0, 44.0, 27.0, 33.0, 24.0, 19.0, 23.0, 11.0, 21.0, 18.0, 27.0, 14.0, 11.0, 10.0, 10.0, 14.0, 7.0, 9.0, 5.0, 3.0, 5.0, 0.0, 4.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.20007222890853882, -0.1944400817155838, -0.18880793452262878, -0.18317577242851257, -0.17754362523555756, -0.17191147804260254, -0.16627933084964752, -0.1606471836566925, -0.1550150215625763, -0.14938287436962128, -0.14375072717666626, -0.13811856508255005, -0.13248641788959503, -0.12685427069664001, -0.121222123503685, -0.11558997631072998, -0.10995782911777496, -0.10432568192481995, -0.09869352728128433, -0.09306138008832932, -0.0874292254447937, -0.08179707825183868, -0.07616493105888367, -0.07053278386592865, -0.06490062922239304, -0.05926847830414772, -0.053636327385902405, -0.04800418019294739, -0.04237202927470207, -0.03673987835645676, -0.03110773116350174, -0.025475580245256424, -0.01984342932701111, -0.014211279340088367, -0.008579129353165627, -0.00294698029756546, 0.0026851706206798553, 0.008317321538925171, 0.013949468731880188, 0.019581619650125504, 0.02521377056837082, 0.030845921486616135, 0.03647807240486145, 0.04211021959781647, 0.04774237051606178, 0.0533745214343071, 0.059006668627262115, 0.06463882327079773, 0.07027097046375275, 0.07590311765670776, 0.08153527230024338, 0.0871674194931984, 0.09279957413673401, 0.09843172132968903, 0.10406386852264404, 0.10969601571559906, 0.11532817035913467, 0.12096031755208969, 0.1265924721956253, 0.13222461938858032, 0.13785676658153534, 0.14348891377449036, 0.14912107586860657, 0.15475322306156158, 0.1603853702545166]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 6.0, 7.0, 7.0, 10.0, 11.0, 17.0, 13.0, 24.0, 27.0, 45.0, 76.0, 93.0, 126.0, 201.0, 339.0, 526.0, 944.0, 1542.0, 2855.0, 5375.0, 11045.0, 24445.0, 58982.0, 155168.0, 360604.0, 258158.0, 96236.0, 38103.0, 16575.0, 7846.0, 3860.0, 2190.0, 1156.0, 678.0, 423.0, 253.0, 194.0, 117.0, 76.0, 51.0, 39.0, 19.0, 17.0, 12.0, 21.0, 10.0, 8.0, 6.0, 2.0, 5.0, 6.0, 7.0, 1.0, 5.0, 0.0, 0.0, 1.0], "bins": [-0.185302734375, -0.17946815490722656, -0.17363357543945312, -0.1677989959716797, -0.16196441650390625, -0.1561298370361328, -0.15029525756835938, -0.14446067810058594, -0.1386260986328125, -0.13279151916503906, -0.12695693969726562, -0.12112236022949219, -0.11528778076171875, -0.10945320129394531, -0.10361862182617188, -0.09778404235839844, -0.091949462890625, -0.08611488342285156, -0.08028030395507812, -0.07444572448730469, -0.06861114501953125, -0.06277656555175781, -0.056941986083984375, -0.05110740661621094, -0.0452728271484375, -0.03943824768066406, -0.033603668212890625, -0.027769088745117188, -0.02193450927734375, -0.016099929809570312, -0.010265350341796875, -0.0044307708740234375, 0.00140380859375, 0.0072383880615234375, 0.013072967529296875, 0.018907546997070312, 0.02474212646484375, 0.030576705932617188, 0.036411285400390625, 0.04224586486816406, 0.0480804443359375, 0.05391502380371094, 0.059749603271484375, 0.06558418273925781, 0.07141876220703125, 0.07725334167480469, 0.08308792114257812, 0.08892250061035156, 0.094757080078125, 0.10059165954589844, 0.10642623901367188, 0.11226081848144531, 0.11809539794921875, 0.12392997741699219, 0.12976455688476562, 0.13559913635253906, 0.1414337158203125, 0.14726829528808594, 0.15310287475585938, 0.1589374542236328, 0.16477203369140625, 0.1706066131591797, 0.17644119262695312, 0.18227577209472656, 0.1881103515625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 8.0, 5.0, 6.0, 9.0, 16.0, 15.0, 29.0, 22.0, 37.0, 52.0, 60.0, 79.0, 93.0, 96.0, 83.0, 66.0, 66.0, 59.0, 42.0, 31.0, 29.0, 23.0, 18.0, 12.0, 11.0, 10.0, 6.0, 4.0, 7.0, 4.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04052734375, -0.03925895690917969, -0.037990570068359375, -0.03672218322753906, -0.03545379638671875, -0.03418540954589844, -0.032917022705078125, -0.03164863586425781, -0.0303802490234375, -0.029111862182617188, -0.027843475341796875, -0.026575088500976562, -0.02530670166015625, -0.024038314819335938, -0.022769927978515625, -0.021501541137695312, -0.020233154296875, -0.018964767456054688, -0.017696380615234375, -0.016427993774414062, -0.01515960693359375, -0.013891220092773438, -0.012622833251953125, -0.011354446411132812, -0.0100860595703125, -0.008817672729492188, -0.007549285888671875, -0.0062808990478515625, -0.00501251220703125, -0.0037441253662109375, -0.002475738525390625, -0.0012073516845703125, 6.103515625e-05, 0.0013294219970703125, 0.002597808837890625, 0.0038661956787109375, 0.00513458251953125, 0.0064029693603515625, 0.007671356201171875, 0.008939743041992188, 0.0102081298828125, 0.011476516723632812, 0.012744903564453125, 0.014013290405273438, 0.01528167724609375, 0.016550064086914062, 0.017818450927734375, 0.019086837768554688, 0.020355224609375, 0.021623611450195312, 0.022891998291015625, 0.024160385131835938, 0.02542877197265625, 0.026697158813476562, 0.027965545654296875, 0.029233932495117188, 0.0305023193359375, 0.03177070617675781, 0.033039093017578125, 0.03430747985839844, 0.03557586669921875, 0.03684425354003906, 0.038112640380859375, 0.03938102722167969, 0.0406494140625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 6.0, 5.0, 7.0, 11.0, 13.0, 12.0, 26.0, 22.0, 30.0, 50.0, 62.0, 73.0, 98.0, 155.0, 169.0, 212.0, 348.0, 436.0, 663.0, 1197.0, 2115.0, 4833.0, 14269.0, 49111.0, 175264.0, 446129.0, 249123.0, 71179.0, 19869.0, 6480.0, 2555.0, 1292.0, 782.0, 495.0, 382.0, 296.0, 180.0, 147.0, 116.0, 80.0, 69.0, 49.0, 32.0, 34.0, 18.0, 21.0, 15.0, 6.0, 11.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.23876953125, -0.23145484924316406, -0.22414016723632812, -0.2168254852294922, -0.20951080322265625, -0.2021961212158203, -0.19488143920898438, -0.18756675720214844, -0.1802520751953125, -0.17293739318847656, -0.16562271118164062, -0.1583080291748047, -0.15099334716796875, -0.1436786651611328, -0.13636398315429688, -0.12904930114746094, -0.121734619140625, -0.11441993713378906, -0.10710525512695312, -0.09979057312011719, -0.09247589111328125, -0.08516120910644531, -0.07784652709960938, -0.07053184509277344, -0.0632171630859375, -0.05590248107910156, -0.048587799072265625, -0.04127311706542969, -0.03395843505859375, -0.026643753051757812, -0.019329071044921875, -0.012014389038085938, -0.00469970703125, 0.0026149749755859375, 0.009929656982421875, 0.017244338989257812, 0.02455902099609375, 0.03187370300292969, 0.039188385009765625, 0.04650306701660156, 0.0538177490234375, 0.06113243103027344, 0.06844711303710938, 0.07576179504394531, 0.08307647705078125, 0.09039115905761719, 0.09770584106445312, 0.10502052307128906, 0.112335205078125, 0.11964988708496094, 0.12696456909179688, 0.1342792510986328, 0.14159393310546875, 0.1489086151123047, 0.15622329711914062, 0.16353797912597656, 0.1708526611328125, 0.17816734313964844, 0.18548202514648438, 0.1927967071533203, 0.20011138916015625, 0.2074260711669922, 0.21474075317382812, 0.22205543518066406, 0.2293701171875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 2.0, 7.0, 5.0, 8.0, 9.0, 7.0, 12.0, 12.0, 15.0, 18.0, 17.0, 24.0, 23.0, 35.0, 30.0, 42.0, 40.0, 50.0, 37.0, 48.0, 38.0, 50.0, 40.0, 40.0, 47.0, 38.0, 34.0, 35.0, 27.0, 49.0, 32.0, 18.0, 28.0, 18.0, 13.0, 15.0, 11.0, 5.0, 8.0, 1.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.152587890625, -0.14769554138183594, -0.14280319213867188, -0.1379108428955078, -0.13301849365234375, -0.1281261444091797, -0.12323379516601562, -0.11834144592285156, -0.1134490966796875, -0.10855674743652344, -0.10366439819335938, -0.09877204895019531, -0.09387969970703125, -0.08898735046386719, -0.08409500122070312, -0.07920265197753906, -0.074310302734375, -0.06941795349121094, -0.06452560424804688, -0.05963325500488281, -0.05474090576171875, -0.04984855651855469, -0.044956207275390625, -0.04006385803222656, -0.0351715087890625, -0.030279159545898438, -0.025386810302734375, -0.020494461059570312, -0.01560211181640625, -0.010709762573242188, -0.005817413330078125, -0.0009250640869140625, 0.00396728515625, 0.008859634399414062, 0.013751983642578125, 0.018644332885742188, 0.02353668212890625, 0.028429031372070312, 0.033321380615234375, 0.03821372985839844, 0.0431060791015625, 0.04799842834472656, 0.052890777587890625, 0.05778312683105469, 0.06267547607421875, 0.06756782531738281, 0.07246017456054688, 0.07735252380371094, 0.082244873046875, 0.08713722229003906, 0.09202957153320312, 0.09692192077636719, 0.10181427001953125, 0.10670661926269531, 0.11159896850585938, 0.11649131774902344, 0.1213836669921875, 0.12627601623535156, 0.13116836547851562, 0.1360607147216797, 0.14095306396484375, 0.1458454132080078, 0.15073776245117188, 0.15563011169433594, 0.1605224609375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 2.0, 7.0, 5.0, 8.0, 12.0, 12.0, 31.0, 51.0, 96.0, 103.0, 212.0, 325.0, 636.0, 1405.0, 3065.0, 7096.0, 17978.0, 48908.0, 146506.0, 436102.0, 258182.0, 80174.0, 28328.0, 10828.0, 4469.0, 1948.0, 926.0, 481.0, 248.0, 162.0, 87.0, 53.0, 39.0, 20.0, 22.0, 7.0, 8.0, 9.0, 4.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11077880859375, -0.10705280303955078, -0.10332679748535156, -0.09960079193115234, -0.09587478637695312, -0.0921487808227539, -0.08842277526855469, -0.08469676971435547, -0.08097076416015625, -0.07724475860595703, -0.07351875305175781, -0.0697927474975586, -0.06606674194335938, -0.062340736389160156, -0.05861473083496094, -0.05488872528076172, -0.0511627197265625, -0.04743671417236328, -0.04371070861816406, -0.039984703063964844, -0.036258697509765625, -0.032532691955566406, -0.028806686401367188, -0.02508068084716797, -0.02135467529296875, -0.01762866973876953, -0.013902664184570312, -0.010176658630371094, -0.006450653076171875, -0.0027246475219726562, 0.0010013580322265625, 0.004727363586425781, 0.008453369140625, 0.012179374694824219, 0.015905380249023438, 0.019631385803222656, 0.023357391357421875, 0.027083396911621094, 0.030809402465820312, 0.03453540802001953, 0.03826141357421875, 0.04198741912841797, 0.04571342468261719, 0.049439430236816406, 0.053165435791015625, 0.056891441345214844, 0.06061744689941406, 0.06434345245361328, 0.0680694580078125, 0.07179546356201172, 0.07552146911621094, 0.07924747467041016, 0.08297348022460938, 0.0866994857788086, 0.09042549133300781, 0.09415149688720703, 0.09787750244140625, 0.10160350799560547, 0.10532951354980469, 0.1090555191040039, 0.11278152465820312, 0.11650753021240234, 0.12023353576660156, 0.12395954132080078, 0.127685546875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 1.0, 2.0, 4.0, 7.0, 2.0, 4.0, 11.0, 15.0, 10.0, 18.0, 24.0, 32.0, 62.0, 55.0, 71.0, 90.0, 120.0, 93.0, 88.0, 75.0, 50.0, 48.0, 25.0, 26.0, 17.0, 10.0, 16.0, 7.0, 9.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.137392044067383e-05, -8.860509842634201e-05, -8.583627641201019e-05, -8.306745439767838e-05, -8.029863238334656e-05, -7.752981036901474e-05, -7.476098835468292e-05, -7.19921663403511e-05, -6.922334432601929e-05, -6.645452231168747e-05, -6.368570029735565e-05, -6.0916878283023834e-05, -5.8148056268692017e-05, -5.53792342543602e-05, -5.261041224002838e-05, -4.9841590225696564e-05, -4.7072768211364746e-05, -4.430394619703293e-05, -4.153512418270111e-05, -3.876630216836929e-05, -3.5997480154037476e-05, -3.322865813970566e-05, -3.045983612537384e-05, -2.7691014111042023e-05, -2.4922192096710205e-05, -2.2153370082378387e-05, -1.938454806804657e-05, -1.6615726053714752e-05, -1.3846904039382935e-05, -1.1078082025051117e-05, -8.3092600107193e-06, -5.540437996387482e-06, -2.771615982055664e-06, -2.7939677238464355e-09, 2.766028046607971e-06, 5.534850060939789e-06, 8.303672075271606e-06, 1.1072494089603424e-05, 1.3841316103935242e-05, 1.661013811826706e-05, 1.9378960132598877e-05, 2.2147782146930695e-05, 2.4916604161262512e-05, 2.768542617559433e-05, 3.0454248189926147e-05, 3.3223070204257965e-05, 3.599189221858978e-05, 3.87607142329216e-05, 4.152953624725342e-05, 4.4298358261585236e-05, 4.706718027591705e-05, 4.983600229024887e-05, 5.260482430458069e-05, 5.5373646318912506e-05, 5.8142468333244324e-05, 6.091129034757614e-05, 6.368011236190796e-05, 6.644893437623978e-05, 6.92177563905716e-05, 7.198657840490341e-05, 7.475540041923523e-05, 7.752422243356705e-05, 8.029304444789886e-05, 8.306186646223068e-05, 8.58306884765625e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 8.0, 7.0, 10.0, 22.0, 23.0, 36.0, 56.0, 71.0, 101.0, 159.0, 214.0, 389.0, 574.0, 1094.0, 2233.0, 5532.0, 18322.0, 72146.0, 402708.0, 437282.0, 76996.0, 19448.0, 5981.0, 2319.0, 1116.0, 590.0, 345.0, 229.0, 164.0, 98.0, 83.0, 50.0, 42.0, 26.0, 23.0, 21.0, 9.0, 11.0, 7.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.166748046875, -0.16137313842773438, -0.15599822998046875, -0.15062332153320312, -0.1452484130859375, -0.13987350463867188, -0.13449859619140625, -0.12912368774414062, -0.123748779296875, -0.11837387084960938, -0.11299896240234375, -0.10762405395507812, -0.1022491455078125, -0.09687423706054688, -0.09149932861328125, -0.08612442016601562, -0.08074951171875, -0.07537460327148438, -0.06999969482421875, -0.06462478637695312, -0.0592498779296875, -0.053874969482421875, -0.04850006103515625, -0.043125152587890625, -0.037750244140625, -0.032375335693359375, -0.02700042724609375, -0.021625518798828125, -0.0162506103515625, -0.010875701904296875, -0.00550079345703125, -0.000125885009765625, 0.0052490234375, 0.010623931884765625, 0.01599884033203125, 0.021373748779296875, 0.0267486572265625, 0.032123565673828125, 0.03749847412109375, 0.042873382568359375, 0.048248291015625, 0.053623199462890625, 0.05899810791015625, 0.06437301635742188, 0.0697479248046875, 0.07512283325195312, 0.08049774169921875, 0.08587265014648438, 0.09124755859375, 0.09662246704101562, 0.10199737548828125, 0.10737228393554688, 0.1127471923828125, 0.11812210083007812, 0.12349700927734375, 0.12887191772460938, 0.134246826171875, 0.13962173461914062, 0.14499664306640625, 0.15037155151367188, 0.1557464599609375, 0.16112136840820312, 0.16649627685546875, 0.17187118530273438, 0.17724609375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 5.0, 5.0, 9.0, 10.0, 13.0, 7.0, 12.0, 20.0, 17.0, 14.0, 28.0, 32.0, 43.0, 37.0, 60.0, 79.0, 88.0, 95.0, 80.0, 65.0, 61.0, 48.0, 32.0, 24.0, 14.0, 25.0, 12.0, 12.0, 9.0, 6.0, 7.0, 7.0, 7.0, 4.0, 6.0, 6.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07977294921875, -0.07693862915039062, -0.07410430908203125, -0.07126998901367188, -0.0684356689453125, -0.06560134887695312, -0.06276702880859375, -0.059932708740234375, -0.057098388671875, -0.054264068603515625, -0.05142974853515625, -0.048595428466796875, -0.0457611083984375, -0.042926788330078125, -0.04009246826171875, -0.037258148193359375, -0.034423828125, -0.031589508056640625, -0.02875518798828125, -0.025920867919921875, -0.0230865478515625, -0.020252227783203125, -0.01741790771484375, -0.014583587646484375, -0.011749267578125, -0.008914947509765625, -0.00608062744140625, -0.003246307373046875, -0.0004119873046875, 0.002422332763671875, 0.00525665283203125, 0.008090972900390625, 0.01092529296875, 0.013759613037109375, 0.01659393310546875, 0.019428253173828125, 0.0222625732421875, 0.025096893310546875, 0.02793121337890625, 0.030765533447265625, 0.033599853515625, 0.036434173583984375, 0.03926849365234375, 0.042102813720703125, 0.0449371337890625, 0.047771453857421875, 0.05060577392578125, 0.053440093994140625, 0.0562744140625, 0.059108734130859375, 0.06194305419921875, 0.06477737426757812, 0.0676116943359375, 0.07044601440429688, 0.07328033447265625, 0.07611465454101562, 0.078948974609375, 0.08178329467773438, 0.08461761474609375, 0.08745193481445312, 0.0902862548828125, 0.09312057495117188, 0.09595489501953125, 0.09878921508789062, 0.10162353515625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 8.0, 9.0, 26.0, 29.0, 44.0, 86.0, 102.0, 119.0, 141.0, 122.0, 110.0, 61.0, 47.0, 42.0, 15.0, 9.0, 11.0, 8.0, 8.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.250376582145691, -1.2030826807022095, -1.155788779258728, -1.1084948778152466, -1.0612008571624756, -1.0139069557189941, -0.9666130542755127, -0.9193191528320312, -0.8720252513885498, -0.8247313499450684, -0.7774374485015869, -0.7301434874534607, -0.6828495860099792, -0.6355556845664978, -0.5882617235183716, -0.5409678220748901, -0.4936739206314087, -0.44638001918792725, -0.3990860879421234, -0.3517921566963196, -0.30449825525283813, -0.2572043538093567, -0.20991042256355286, -0.16261649131774902, -0.11532258987426758, -0.06802867352962494, -0.0207347571849823, 0.02655915915966034, 0.07385307550430298, 0.12114699184894562, 0.16844090819358826, 0.2157348394393921, 0.263028621673584, 0.31032252311706543, 0.35761645436286926, 0.4049103856086731, 0.45220428705215454, 0.499498188495636, 0.5467921495437622, 0.5940860509872437, 0.6413799524307251, 0.6886738538742065, 0.735967755317688, 0.7832617163658142, 0.8305556178092957, 0.8778495192527771, 0.9251434803009033, 0.9724373817443848, 1.0197312831878662, 1.0670251846313477, 1.114319086074829, 1.1616129875183105, 1.208906888961792, 1.256200909614563, 1.3034948110580444, 1.3507887125015259, 1.3980826139450073, 1.4453765153884888, 1.4926704168319702, 1.5399643182754517, 1.5872583389282227, 1.634552240371704, 1.6818461418151855, 1.729140043258667, 1.7764339447021484]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 2.0, 7.0, 4.0, 4.0, 5.0, 4.0, 9.0, 9.0, 14.0, 14.0, 23.0, 21.0, 19.0, 22.0, 19.0, 33.0, 32.0, 42.0, 33.0, 54.0, 42.0, 33.0, 43.0, 45.0, 45.0, 44.0, 41.0, 33.0, 31.0, 20.0, 21.0, 29.0, 33.0, 24.0, 24.0, 21.0, 17.0, 13.0, 20.0, 14.0, 8.0, 8.0, 7.0, 8.0, 2.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.0215882062911987, -0.9906684756278992, -0.9597487449645996, -0.9288290143013, -0.8979092836380005, -0.8669895529747009, -0.8360698223114014, -0.8051501512527466, -0.7742303609848022, -0.7433106303215027, -0.7123908996582031, -0.6814711689949036, -0.650551438331604, -0.6196317076683044, -0.5887119770050049, -0.5577923059463501, -0.5268725752830505, -0.495952844619751, -0.4650331139564514, -0.43411338329315186, -0.4031936526298523, -0.37227392196655273, -0.34135422110557556, -0.310434490442276, -0.27951475977897644, -0.24859502911567688, -0.21767529845237732, -0.18675558269023895, -0.1558358520269394, -0.12491612136363983, -0.09399640560150146, -0.0630766749382019, -0.032156944274902344, -0.0012372173368930817, 0.02968250960111618, 0.060602232813835144, 0.0915219634771347, 0.12244169414043427, 0.15336140990257263, 0.1842811405658722, 0.21520087122917175, 0.2461206018924713, 0.2770403325557709, 0.30796003341674805, 0.3388797640800476, 0.36979949474334717, 0.40071922540664673, 0.4316389560699463, 0.46255868673324585, 0.4934784173965454, 0.524398148059845, 0.5553178787231445, 0.5862376093864441, 0.6171573400497437, 0.6480770111083984, 0.6789968013763428, 0.7099164724349976, 0.7408362030982971, 0.7717559337615967, 0.8026756644248962, 0.8335953950881958, 0.8645151257514954, 0.8954348564147949, 0.9263545274734497, 0.957274317741394]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 2.0, 4.0, 6.0, 4.0, 9.0, 14.0, 16.0, 18.0, 45.0, 45.0, 99.0, 134.0, 232.0, 412.0, 757.0, 1560.0, 4066.0, 13280.0, 59903.0, 707633.0, 3284837.0, 91804.0, 18770.0, 5798.0, 2183.0, 997.0, 611.0, 327.0, 220.0, 157.0, 112.0, 71.0, 47.0, 31.0, 23.0, 10.0, 11.0, 5.0, 15.0, 2.0, 8.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26025390625, -0.25099945068359375, -0.2417449951171875, -0.23249053955078125, -0.223236083984375, -0.21398162841796875, -0.2047271728515625, -0.19547271728515625, -0.18621826171875, -0.17696380615234375, -0.1677093505859375, -0.15845489501953125, -0.149200439453125, -0.13994598388671875, -0.1306915283203125, -0.12143707275390625, -0.1121826171875, -0.10292816162109375, -0.0936737060546875, -0.08441925048828125, -0.075164794921875, -0.06591033935546875, -0.0566558837890625, -0.04740142822265625, -0.03814697265625, -0.02889251708984375, -0.0196380615234375, -0.01038360595703125, -0.001129150390625, 0.00812530517578125, 0.0173797607421875, 0.02663421630859375, 0.035888671875, 0.04514312744140625, 0.0543975830078125, 0.06365203857421875, 0.072906494140625, 0.08216094970703125, 0.0914154052734375, 0.10066986083984375, 0.10992431640625, 0.11917877197265625, 0.1284332275390625, 0.13768768310546875, 0.146942138671875, 0.15619659423828125, 0.1654510498046875, 0.17470550537109375, 0.1839599609375, 0.19321441650390625, 0.2024688720703125, 0.21172332763671875, 0.220977783203125, 0.23023223876953125, 0.2394866943359375, 0.24874114990234375, 0.25799560546875, 0.26725006103515625, 0.2765045166015625, 0.28575897216796875, 0.295013427734375, 0.30426788330078125, 0.3135223388671875, 0.32277679443359375, 0.33203125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 7.0, 7.0, 14.0, 14.0, 19.0, 23.0, 37.0, 44.0, 40.0, 44.0, 49.0, 62.0, 70.0, 69.0, 68.0, 75.0, 61.0, 51.0, 42.0, 43.0, 32.0, 17.0, 22.0, 15.0, 22.0, 11.0, 7.0, 6.0, 15.0, 4.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.043212890625, -0.04194211959838867, -0.040671348571777344, -0.039400577545166016, -0.03812980651855469, -0.03685903549194336, -0.03558826446533203, -0.0343174934387207, -0.033046722412109375, -0.03177595138549805, -0.03050518035888672, -0.02923440933227539, -0.027963638305664062, -0.026692867279052734, -0.025422096252441406, -0.024151325225830078, -0.02288055419921875, -0.021609783172607422, -0.020339012145996094, -0.019068241119384766, -0.017797470092773438, -0.01652669906616211, -0.015255928039550781, -0.013985157012939453, -0.012714385986328125, -0.011443614959716797, -0.010172843933105469, -0.00890207290649414, -0.0076313018798828125, -0.006360530853271484, -0.005089759826660156, -0.003818988800048828, -0.0025482177734375, -0.0012774467468261719, -6.67572021484375e-06, 0.0012640953063964844, 0.0025348663330078125, 0.0038056373596191406, 0.005076408386230469, 0.006347179412841797, 0.007617950439453125, 0.008888721466064453, 0.010159492492675781, 0.01143026351928711, 0.012701034545898438, 0.013971805572509766, 0.015242576599121094, 0.016513347625732422, 0.01778411865234375, 0.019054889678955078, 0.020325660705566406, 0.021596431732177734, 0.022867202758789062, 0.02413797378540039, 0.02540874481201172, 0.026679515838623047, 0.027950286865234375, 0.029221057891845703, 0.03049182891845703, 0.03176259994506836, 0.03303337097167969, 0.034304141998291016, 0.035574913024902344, 0.03684568405151367, 0.038116455078125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 4.0, 2.0, 5.0, 13.0, 22.0, 28.0, 50.0, 91.0, 140.0, 205.0, 396.0, 664.0, 1293.0, 2741.0, 6307.0, 16123.0, 51417.0, 225809.0, 3048986.0, 686243.0, 105617.0, 29464.0, 10226.0, 4173.0, 1894.0, 967.0, 510.0, 315.0, 175.0, 126.0, 83.0, 64.0, 33.0, 34.0, 20.0, 11.0, 11.0, 6.0, 6.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2415771484375, -0.23482131958007812, -0.22806549072265625, -0.22130966186523438, -0.2145538330078125, -0.20779800415039062, -0.20104217529296875, -0.19428634643554688, -0.187530517578125, -0.18077468872070312, -0.17401885986328125, -0.16726303100585938, -0.1605072021484375, -0.15375137329101562, -0.14699554443359375, -0.14023971557617188, -0.13348388671875, -0.12672805786132812, -0.11997222900390625, -0.11321640014648438, -0.1064605712890625, -0.09970474243164062, -0.09294891357421875, -0.08619308471679688, -0.079437255859375, -0.07268142700195312, -0.06592559814453125, -0.059169769287109375, -0.0524139404296875, -0.045658111572265625, -0.03890228271484375, -0.032146453857421875, -0.025390625, -0.018634796142578125, -0.01187896728515625, -0.005123138427734375, 0.0016326904296875, 0.008388519287109375, 0.01514434814453125, 0.021900177001953125, 0.028656005859375, 0.035411834716796875, 0.04216766357421875, 0.048923492431640625, 0.0556793212890625, 0.062435150146484375, 0.06919097900390625, 0.07594680786132812, 0.08270263671875, 0.08945846557617188, 0.09621429443359375, 0.10297012329101562, 0.1097259521484375, 0.11648178100585938, 0.12323760986328125, 0.12999343872070312, 0.136749267578125, 0.14350509643554688, 0.15026092529296875, 0.15701675415039062, 0.1637725830078125, 0.17052841186523438, 0.17728424072265625, 0.18404006958007812, 0.1907958984375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 8.0, 10.0, 11.0, 14.0, 18.0, 18.0, 24.0, 54.0, 86.0, 117.0, 260.0, 495.0, 1708.0, 584.0, 241.0, 146.0, 88.0, 66.0, 43.0, 23.0, 20.0, 9.0, 7.0, 7.0, 6.0, 4.0, 1.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07171630859375, -0.0692901611328125, -0.066864013671875, -0.0644378662109375, -0.06201171875, -0.0595855712890625, -0.057159423828125, -0.0547332763671875, -0.05230712890625, -0.0498809814453125, -0.047454833984375, -0.0450286865234375, -0.0426025390625, -0.0401763916015625, -0.037750244140625, -0.0353240966796875, -0.03289794921875, -0.0304718017578125, -0.028045654296875, -0.0256195068359375, -0.023193359375, -0.0207672119140625, -0.018341064453125, -0.0159149169921875, -0.01348876953125, -0.0110626220703125, -0.008636474609375, -0.0062103271484375, -0.0037841796875, -0.0013580322265625, 0.001068115234375, 0.0034942626953125, 0.00592041015625, 0.0083465576171875, 0.010772705078125, 0.0131988525390625, 0.015625, 0.0180511474609375, 0.020477294921875, 0.0229034423828125, 0.02532958984375, 0.0277557373046875, 0.030181884765625, 0.0326080322265625, 0.0350341796875, 0.0374603271484375, 0.039886474609375, 0.0423126220703125, 0.04473876953125, 0.0471649169921875, 0.049591064453125, 0.0520172119140625, 0.054443359375, 0.0568695068359375, 0.059295654296875, 0.0617218017578125, 0.06414794921875, 0.0665740966796875, 0.069000244140625, 0.0714263916015625, 0.0738525390625, 0.0762786865234375, 0.078704833984375, 0.0811309814453125, 0.08355712890625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 6.0, 9.0, 15.0, 38.0, 72.0, 86.0, 175.0, 177.0, 134.0, 103.0, 70.0, 56.0, 31.0, 13.0, 7.0, 3.0, 2.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3565395176410675, -0.3408111333847046, -0.3250827193260193, -0.30935433506965637, -0.29362592101097107, -0.27789753675460815, -0.26216912269592285, -0.24644073843955994, -0.23071233928203583, -0.21498394012451172, -0.1992555409669876, -0.1835271418094635, -0.16779875755310059, -0.15207034349441528, -0.13634195923805237, -0.12061356008052826, -0.10488516092300415, -0.08915676176548004, -0.07342836260795593, -0.05769997090101242, -0.04197157174348831, -0.026243172585964203, -0.010514780879020691, 0.005213618278503418, 0.020942017436027527, 0.036670416593551636, 0.052398812025785446, 0.06812720745801926, 0.08385560661554337, 0.09958400577306747, 0.11531239748001099, 0.1310407966375351, 0.1467692255973816, 0.1624976247549057, 0.1782260239124298, 0.19395440816879272, 0.20968282222747803, 0.22541120648384094, 0.24113960564136505, 0.25686800479888916, 0.27259641885757446, 0.2883248031139374, 0.3040532171726227, 0.3197816014289856, 0.3355100154876709, 0.3512383997440338, 0.36696678400039673, 0.38269519805908203, 0.39842358231544495, 0.41415196657180786, 0.42988038063049316, 0.4456087648868561, 0.4613371789455414, 0.4770655632019043, 0.4927939772605896, 0.5085223913192749, 0.5242507457733154, 0.5399791598320007, 0.5557075142860413, 0.5714359283447266, 0.5871643424034119, 0.6028927564620972, 0.6186211109161377, 0.634349524974823, 0.6500779390335083]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 7.0, 8.0, 9.0, 6.0, 9.0, 11.0, 15.0, 14.0, 16.0, 21.0, 30.0, 34.0, 40.0, 33.0, 48.0, 53.0, 50.0, 57.0, 43.0, 40.0, 56.0, 44.0, 40.0, 40.0, 40.0, 34.0, 32.0, 29.0, 29.0, 16.0, 23.0, 14.0, 11.0, 15.0, 10.0, 5.0, 5.0, 5.0, 6.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2550392150878906, -0.24742937088012695, -0.23981952667236328, -0.2322096824645996, -0.22459983825683594, -0.21698999404907227, -0.2093801349401474, -0.20177029073238373, -0.19416044652462006, -0.18655060231685638, -0.1789407581090927, -0.17133091390132904, -0.16372105479240417, -0.1561112105846405, -0.14850136637687683, -0.14089152216911316, -0.1332816779613495, -0.12567183375358582, -0.11806198954582214, -0.11045213788747787, -0.1028422936797142, -0.09523244947195053, -0.08762259781360626, -0.08001275360584259, -0.07240290939807892, -0.06479306519031525, -0.057183217257261276, -0.049573369324207306, -0.041963525116443634, -0.03435368090867996, -0.026743832975625992, -0.01913398504257202, -0.01152414083480835, -0.0039142947643995285, 0.0036955513060092926, 0.011305397376418114, 0.018915243446826935, 0.026525087654590607, 0.03413493558764458, 0.04174478352069855, 0.04935462772846222, 0.05696447193622589, 0.06457431614398956, 0.07218416780233383, 0.0797940120100975, 0.08740385621786118, 0.09501370787620544, 0.10262355208396912, 0.11023339629173279, 0.11784324049949646, 0.12545308470726013, 0.1330629289150238, 0.14067277312278748, 0.14828261733055115, 0.155892476439476, 0.16350232064723969, 0.17111216485500336, 0.17872200906276703, 0.1863318532705307, 0.19394169747829437, 0.20155155658721924, 0.2091614007949829, 0.21677124500274658, 0.22438108921051025, 0.23199093341827393]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 6.0, 5.0, 9.0, 9.0, 18.0, 24.0, 38.0, 50.0, 113.0, 219.0, 441.0, 1044.0, 2251.0, 6489.0, 18620.0, 60340.0, 210982.0, 474387.0, 191427.0, 54906.0, 17280.0, 5904.0, 2236.0, 902.0, 379.0, 207.0, 96.0, 62.0, 47.0, 16.0, 17.0, 7.0, 10.0, 3.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.243408203125, -0.23673248291015625, -0.2300567626953125, -0.22338104248046875, -0.216705322265625, -0.21002960205078125, -0.2033538818359375, -0.19667816162109375, -0.19000244140625, -0.18332672119140625, -0.1766510009765625, -0.16997528076171875, -0.163299560546875, -0.15662384033203125, -0.1499481201171875, -0.14327239990234375, -0.1365966796875, -0.12992095947265625, -0.1232452392578125, -0.11656951904296875, -0.109893798828125, -0.10321807861328125, -0.0965423583984375, -0.08986663818359375, -0.08319091796875, -0.07651519775390625, -0.0698394775390625, -0.06316375732421875, -0.056488037109375, -0.04981231689453125, -0.0431365966796875, -0.03646087646484375, -0.02978515625, -0.02310943603515625, -0.0164337158203125, -0.00975799560546875, -0.003082275390625, 0.00359344482421875, 0.0102691650390625, 0.01694488525390625, 0.02362060546875, 0.03029632568359375, 0.0369720458984375, 0.04364776611328125, 0.050323486328125, 0.05699920654296875, 0.0636749267578125, 0.07035064697265625, 0.0770263671875, 0.08370208740234375, 0.0903778076171875, 0.09705352783203125, 0.103729248046875, 0.11040496826171875, 0.1170806884765625, 0.12375640869140625, 0.13043212890625, 0.13710784912109375, 0.1437835693359375, 0.15045928955078125, 0.157135009765625, 0.16381072998046875, 0.1704864501953125, 0.17716217041015625, 0.183837890625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 6.0, 21.0, 8.0, 14.0, 29.0, 30.0, 35.0, 30.0, 43.0, 49.0, 55.0, 72.0, 74.0, 63.0, 77.0, 60.0, 52.0, 58.0, 35.0, 38.0, 34.0, 19.0, 18.0, 20.0, 12.0, 7.0, 8.0, 13.0, 7.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.042449951171875, -0.0411829948425293, -0.039916038513183594, -0.03864908218383789, -0.03738212585449219, -0.036115169525146484, -0.03484821319580078, -0.03358125686645508, -0.032314300537109375, -0.031047344207763672, -0.02978038787841797, -0.028513431549072266, -0.027246475219726562, -0.02597951889038086, -0.024712562561035156, -0.023445606231689453, -0.02217864990234375, -0.020911693572998047, -0.019644737243652344, -0.01837778091430664, -0.017110824584960938, -0.015843868255615234, -0.014576911926269531, -0.013309955596923828, -0.012042999267578125, -0.010776042938232422, -0.009509086608886719, -0.008242130279541016, -0.0069751739501953125, -0.005708217620849609, -0.004441261291503906, -0.003174304962158203, -0.0019073486328125, -0.0006403923034667969, 0.0006265640258789062, 0.0018935203552246094, 0.0031604766845703125, 0.004427433013916016, 0.005694389343261719, 0.006961345672607422, 0.008228302001953125, 0.009495258331298828, 0.010762214660644531, 0.012029170989990234, 0.013296127319335938, 0.01456308364868164, 0.015830039978027344, 0.017096996307373047, 0.01836395263671875, 0.019630908966064453, 0.020897865295410156, 0.02216482162475586, 0.023431777954101562, 0.024698734283447266, 0.02596569061279297, 0.027232646942138672, 0.028499603271484375, 0.029766559600830078, 0.03103351593017578, 0.032300472259521484, 0.03356742858886719, 0.03483438491821289, 0.036101341247558594, 0.0373682975769043, 0.03863525390625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 10.0, 18.0, 16.0, 21.0, 24.0, 37.0, 51.0, 67.0, 93.0, 139.0, 166.0, 227.0, 301.0, 436.0, 636.0, 1089.0, 1911.0, 4589.0, 13967.0, 50688.0, 186002.0, 457250.0, 235967.0, 65594.0, 17694.0, 5638.0, 2304.0, 1121.0, 741.0, 502.0, 334.0, 278.0, 153.0, 121.0, 88.0, 63.0, 73.0, 40.0, 30.0, 24.0, 9.0, 12.0, 14.0, 8.0, 4.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1966552734375, -0.19062232971191406, -0.18458938598632812, -0.1785564422607422, -0.17252349853515625, -0.1664905548095703, -0.16045761108398438, -0.15442466735839844, -0.1483917236328125, -0.14235877990722656, -0.13632583618164062, -0.1302928924560547, -0.12425994873046875, -0.11822700500488281, -0.11219406127929688, -0.10616111755371094, -0.100128173828125, -0.09409523010253906, -0.08806228637695312, -0.08202934265136719, -0.07599639892578125, -0.06996345520019531, -0.06393051147460938, -0.05789756774902344, -0.0518646240234375, -0.04583168029785156, -0.039798736572265625, -0.03376579284667969, -0.02773284912109375, -0.021699905395507812, -0.015666961669921875, -0.009634017944335938, -0.00360107421875, 0.0024318695068359375, 0.008464813232421875, 0.014497756958007812, 0.02053070068359375, 0.026563644409179688, 0.032596588134765625, 0.03862953186035156, 0.0446624755859375, 0.05069541931152344, 0.056728363037109375, 0.06276130676269531, 0.06879425048828125, 0.07482719421386719, 0.08086013793945312, 0.08689308166503906, 0.092926025390625, 0.09895896911621094, 0.10499191284179688, 0.11102485656738281, 0.11705780029296875, 0.12309074401855469, 0.12912368774414062, 0.13515663146972656, 0.1411895751953125, 0.14722251892089844, 0.15325546264648438, 0.1592884063720703, 0.16532135009765625, 0.1713542938232422, 0.17738723754882812, 0.18342018127441406, 0.189453125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 3.0, 7.0, 2.0, 5.0, 7.0, 4.0, 3.0, 12.0, 13.0, 16.0, 11.0, 22.0, 26.0, 23.0, 26.0, 31.0, 41.0, 40.0, 45.0, 43.0, 50.0, 46.0, 32.0, 45.0, 42.0, 44.0, 48.0, 42.0, 32.0, 33.0, 27.0, 29.0, 26.0, 21.0, 20.0, 16.0, 13.0, 13.0, 10.0, 11.0, 6.0, 4.0, 6.0, 2.0, 4.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.127685546875, -0.12273979187011719, -0.11779403686523438, -0.11284828186035156, -0.10790252685546875, -0.10295677185058594, -0.09801101684570312, -0.09306526184082031, -0.0881195068359375, -0.08317375183105469, -0.07822799682617188, -0.07328224182128906, -0.06833648681640625, -0.06339073181152344, -0.058444976806640625, -0.05349922180175781, -0.048553466796875, -0.04360771179199219, -0.038661956787109375, -0.03371620178222656, -0.02877044677734375, -0.023824691772460938, -0.018878936767578125, -0.013933181762695312, -0.0089874267578125, -0.0040416717529296875, 0.000904083251953125, 0.0058498382568359375, 0.01079559326171875, 0.015741348266601562, 0.020687103271484375, 0.025632858276367188, 0.03057861328125, 0.03552436828613281, 0.040470123291015625, 0.04541587829589844, 0.05036163330078125, 0.05530738830566406, 0.060253143310546875, 0.06519889831542969, 0.0701446533203125, 0.07509040832519531, 0.08003616333007812, 0.08498191833496094, 0.08992767333984375, 0.09487342834472656, 0.09981918334960938, 0.10476493835449219, 0.109710693359375, 0.11465644836425781, 0.11960220336914062, 0.12454795837402344, 0.12949371337890625, 0.13443946838378906, 0.13938522338867188, 0.1443309783935547, 0.1492767333984375, 0.1542224884033203, 0.15916824340820312, 0.16411399841308594, 0.16905975341796875, 0.17400550842285156, 0.17895126342773438, 0.1838970184326172, 0.1888427734375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 5.0, 13.0, 13.0, 17.0, 28.0, 53.0, 80.0, 102.0, 215.0, 325.0, 611.0, 1048.0, 2208.0, 4965.0, 13202.0, 39955.0, 142493.0, 467093.0, 269988.0, 70228.0, 21644.0, 7719.0, 3178.0, 1521.0, 755.0, 404.0, 235.0, 175.0, 94.0, 49.0, 39.0, 35.0, 16.0, 9.0, 10.0, 8.0, 3.0, 4.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09344482421875, -0.0904998779296875, -0.087554931640625, -0.0846099853515625, -0.0816650390625, -0.0787200927734375, -0.075775146484375, -0.0728302001953125, -0.06988525390625, -0.0669403076171875, -0.063995361328125, -0.0610504150390625, -0.05810546875, -0.0551605224609375, -0.052215576171875, -0.0492706298828125, -0.04632568359375, -0.0433807373046875, -0.040435791015625, -0.0374908447265625, -0.0345458984375, -0.0316009521484375, -0.028656005859375, -0.0257110595703125, -0.02276611328125, -0.0198211669921875, -0.016876220703125, -0.0139312744140625, -0.010986328125, -0.0080413818359375, -0.005096435546875, -0.0021514892578125, 0.00079345703125, 0.0037384033203125, 0.006683349609375, 0.0096282958984375, 0.0125732421875, 0.0155181884765625, 0.018463134765625, 0.0214080810546875, 0.02435302734375, 0.0272979736328125, 0.030242919921875, 0.0331878662109375, 0.0361328125, 0.0390777587890625, 0.042022705078125, 0.0449676513671875, 0.04791259765625, 0.0508575439453125, 0.053802490234375, 0.0567474365234375, 0.0596923828125, 0.0626373291015625, 0.065582275390625, 0.0685272216796875, 0.07147216796875, 0.0744171142578125, 0.077362060546875, 0.0803070068359375, 0.083251953125, 0.0861968994140625, 0.089141845703125, 0.0920867919921875, 0.09503173828125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 7.0, 3.0, 6.0, 6.0, 9.0, 9.0, 9.0, 16.0, 18.0, 25.0, 28.0, 37.0, 41.0, 33.0, 43.0, 42.0, 55.0, 68.0, 74.0, 58.0, 68.0, 71.0, 50.0, 56.0, 26.0, 17.0, 16.0, 19.0, 13.0, 20.0, 11.0, 8.0, 9.0, 5.0, 2.0, 5.0, 3.0, 1.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-6.93202018737793e-05, -6.743241101503372e-05, -6.554462015628815e-05, -6.365682929754257e-05, -6.1769038438797e-05, -5.988124758005142e-05, -5.799345672130585e-05, -5.610566586256027e-05, -5.42178750038147e-05, -5.233008414506912e-05, -5.044229328632355e-05, -4.855450242757797e-05, -4.66667115688324e-05, -4.477892071008682e-05, -4.289112985134125e-05, -4.100333899259567e-05, -3.91155481338501e-05, -3.722775727510452e-05, -3.533996641635895e-05, -3.345217555761337e-05, -3.15643846988678e-05, -2.9676593840122223e-05, -2.7788802981376648e-05, -2.5901012122631073e-05, -2.4013221263885498e-05, -2.2125430405139923e-05, -2.0237639546394348e-05, -1.8349848687648773e-05, -1.6462057828903198e-05, -1.4574266970157623e-05, -1.2686476111412048e-05, -1.0798685252666473e-05, -8.910894393920898e-06, -7.0231035351753235e-06, -5.1353126764297485e-06, -3.2475218176841736e-06, -1.3597309589385986e-06, 5.280598998069763e-07, 2.4158507585525513e-06, 4.303641617298126e-06, 6.191432476043701e-06, 8.079223334789276e-06, 9.967014193534851e-06, 1.1854805052280426e-05, 1.3742595911026001e-05, 1.5630386769771576e-05, 1.751817762851715e-05, 1.9405968487262726e-05, 2.12937593460083e-05, 2.3181550204753876e-05, 2.506934106349945e-05, 2.6957131922245026e-05, 2.88449227809906e-05, 3.0732713639736176e-05, 3.262050449848175e-05, 3.4508295357227325e-05, 3.63960862159729e-05, 3.8283877074718475e-05, 4.017166793346405e-05, 4.2059458792209625e-05, 4.39472496509552e-05, 4.5835040509700775e-05, 4.772283136844635e-05, 4.9610622227191925e-05, 5.14984130859375e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 5.0, 9.0, 6.0, 12.0, 12.0, 19.0, 25.0, 41.0, 37.0, 59.0, 89.0, 113.0, 224.0, 290.0, 505.0, 909.0, 1990.0, 4697.0, 14059.0, 55969.0, 301557.0, 525980.0, 105200.0, 23966.0, 6987.0, 2682.0, 1273.0, 670.0, 415.0, 241.0, 169.0, 80.0, 64.0, 47.0, 42.0, 31.0, 15.0, 14.0, 11.0, 9.0, 10.0, 1.0, 10.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 4.0], "bins": [-0.12347412109375, -0.11996650695800781, -0.11645889282226562, -0.11295127868652344, -0.10944366455078125, -0.10593605041503906, -0.10242843627929688, -0.09892082214355469, -0.0954132080078125, -0.09190559387207031, -0.08839797973632812, -0.08489036560058594, -0.08138275146484375, -0.07787513732910156, -0.07436752319335938, -0.07085990905761719, -0.067352294921875, -0.06384468078613281, -0.060337066650390625, -0.05682945251464844, -0.05332183837890625, -0.04981422424316406, -0.046306610107421875, -0.04279899597167969, -0.0392913818359375, -0.03578376770019531, -0.032276153564453125, -0.028768539428710938, -0.02526092529296875, -0.021753311157226562, -0.018245697021484375, -0.014738082885742188, -0.01123046875, -0.0077228546142578125, -0.004215240478515625, -0.0007076263427734375, 0.00279998779296875, 0.0063076019287109375, 0.009815216064453125, 0.013322830200195312, 0.0168304443359375, 0.020338058471679688, 0.023845672607421875, 0.027353286743164062, 0.03086090087890625, 0.03436851501464844, 0.037876129150390625, 0.04138374328613281, 0.044891357421875, 0.04839897155761719, 0.051906585693359375, 0.05541419982910156, 0.05892181396484375, 0.06242942810058594, 0.06593704223632812, 0.06944465637207031, 0.0729522705078125, 0.07645988464355469, 0.07996749877929688, 0.08347511291503906, 0.08698272705078125, 0.09049034118652344, 0.09399795532226562, 0.09750556945800781, 0.10101318359375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 6.0, 5.0, 1.0, 6.0, 7.0, 9.0, 7.0, 11.0, 13.0, 20.0, 24.0, 27.0, 32.0, 52.0, 61.0, 79.0, 114.0, 103.0, 74.0, 77.0, 61.0, 40.0, 43.0, 26.0, 22.0, 18.0, 18.0, 9.0, 5.0, 7.0, 7.0, 4.0, 4.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.08612060546875, -0.08360958099365234, -0.08109855651855469, -0.07858753204345703, -0.07607650756835938, -0.07356548309326172, -0.07105445861816406, -0.0685434341430664, -0.06603240966796875, -0.0635213851928711, -0.06101036071777344, -0.05849933624267578, -0.055988311767578125, -0.05347728729248047, -0.05096626281738281, -0.048455238342285156, -0.0459442138671875, -0.043433189392089844, -0.04092216491699219, -0.03841114044189453, -0.035900115966796875, -0.03338909149169922, -0.030878067016601562, -0.028367042541503906, -0.02585601806640625, -0.023344993591308594, -0.020833969116210938, -0.01832294464111328, -0.015811920166015625, -0.013300895690917969, -0.010789871215820312, -0.008278846740722656, -0.005767822265625, -0.0032567977905273438, -0.0007457733154296875, 0.0017652511596679688, 0.004276275634765625, 0.006787300109863281, 0.009298324584960938, 0.011809349060058594, 0.01432037353515625, 0.016831398010253906, 0.019342422485351562, 0.02185344696044922, 0.024364471435546875, 0.02687549591064453, 0.029386520385742188, 0.031897544860839844, 0.0344085693359375, 0.036919593811035156, 0.03943061828613281, 0.04194164276123047, 0.044452667236328125, 0.04696369171142578, 0.04947471618652344, 0.051985740661621094, 0.05449676513671875, 0.057007789611816406, 0.05951881408691406, 0.06202983856201172, 0.06454086303710938, 0.06705188751220703, 0.06956291198730469, 0.07207393646240234, 0.0745849609375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 16.0, 33.0, 64.0, 106.0, 162.0, 199.0, 166.0, 125.0, 77.0, 29.0, 13.0, 6.0, 3.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.8273568153381348, -2.7691216468811035, -2.7108867168426514, -2.65265154838562, -2.594416618347168, -2.5361814498901367, -2.4779465198516846, -2.4197113513946533, -2.361476421356201, -2.30324125289917, -2.2450063228607178, -2.1867711544036865, -2.1285362243652344, -2.070301055908203, -2.012066125869751, -1.9538309574127197, -1.8955957889556885, -1.8373607397079468, -1.779125690460205, -1.7208906412124634, -1.6626555919647217, -1.6044204235076904, -1.5461853742599487, -1.487950325012207, -1.4297152757644653, -1.3714802265167236, -1.313245177268982, -1.2550101280212402, -1.196774959564209, -1.1385400295257568, -1.0803048610687256, -1.0220698118209839, -0.9638346433639526, -0.9055995941162109, -0.8473645448684692, -0.7891294360160828, -0.7308943867683411, -0.6726593375205994, -0.6144242286682129, -0.5561891794204712, -0.4979541301727295, -0.4397190809249878, -0.3814840018749237, -0.3232489228248596, -0.2650138735771179, -0.20677882432937622, -0.14854374527931213, -0.09030866622924805, -0.03207361698150635, 0.026161447167396545, 0.08439651131629944, 0.14263157546520233, 0.20086663961410522, 0.2591016888618469, 0.317336767911911, 0.3755718469619751, 0.4338068962097168, 0.4920419454574585, 0.5502769947052002, 0.6085121035575867, 0.6667471528053284, 0.7249822020530701, 0.7832173109054565, 0.8414523601531982, 0.8996874094009399]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 4.0, 8.0, 3.0, 3.0, 7.0, 12.0, 10.0, 13.0, 9.0, 15.0, 18.0, 25.0, 16.0, 35.0, 30.0, 33.0, 31.0, 36.0, 31.0, 33.0, 47.0, 38.0, 48.0, 39.0, 50.0, 46.0, 45.0, 33.0, 35.0, 35.0, 28.0, 29.0, 32.0, 19.0, 25.0, 13.0, 12.0, 11.0, 14.0, 5.0, 7.0, 9.0, 4.0, 7.0, 4.0, 0.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8710747957229614, -0.8437668681144714, -0.8164590001106262, -0.7891510725021362, -0.761843204498291, -0.734535276889801, -0.707227349281311, -0.6799194812774658, -0.6526115536689758, -0.6253036260604858, -0.5979957580566406, -0.5706878304481506, -0.5433799028396606, -0.5160720348358154, -0.48876410722732544, -0.46145620942115784, -0.43414831161499023, -0.40684041380882263, -0.37953251600265503, -0.35222458839416504, -0.32491669058799744, -0.29760879278182983, -0.27030086517333984, -0.24299296736717224, -0.21568506956100464, -0.18837717175483704, -0.16106925904750824, -0.13376134634017944, -0.10645344853401184, -0.07914555072784424, -0.05183763802051544, -0.024529725313186646, 0.0027781128883361816, 0.03008601814508438, 0.05739392340183258, 0.08470182865858078, 0.11200973391532898, 0.13931763172149658, 0.16662554442882538, 0.19393345713615417, 0.22124135494232178, 0.24854925274848938, 0.275857150554657, 0.303165078163147, 0.3304729759693146, 0.3577808737754822, 0.38508880138397217, 0.41239669919013977, 0.4397045969963074, 0.467012494802475, 0.4943203926086426, 0.5216283202171326, 0.5489362478256226, 0.5762441158294678, 0.6035520434379578, 0.6308599710464478, 0.658167839050293, 0.685475766658783, 0.7127836346626282, 0.7400915622711182, 0.7673994302749634, 0.7947073578834534, 0.8220152854919434, 0.8493231534957886, 0.8766310811042786]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 18.0, 27.0, 59.0, 121.0, 211.0, 442.0, 903.0, 2288.0, 5734.0, 17072.0, 69986.0, 995012.0, 2983316.0, 87027.0, 20096.0, 6850.0, 2629.0, 1192.0, 539.0, 294.0, 162.0, 104.0, 54.0, 39.0, 31.0, 17.0, 14.0, 9.0, 10.0, 7.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1455078125, -0.13745498657226562, -0.12940216064453125, -0.12134933471679688, -0.1132965087890625, -0.10524368286132812, -0.09719085693359375, -0.08913803100585938, -0.081085205078125, -0.07303237915039062, -0.06497955322265625, -0.056926727294921875, -0.0488739013671875, -0.040821075439453125, -0.03276824951171875, -0.024715423583984375, -0.01666259765625, -0.008609771728515625, -0.00055694580078125, 0.007495880126953125, 0.0155487060546875, 0.023601531982421875, 0.03165435791015625, 0.039707183837890625, 0.047760009765625, 0.055812835693359375, 0.06386566162109375, 0.07191848754882812, 0.0799713134765625, 0.08802413940429688, 0.09607696533203125, 0.10412979125976562, 0.1121826171875, 0.12023544311523438, 0.12828826904296875, 0.13634109497070312, 0.1443939208984375, 0.15244674682617188, 0.16049957275390625, 0.16855239868164062, 0.176605224609375, 0.18465805053710938, 0.19271087646484375, 0.20076370239257812, 0.2088165283203125, 0.21686935424804688, 0.22492218017578125, 0.23297500610351562, 0.24102783203125, 0.24908065795898438, 0.25713348388671875, 0.2651863098144531, 0.2732391357421875, 0.2812919616699219, 0.28934478759765625, 0.2973976135253906, 0.305450439453125, 0.3135032653808594, 0.32155609130859375, 0.3296089172363281, 0.3376617431640625, 0.3457145690917969, 0.35376739501953125, 0.3618202209472656, 0.369873046875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 3.0, 2.0, 5.0, 2.0, 1.0, 5.0, 4.0, 8.0, 5.0, 16.0, 13.0, 11.0, 27.0, 22.0, 48.0, 52.0, 58.0, 52.0, 63.0, 57.0, 65.0, 68.0, 61.0, 59.0, 36.0, 38.0, 46.0, 34.0, 34.0, 25.0, 23.0, 11.0, 17.0, 3.0, 11.0, 7.0, 7.0, 2.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.040435791015625, -0.0391693115234375, -0.03790283203125, -0.0366363525390625, -0.035369873046875, -0.0341033935546875, -0.0328369140625, -0.0315704345703125, -0.030303955078125, -0.0290374755859375, -0.02777099609375, -0.0265045166015625, -0.025238037109375, -0.0239715576171875, -0.022705078125, -0.0214385986328125, -0.020172119140625, -0.0189056396484375, -0.01763916015625, -0.0163726806640625, -0.015106201171875, -0.0138397216796875, -0.0125732421875, -0.0113067626953125, -0.010040283203125, -0.0087738037109375, -0.00750732421875, -0.0062408447265625, -0.004974365234375, -0.0037078857421875, -0.00244140625, -0.0011749267578125, 9.1552734375e-05, 0.0013580322265625, 0.00262451171875, 0.0038909912109375, 0.005157470703125, 0.0064239501953125, 0.0076904296875, 0.0089569091796875, 0.010223388671875, 0.0114898681640625, 0.01275634765625, 0.0140228271484375, 0.015289306640625, 0.0165557861328125, 0.017822265625, 0.0190887451171875, 0.020355224609375, 0.0216217041015625, 0.02288818359375, 0.0241546630859375, 0.025421142578125, 0.0266876220703125, 0.0279541015625, 0.0292205810546875, 0.030487060546875, 0.0317535400390625, 0.03302001953125, 0.0342864990234375, 0.035552978515625, 0.0368194580078125, 0.0380859375, 0.0393524169921875, 0.040618896484375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 11.0, 8.0, 15.0, 16.0, 17.0, 38.0, 34.0, 75.0, 86.0, 140.0, 266.0, 743.0, 4020.0, 44639.0, 3596365.0, 526015.0, 18345.0, 2230.0, 549.0, 236.0, 150.0, 103.0, 46.0, 40.0, 27.0, 17.0, 12.0, 8.0, 12.0, 8.0, 3.0, 3.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57470703125, -0.5582084655761719, -0.5417098999023438, -0.5252113342285156, -0.5087127685546875, -0.4922142028808594, -0.47571563720703125, -0.4592170715332031, -0.442718505859375, -0.4262199401855469, -0.40972137451171875, -0.3932228088378906, -0.3767242431640625, -0.3602256774902344, -0.34372711181640625, -0.3272285461425781, -0.31072998046875, -0.2942314147949219, -0.27773284912109375, -0.2612342834472656, -0.2447357177734375, -0.22823715209960938, -0.21173858642578125, -0.19524002075195312, -0.178741455078125, -0.16224288940429688, -0.14574432373046875, -0.12924575805664062, -0.1127471923828125, -0.09624862670898438, -0.07975006103515625, -0.06325149536132812, -0.0467529296875, -0.030254364013671875, -0.01375579833984375, 0.002742767333984375, 0.0192413330078125, 0.035739898681640625, 0.05223846435546875, 0.06873703002929688, 0.085235595703125, 0.10173416137695312, 0.11823272705078125, 0.13473129272460938, 0.1512298583984375, 0.16772842407226562, 0.18422698974609375, 0.20072555541992188, 0.21722412109375, 0.23372268676757812, 0.25022125244140625, 0.2667198181152344, 0.2832183837890625, 0.2997169494628906, 0.31621551513671875, 0.3327140808105469, 0.349212646484375, 0.3657112121582031, 0.38220977783203125, 0.3987083435058594, 0.4152069091796875, 0.4317054748535156, 0.44820404052734375, 0.4647026062011719, 0.481201171875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 1.0, 4.0, 10.0, 15.0, 46.0, 77.0, 162.0, 521.0, 2295.0, 589.0, 200.0, 72.0, 45.0, 24.0, 9.0, 6.0, 6.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1575927734375, -0.1528949737548828, -0.14819717407226562, -0.14349937438964844, -0.13880157470703125, -0.13410377502441406, -0.12940597534179688, -0.12470817565917969, -0.1200103759765625, -0.11531257629394531, -0.11061477661132812, -0.10591697692871094, -0.10121917724609375, -0.09652137756347656, -0.09182357788085938, -0.08712577819824219, -0.082427978515625, -0.07773017883300781, -0.07303237915039062, -0.06833457946777344, -0.06363677978515625, -0.05893898010253906, -0.054241180419921875, -0.04954338073730469, -0.0448455810546875, -0.04014778137207031, -0.035449981689453125, -0.030752182006835938, -0.02605438232421875, -0.021356582641601562, -0.016658782958984375, -0.011960983276367188, -0.00726318359375, -0.0025653839111328125, 0.002132415771484375, 0.0068302154541015625, 0.01152801513671875, 0.016225814819335938, 0.020923614501953125, 0.025621414184570312, 0.0303192138671875, 0.03501701354980469, 0.039714813232421875, 0.04441261291503906, 0.04911041259765625, 0.05380821228027344, 0.058506011962890625, 0.06320381164550781, 0.067901611328125, 0.07259941101074219, 0.07729721069335938, 0.08199501037597656, 0.08669281005859375, 0.09139060974121094, 0.09608840942382812, 0.10078620910644531, 0.1054840087890625, 0.11018180847167969, 0.11487960815429688, 0.11957740783691406, 0.12427520751953125, 0.12897300720214844, 0.13367080688476562, 0.1383686065673828, 0.14306640625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 23.0, 33.0, 86.0, 160.0, 228.0, 204.0, 132.0, 69.0, 38.0, 17.0, 10.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8907641768455505, -0.8672272562980652, -0.8436903357505798, -0.8201534152030945, -0.7966164946556091, -0.7730796337127686, -0.7495427131652832, -0.7260057926177979, -0.7024688720703125, -0.6789319515228271, -0.6553950309753418, -0.6318581104278564, -0.6083211898803711, -0.5847842693328857, -0.5612473487854004, -0.5377104878425598, -0.5141735076904297, -0.49063658714294434, -0.467099666595459, -0.44356274604797363, -0.42002585530281067, -0.3964889347553253, -0.37295201420783997, -0.349415123462677, -0.32587820291519165, -0.3023412823677063, -0.27880436182022095, -0.2552674412727356, -0.23173055052757263, -0.20819362998008728, -0.18465670943260193, -0.16111980378627777, -0.1375828981399536, -0.11404598504304886, -0.0905090719461441, -0.06697215139865875, -0.043435238301754, -0.019898325204849243, 0.0036385953426361084, 0.027175500988960266, 0.05071242153644562, 0.07424933463335037, 0.09778624773025513, 0.12132316827774048, 0.14486008882522583, 0.16839699447155, 0.19193391501903534, 0.2154708206653595, 0.23900774121284485, 0.2625446617603302, 0.28608158230781555, 0.3096184730529785, 0.33315539360046387, 0.3566923141479492, 0.38022923469543457, 0.4037661552429199, 0.4273030757904053, 0.4508399963378906, 0.474376916885376, 0.49791383743286133, 0.5214507579803467, 0.544987678527832, 0.5685245990753174, 0.592061460018158, 0.6155983805656433]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 6.0, 1.0, 6.0, 5.0, 7.0, 8.0, 8.0, 14.0, 15.0, 22.0, 25.0, 22.0, 33.0, 24.0, 24.0, 39.0, 36.0, 27.0, 41.0, 47.0, 39.0, 40.0, 45.0, 51.0, 36.0, 35.0, 31.0, 44.0, 33.0, 31.0, 29.0, 25.0, 23.0, 12.0, 26.0, 10.0, 17.0, 14.0, 20.0, 9.0, 8.0, 6.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20392996072769165, -0.19633793830871582, -0.18874591588974, -0.18115389347076416, -0.17356185615062714, -0.1659698337316513, -0.15837781131267548, -0.15078578889369965, -0.14319375157356262, -0.1356017291545868, -0.12800970673561096, -0.12041767686605453, -0.11282564699649811, -0.10523362457752228, -0.09764160215854645, -0.09004957973957062, -0.08245755732059479, -0.07486553490161896, -0.06727350503206253, -0.0596814826130867, -0.05208945646882057, -0.04449743032455444, -0.03690540790557861, -0.029313381761312485, -0.021721355617046356, -0.014129330404102802, -0.006537305191159248, 0.001054719090461731, 0.00864674523472786, 0.016238771378993988, 0.023830793797969818, 0.03142281994223595, 0.039014846086502075, 0.046606872230768204, 0.05419889837503433, 0.06179092079401016, 0.06938295066356659, 0.07697497308254242, 0.08456699550151825, 0.09215901792049408, 0.0997510477900505, 0.10734307020902634, 0.11493510007858276, 0.1225271224975586, 0.13011914491653442, 0.13771116733551025, 0.14530318975448608, 0.1528952270746231, 0.16048724949359894, 0.16807927191257477, 0.1756712943315506, 0.18326333165168762, 0.19085535407066345, 0.19844737648963928, 0.2060393989086151, 0.21363142132759094, 0.22122344374656677, 0.2288154661655426, 0.23640748858451843, 0.24399951100349426, 0.2515915334224701, 0.2591835856437683, 0.26677560806274414, 0.27436763048171997, 0.2819596529006958]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 12.0, 10.0, 19.0, 25.0, 17.0, 47.0, 61.0, 92.0, 166.0, 228.0, 428.0, 740.0, 1304.0, 2494.0, 4843.0, 9496.0, 20223.0, 44408.0, 98277.0, 212474.0, 316973.0, 181138.0, 82649.0, 37441.0, 17314.0, 8584.0, 4165.0, 2123.0, 1176.0, 640.0, 376.0, 207.0, 141.0, 87.0, 59.0, 35.0, 24.0, 12.0, 21.0, 10.0, 4.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11309814453125, -0.10896968841552734, -0.10484123229980469, -0.10071277618408203, -0.09658432006835938, -0.09245586395263672, -0.08832740783691406, -0.0841989517211914, -0.08007049560546875, -0.0759420394897461, -0.07181358337402344, -0.06768512725830078, -0.06355667114257812, -0.05942821502685547, -0.05529975891113281, -0.051171302795410156, -0.0470428466796875, -0.042914390563964844, -0.03878593444824219, -0.03465747833251953, -0.030529022216796875, -0.02640056610107422, -0.022272109985351562, -0.018143653869628906, -0.01401519775390625, -0.009886741638183594, -0.0057582855224609375, -0.0016298294067382812, 0.002498626708984375, 0.006627082824707031, 0.010755538940429688, 0.014883995056152344, 0.019012451171875, 0.023140907287597656, 0.027269363403320312, 0.03139781951904297, 0.035526275634765625, 0.03965473175048828, 0.04378318786621094, 0.047911643981933594, 0.05204010009765625, 0.056168556213378906, 0.06029701232910156, 0.06442546844482422, 0.06855392456054688, 0.07268238067626953, 0.07681083679199219, 0.08093929290771484, 0.0850677490234375, 0.08919620513916016, 0.09332466125488281, 0.09745311737060547, 0.10158157348632812, 0.10571002960205078, 0.10983848571777344, 0.1139669418334961, 0.11809539794921875, 0.1222238540649414, 0.12635231018066406, 0.13048076629638672, 0.13460922241210938, 0.13873767852783203, 0.1428661346435547, 0.14699459075927734, 0.151123046875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 2.0, 3.0, 6.0, 12.0, 10.0, 15.0, 17.0, 20.0, 24.0, 30.0, 36.0, 55.0, 49.0, 57.0, 47.0, 61.0, 56.0, 67.0, 62.0, 55.0, 46.0, 42.0, 29.0, 36.0, 36.0, 27.0, 15.0, 17.0, 15.0, 17.0, 6.0, 6.0, 7.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038604736328125, -0.03735780715942383, -0.036110877990722656, -0.034863948822021484, -0.03361701965332031, -0.03237009048461914, -0.03112316131591797, -0.029876232147216797, -0.028629302978515625, -0.027382373809814453, -0.02613544464111328, -0.02488851547241211, -0.023641586303710938, -0.022394657135009766, -0.021147727966308594, -0.019900798797607422, -0.01865386962890625, -0.017406940460205078, -0.016160011291503906, -0.014913082122802734, -0.013666152954101562, -0.01241922378540039, -0.011172294616699219, -0.009925365447998047, -0.008678436279296875, -0.007431507110595703, -0.006184577941894531, -0.004937648773193359, -0.0036907196044921875, -0.0024437904357910156, -0.0011968612670898438, 5.0067901611328125e-05, 0.0012969970703125, 0.002543926239013672, 0.0037908554077148438, 0.005037784576416016, 0.0062847137451171875, 0.007531642913818359, 0.008778572082519531, 0.010025501251220703, 0.011272430419921875, 0.012519359588623047, 0.013766288757324219, 0.01501321792602539, 0.016260147094726562, 0.017507076263427734, 0.018754005432128906, 0.020000934600830078, 0.02124786376953125, 0.022494792938232422, 0.023741722106933594, 0.024988651275634766, 0.026235580444335938, 0.02748250961303711, 0.02872943878173828, 0.029976367950439453, 0.031223297119140625, 0.0324702262878418, 0.03371715545654297, 0.03496408462524414, 0.03621101379394531, 0.037457942962646484, 0.038704872131347656, 0.03995180130004883, 0.04119873046875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 5.0, 1.0, 6.0, 12.0, 17.0, 10.0, 25.0, 27.0, 58.0, 54.0, 90.0, 113.0, 178.0, 240.0, 411.0, 619.0, 1116.0, 2203.0, 6317.0, 26066.0, 138888.0, 538963.0, 266168.0, 49662.0, 10396.0, 3232.0, 1417.0, 786.0, 444.0, 301.0, 207.0, 153.0, 91.0, 66.0, 64.0, 38.0, 26.0, 27.0, 18.0, 12.0, 12.0, 4.0, 4.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2420654296875, -0.23442840576171875, -0.2267913818359375, -0.21915435791015625, -0.211517333984375, -0.20388031005859375, -0.1962432861328125, -0.18860626220703125, -0.18096923828125, -0.17333221435546875, -0.1656951904296875, -0.15805816650390625, -0.150421142578125, -0.14278411865234375, -0.1351470947265625, -0.12751007080078125, -0.119873046875, -0.11223602294921875, -0.1045989990234375, -0.09696197509765625, -0.089324951171875, -0.08168792724609375, -0.0740509033203125, -0.06641387939453125, -0.05877685546875, -0.05113983154296875, -0.0435028076171875, -0.03586578369140625, -0.028228759765625, -0.02059173583984375, -0.0129547119140625, -0.00531768798828125, 0.0023193359375, 0.00995635986328125, 0.0175933837890625, 0.02523040771484375, 0.032867431640625, 0.04050445556640625, 0.0481414794921875, 0.05577850341796875, 0.06341552734375, 0.07105255126953125, 0.0786895751953125, 0.08632659912109375, 0.093963623046875, 0.10160064697265625, 0.1092376708984375, 0.11687469482421875, 0.12451171875, 0.13214874267578125, 0.1397857666015625, 0.14742279052734375, 0.155059814453125, 0.16269683837890625, 0.1703338623046875, 0.17797088623046875, 0.18560791015625, 0.19324493408203125, 0.2008819580078125, 0.20851898193359375, 0.216156005859375, 0.22379302978515625, 0.2314300537109375, 0.23906707763671875, 0.2467041015625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 8.0, 11.0, 11.0, 9.0, 15.0, 12.0, 12.0, 19.0, 26.0, 33.0, 25.0, 35.0, 43.0, 46.0, 38.0, 41.0, 51.0, 42.0, 38.0, 43.0, 50.0, 49.0, 44.0, 39.0, 39.0, 27.0, 27.0, 28.0, 22.0, 26.0, 18.0, 18.0, 12.0, 13.0, 8.0, 8.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1285400390625, -0.12342453002929688, -0.11830902099609375, -0.11319351196289062, -0.1080780029296875, -0.10296249389648438, -0.09784698486328125, -0.09273147583007812, -0.087615966796875, -0.08250045776367188, -0.07738494873046875, -0.07226943969726562, -0.0671539306640625, -0.062038421630859375, -0.05692291259765625, -0.051807403564453125, -0.04669189453125, -0.041576385498046875, -0.03646087646484375, -0.031345367431640625, -0.0262298583984375, -0.021114349365234375, -0.01599884033203125, -0.010883331298828125, -0.005767822265625, -0.000652313232421875, 0.00446319580078125, 0.009578704833984375, 0.0146942138671875, 0.019809722900390625, 0.02492523193359375, 0.030040740966796875, 0.03515625, 0.040271759033203125, 0.04538726806640625, 0.050502777099609375, 0.0556182861328125, 0.060733795166015625, 0.06584930419921875, 0.07096481323242188, 0.076080322265625, 0.08119583129882812, 0.08631134033203125, 0.09142684936523438, 0.0965423583984375, 0.10165786743164062, 0.10677337646484375, 0.11188888549804688, 0.11700439453125, 0.12211990356445312, 0.12723541259765625, 0.13235092163085938, 0.1374664306640625, 0.14258193969726562, 0.14769744873046875, 0.15281295776367188, 0.157928466796875, 0.16304397583007812, 0.16815948486328125, 0.17327499389648438, 0.1783905029296875, 0.18350601196289062, 0.18862152099609375, 0.19373703002929688, 0.1988525390625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 7.0, 4.0, 5.0, 3.0, 4.0, 11.0, 16.0, 27.0, 30.0, 48.0, 94.0, 159.0, 251.0, 421.0, 839.0, 1734.0, 4086.0, 10713.0, 39454.0, 294686.0, 594216.0, 74596.0, 16749.0, 5556.0, 2424.0, 1064.0, 580.0, 328.0, 165.0, 98.0, 61.0, 41.0, 28.0, 19.0, 17.0, 12.0, 10.0, 4.0, 0.0, 0.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13916015625, -0.1345500946044922, -0.12994003295898438, -0.12532997131347656, -0.12071990966796875, -0.11610984802246094, -0.11149978637695312, -0.10688972473144531, -0.1022796630859375, -0.09766960144042969, -0.09305953979492188, -0.08844947814941406, -0.08383941650390625, -0.07922935485839844, -0.07461929321289062, -0.07000923156738281, -0.065399169921875, -0.06078910827636719, -0.056179046630859375, -0.05156898498535156, -0.04695892333984375, -0.04234886169433594, -0.037738800048828125, -0.03312873840332031, -0.0285186767578125, -0.023908615112304688, -0.019298553466796875, -0.014688491821289062, -0.01007843017578125, -0.0054683685302734375, -0.000858306884765625, 0.0037517547607421875, 0.00836181640625, 0.012971878051757812, 0.017581939697265625, 0.022192001342773438, 0.02680206298828125, 0.03141212463378906, 0.036022186279296875, 0.04063224792480469, 0.0452423095703125, 0.04985237121582031, 0.054462432861328125, 0.05907249450683594, 0.06368255615234375, 0.06829261779785156, 0.07290267944335938, 0.07751274108886719, 0.082122802734375, 0.08673286437988281, 0.09134292602539062, 0.09595298767089844, 0.10056304931640625, 0.10517311096191406, 0.10978317260742188, 0.11439323425292969, 0.1190032958984375, 0.12361335754394531, 0.12822341918945312, 0.13283348083496094, 0.13744354248046875, 0.14205360412597656, 0.14666366577148438, 0.1512737274169922, 0.1558837890625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 4.0, 6.0, 10.0, 22.0, 22.0, 45.0, 56.0, 100.0, 160.0, 168.0, 127.0, 89.0, 58.0, 31.0, 24.0, 19.0, 15.0, 11.0, 11.0, 9.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011014938354492188, -0.0001056380569934845, -0.00010112673044204712, -9.661540389060974e-05, -9.210407733917236e-05, -8.759275078773499e-05, -8.308142423629761e-05, -7.857009768486023e-05, -7.405877113342285e-05, -6.954744458198547e-05, -6.50361180305481e-05, -6.052479147911072e-05, -5.601346492767334e-05, -5.150213837623596e-05, -4.6990811824798584e-05, -4.2479485273361206e-05, -3.796815872192383e-05, -3.345683217048645e-05, -2.8945505619049072e-05, -2.4434179067611694e-05, -1.9922852516174316e-05, -1.541152596473694e-05, -1.090019941329956e-05, -6.388872861862183e-06, -1.8775463104248047e-06, 2.6337802410125732e-06, 7.145106792449951e-06, 1.1656433343887329e-05, 1.6167759895324707e-05, 2.0679086446762085e-05, 2.5190412998199463e-05, 2.970173954963684e-05, 3.421306610107422e-05, 3.87243926525116e-05, 4.3235719203948975e-05, 4.774704575538635e-05, 5.225837230682373e-05, 5.676969885826111e-05, 6.128102540969849e-05, 6.579235196113586e-05, 7.030367851257324e-05, 7.481500506401062e-05, 7.9326331615448e-05, 8.383765816688538e-05, 8.834898471832275e-05, 9.286031126976013e-05, 9.737163782119751e-05, 0.00010188296437263489, 0.00010639429092407227, 0.00011090561747550964, 0.00011541694402694702, 0.0001199282705783844, 0.00012443959712982178, 0.00012895092368125916, 0.00013346225023269653, 0.0001379735767841339, 0.0001424849033355713, 0.00014699622988700867, 0.00015150755643844604, 0.00015601888298988342, 0.0001605302095413208, 0.00016504153609275818, 0.00016955286264419556, 0.00017406418919563293, 0.0001785755157470703]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 9.0, 9.0, 12.0, 10.0, 18.0, 14.0, 10.0, 28.0, 42.0, 82.0, 111.0, 198.0, 375.0, 882.0, 2413.0, 8577.0, 50753.0, 718695.0, 237277.0, 21362.0, 4837.0, 1511.0, 628.0, 282.0, 153.0, 77.0, 52.0, 38.0, 19.0, 25.0, 17.0, 8.0, 7.0, 4.0, 6.0, 1.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.206787109375, -0.20084190368652344, -0.19489669799804688, -0.1889514923095703, -0.18300628662109375, -0.1770610809326172, -0.17111587524414062, -0.16517066955566406, -0.1592254638671875, -0.15328025817871094, -0.14733505249023438, -0.1413898468017578, -0.13544464111328125, -0.1294994354248047, -0.12355422973632812, -0.11760902404785156, -0.111663818359375, -0.10571861267089844, -0.09977340698242188, -0.09382820129394531, -0.08788299560546875, -0.08193778991699219, -0.07599258422851562, -0.07004737854003906, -0.0641021728515625, -0.05815696716308594, -0.052211761474609375, -0.04626655578613281, -0.04032135009765625, -0.03437614440917969, -0.028430938720703125, -0.022485733032226562, -0.01654052734375, -0.010595321655273438, -0.004650115966796875, 0.0012950897216796875, 0.00724029541015625, 0.013185501098632812, 0.019130706787109375, 0.025075912475585938, 0.0310211181640625, 0.03696632385253906, 0.042911529541015625, 0.04885673522949219, 0.05480194091796875, 0.06074714660644531, 0.06669235229492188, 0.07263755798339844, 0.078582763671875, 0.08452796936035156, 0.09047317504882812, 0.09641838073730469, 0.10236358642578125, 0.10830879211425781, 0.11425399780273438, 0.12019920349121094, 0.1261444091796875, 0.13208961486816406, 0.13803482055664062, 0.1439800262451172, 0.14992523193359375, 0.1558704376220703, 0.16181564331054688, 0.16776084899902344, 0.1737060546875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 5.0, 6.0, 8.0, 12.0, 16.0, 16.0, 24.0, 36.0, 59.0, 86.0, 121.0, 170.0, 130.0, 91.0, 57.0, 40.0, 35.0, 25.0, 19.0, 11.0, 7.0, 6.0, 4.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09619140625, -0.09242057800292969, -0.08864974975585938, -0.08487892150878906, -0.08110809326171875, -0.07733726501464844, -0.07356643676757812, -0.06979560852050781, -0.0660247802734375, -0.06225395202636719, -0.058483123779296875, -0.05471229553222656, -0.05094146728515625, -0.04717063903808594, -0.043399810791015625, -0.03962898254394531, -0.035858154296875, -0.03208732604980469, -0.028316497802734375, -0.024545669555664062, -0.02077484130859375, -0.017004013061523438, -0.013233184814453125, -0.009462356567382812, -0.0056915283203125, -0.0019207000732421875, 0.001850128173828125, 0.0056209564208984375, 0.00939178466796875, 0.013162612915039062, 0.016933441162109375, 0.020704269409179688, 0.02447509765625, 0.028245925903320312, 0.032016754150390625, 0.03578758239746094, 0.03955841064453125, 0.04332923889160156, 0.047100067138671875, 0.05087089538574219, 0.0546417236328125, 0.05841255187988281, 0.062183380126953125, 0.06595420837402344, 0.06972503662109375, 0.07349586486816406, 0.07726669311523438, 0.08103752136230469, 0.084808349609375, 0.08857917785644531, 0.09235000610351562, 0.09612083435058594, 0.09989166259765625, 0.10366249084472656, 0.10743331909179688, 0.11120414733886719, 0.1149749755859375, 0.11874580383300781, 0.12251663208007812, 0.12628746032714844, 0.13005828857421875, 0.13382911682128906, 0.13759994506835938, 0.1413707733154297, 0.1451416015625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 1.0, 7.0, 6.0, 23.0, 37.0, 53.0, 114.0, 161.0, 166.0, 150.0, 109.0, 68.0, 64.0, 22.0, 15.0, 4.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.4324772357940674, -2.380523443222046, -2.3285698890686035, -2.276616096496582, -2.2246625423431396, -2.172708749771118, -2.120755195617676, -2.0688014030456543, -2.016847848892212, -1.96489417552948, -1.912940502166748, -1.8609868288040161, -1.8090331554412842, -1.7570793628692627, -1.7051258087158203, -1.6531720161437988, -1.6012182235717773, -1.5492645502090454, -1.4973108768463135, -1.4453572034835815, -1.3934035301208496, -1.3414497375488281, -1.2894961833953857, -1.2375423908233643, -1.1855888366699219, -1.13363516330719, -1.081681489944458, -1.029727816581726, -0.9777740836143494, -0.9258204102516174, -0.8738667368888855, -0.8219130039215088, -0.7699593305587769, -0.7180056571960449, -0.666051983833313, -0.614098310470581, -0.5621445775032043, -0.5101909041404724, -0.4582372307777405, -0.40628352761268616, -0.3543298542499542, -0.3023761808872223, -0.25042247772216797, -0.19846880435943604, -0.1465151160955429, -0.09456142783164978, -0.04260775446891785, 0.009345948696136475, 0.06129962205886841, 0.11325331032276154, 0.16520699858665466, 0.2171606719493866, 0.2691143751144409, 0.32106804847717285, 0.3730217218399048, 0.4249754250049591, 0.47692909836769104, 0.5288828015327454, 0.5808364748954773, 0.6327901482582092, 0.6847438216209412, 0.7366975545883179, 0.7886512279510498, 0.8406049013137817, 0.8925585746765137]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 5.0, 2.0, 6.0, 2.0, 10.0, 4.0, 8.0, 7.0, 13.0, 13.0, 18.0, 17.0, 28.0, 35.0, 26.0, 33.0, 42.0, 36.0, 45.0, 49.0, 57.0, 56.0, 55.0, 47.0, 47.0, 34.0, 46.0, 39.0, 51.0, 28.0, 22.0, 19.0, 20.0, 19.0, 19.0, 18.0, 6.0, 5.0, 10.0, 6.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.9482361078262329, -0.917751133441925, -0.8872660994529724, -0.8567811250686646, -0.8262961506843567, -0.7958111763000488, -0.7653261423110962, -0.7348411679267883, -0.7043561935424805, -0.6738712191581726, -0.64338618516922, -0.6129012107849121, -0.5824162364006042, -0.5519312620162964, -0.5214462280273438, -0.4909612536430359, -0.46047621965408325, -0.429991215467453, -0.39950624108314514, -0.3690212368965149, -0.33853626251220703, -0.3080512583255768, -0.27756625413894653, -0.24708126485347748, -0.21659627556800842, -0.18611128628253937, -0.1556262969970703, -0.12514129281044006, -0.09465630352497101, -0.06417131423950195, -0.033686310052871704, -0.003201320767402649, 0.027283668518066406, 0.05776866152882576, 0.08825365453958511, 0.11873865127563477, 0.14922364056110382, 0.17970862984657288, 0.21019363403320312, 0.24067862331867218, 0.27116361260414124, 0.3016486167907715, 0.33213359117507935, 0.3626185953617096, 0.39310359954833984, 0.4235885739326477, 0.45407357811927795, 0.4845585823059082, 0.5150435566902161, 0.5455285310745239, 0.5760135650634766, 0.6064985394477844, 0.6369835138320923, 0.6674685478210449, 0.6979535222053528, 0.7284384965896606, 0.7589235305786133, 0.7894085049629211, 0.8198935389518738, 0.8503785133361816, 0.8808634877204895, 0.9113484621047974, 0.94183349609375, 0.9723184704780579, 1.0028034448623657]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 10.0, 26.0, 24.0, 42.0, 58.0, 114.0, 163.0, 300.0, 472.0, 881.0, 1584.0, 3285.0, 7073.0, 18611.0, 58878.0, 285511.0, 3320282.0, 387927.0, 70881.0, 21519.0, 8224.0, 3669.0, 1934.0, 1042.0, 624.0, 360.0, 207.0, 166.0, 112.0, 83.0, 53.0, 29.0, 30.0, 18.0, 19.0, 13.0, 12.0, 13.0, 7.0, 5.0, 6.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1490478515625, -0.14364242553710938, -0.13823699951171875, -0.13283157348632812, -0.1274261474609375, -0.12202072143554688, -0.11661529541015625, -0.11120986938476562, -0.105804443359375, -0.10039901733398438, -0.09499359130859375, -0.08958816528320312, -0.0841827392578125, -0.07877731323242188, -0.07337188720703125, -0.06796646118164062, -0.06256103515625, -0.057155609130859375, -0.05175018310546875, -0.046344757080078125, -0.0409393310546875, -0.035533905029296875, -0.03012847900390625, -0.024723052978515625, -0.019317626953125, -0.013912200927734375, -0.00850677490234375, -0.003101348876953125, 0.0023040771484375, 0.007709503173828125, 0.01311492919921875, 0.018520355224609375, 0.02392578125, 0.029331207275390625, 0.03473663330078125, 0.040142059326171875, 0.0455474853515625, 0.050952911376953125, 0.05635833740234375, 0.061763763427734375, 0.067169189453125, 0.07257461547851562, 0.07798004150390625, 0.08338546752929688, 0.0887908935546875, 0.09419631958007812, 0.09960174560546875, 0.10500717163085938, 0.11041259765625, 0.11581802368164062, 0.12122344970703125, 0.12662887573242188, 0.1320343017578125, 0.13743972778320312, 0.14284515380859375, 0.14825057983398438, 0.153656005859375, 0.15906143188476562, 0.16446685791015625, 0.16987228393554688, 0.1752777099609375, 0.18068313598632812, 0.18608856201171875, 0.19149398803710938, 0.1968994140625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 5.0, 6.0, 8.0, 8.0, 4.0, 19.0, 21.0, 20.0, 16.0, 21.0, 46.0, 39.0, 43.0, 55.0, 65.0, 56.0, 66.0, 57.0, 57.0, 59.0, 48.0, 40.0, 39.0, 28.0, 35.0, 34.0, 22.0, 19.0, 16.0, 11.0, 8.0, 6.0, 4.0, 3.0, 8.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.037750244140625, -0.036501407623291016, -0.03525257110595703, -0.03400373458862305, -0.03275489807128906, -0.03150606155395508, -0.030257225036621094, -0.02900838851928711, -0.027759552001953125, -0.02651071548461914, -0.025261878967285156, -0.024013042449951172, -0.022764205932617188, -0.021515369415283203, -0.02026653289794922, -0.019017696380615234, -0.01776885986328125, -0.016520023345947266, -0.015271186828613281, -0.014022350311279297, -0.012773513793945312, -0.011524677276611328, -0.010275840759277344, -0.00902700424194336, -0.007778167724609375, -0.006529331207275391, -0.005280494689941406, -0.004031658172607422, -0.0027828216552734375, -0.0015339851379394531, -0.00028514862060546875, 0.0009636878967285156, 0.0022125244140625, 0.0034613609313964844, 0.004710197448730469, 0.005959033966064453, 0.0072078704833984375, 0.008456707000732422, 0.009705543518066406, 0.01095438003540039, 0.012203216552734375, 0.01345205307006836, 0.014700889587402344, 0.015949726104736328, 0.017198562622070312, 0.018447399139404297, 0.01969623565673828, 0.020945072174072266, 0.02219390869140625, 0.023442745208740234, 0.02469158172607422, 0.025940418243408203, 0.027189254760742188, 0.028438091278076172, 0.029686927795410156, 0.03093576431274414, 0.032184600830078125, 0.03343343734741211, 0.034682273864746094, 0.03593111038208008, 0.03717994689941406, 0.03842878341674805, 0.03967761993408203, 0.040926456451416016, 0.04217529296875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 9.0, 13.0, 17.0, 22.0, 39.0, 56.0, 110.0, 214.0, 554.0, 1772.0, 7431.0, 43930.0, 661852.0, 3342770.0, 115686.0, 14955.0, 3180.0, 924.0, 368.0, 160.0, 93.0, 40.0, 38.0, 16.0, 14.0, 8.0, 7.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.307861328125, -0.2976722717285156, -0.28748321533203125, -0.2772941589355469, -0.2671051025390625, -0.2569160461425781, -0.24672698974609375, -0.23653793334960938, -0.226348876953125, -0.21615982055664062, -0.20597076416015625, -0.19578170776367188, -0.1855926513671875, -0.17540359497070312, -0.16521453857421875, -0.15502548217773438, -0.14483642578125, -0.13464736938476562, -0.12445831298828125, -0.11426925659179688, -0.1040802001953125, -0.09389114379882812, -0.08370208740234375, -0.07351303100585938, -0.063323974609375, -0.053134918212890625, -0.04294586181640625, -0.032756805419921875, -0.0225677490234375, -0.012378692626953125, -0.00218963623046875, 0.007999420166015625, 0.0181884765625, 0.028377532958984375, 0.03856658935546875, 0.048755645751953125, 0.0589447021484375, 0.06913375854492188, 0.07932281494140625, 0.08951187133789062, 0.099700927734375, 0.10988998413085938, 0.12007904052734375, 0.13026809692382812, 0.1404571533203125, 0.15064620971679688, 0.16083526611328125, 0.17102432250976562, 0.18121337890625, 0.19140243530273438, 0.20159149169921875, 0.21178054809570312, 0.2219696044921875, 0.23215866088867188, 0.24234771728515625, 0.2525367736816406, 0.262725830078125, 0.2729148864746094, 0.28310394287109375, 0.2932929992675781, 0.3034820556640625, 0.3136711120605469, 0.32386016845703125, 0.3340492248535156, 0.34423828125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 6.0, 4.0, 14.0, 13.0, 25.0, 34.0, 65.0, 107.0, 162.0, 270.0, 603.0, 1398.0, 681.0, 303.0, 141.0, 89.0, 61.0, 27.0, 23.0, 22.0, 9.0, 9.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0908203125, -0.08739852905273438, -0.08397674560546875, -0.08055496215820312, -0.0771331787109375, -0.07371139526367188, -0.07028961181640625, -0.06686782836914062, -0.063446044921875, -0.060024261474609375, -0.05660247802734375, -0.053180694580078125, -0.0497589111328125, -0.046337127685546875, -0.04291534423828125, -0.039493560791015625, -0.03607177734375, -0.032649993896484375, -0.02922821044921875, -0.025806427001953125, -0.0223846435546875, -0.018962860107421875, -0.01554107666015625, -0.012119293212890625, -0.008697509765625, -0.005275726318359375, -0.00185394287109375, 0.001567840576171875, 0.0049896240234375, 0.008411407470703125, 0.01183319091796875, 0.015254974365234375, 0.0186767578125, 0.022098541259765625, 0.02552032470703125, 0.028942108154296875, 0.0323638916015625, 0.035785675048828125, 0.03920745849609375, 0.042629241943359375, 0.046051025390625, 0.049472808837890625, 0.05289459228515625, 0.056316375732421875, 0.0597381591796875, 0.06315994262695312, 0.06658172607421875, 0.07000350952148438, 0.07342529296875, 0.07684707641601562, 0.08026885986328125, 0.08369064331054688, 0.0871124267578125, 0.09053421020507812, 0.09395599365234375, 0.09737777709960938, 0.100799560546875, 0.10422134399414062, 0.10764312744140625, 0.11106491088867188, 0.1144866943359375, 0.11790847778320312, 0.12133026123046875, 0.12475204467773438, 0.128173828125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 7.0, 16.0, 16.0, 32.0, 57.0, 78.0, 110.0, 116.0, 121.0, 142.0, 89.0, 91.0, 47.0, 22.0, 24.0, 16.0, 9.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3080783784389496, -0.28831619024276733, -0.26855403184890747, -0.2487918585538864, -0.22902968525886536, -0.2092675119638443, -0.18950533866882324, -0.16974316537380219, -0.14998099207878113, -0.13021881878376007, -0.11045664548873901, -0.09069447219371796, -0.0709322988986969, -0.05117012560367584, -0.031407952308654785, -0.011645779013633728, 0.008116394281387329, 0.027878567576408386, 0.04764074087142944, 0.0674029141664505, 0.08716508746147156, 0.10692726075649261, 0.12668943405151367, 0.14645160734653473, 0.1662137806415558, 0.18597595393657684, 0.2057381272315979, 0.22550030052661896, 0.24526247382164001, 0.26502466201782227, 0.28478682041168213, 0.304548978805542, 0.32431113719940186, 0.3440732955932617, 0.36383548378944397, 0.3835976719856262, 0.4033598303794861, 0.42312198877334595, 0.4428841769695282, 0.46264636516571045, 0.4824085235595703, 0.5021706819534302, 0.52193284034729, 0.5416950583457947, 0.5614572167396545, 0.5812193751335144, 0.600981593132019, 0.6207437515258789, 0.6405059099197388, 0.6602680683135986, 0.6800302267074585, 0.6997924447059631, 0.719554603099823, 0.7393167614936829, 0.7590789794921875, 0.7788411378860474, 0.7986032962799072, 0.8183654546737671, 0.838127613067627, 0.8578898310661316, 0.8776519894599915, 0.8974141478538513, 0.917176365852356, 0.9369385242462158, 0.9567006826400757]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 4.0, 3.0, 10.0, 14.0, 13.0, 21.0, 21.0, 20.0, 30.0, 50.0, 47.0, 57.0, 44.0, 62.0, 67.0, 70.0, 64.0, 64.0, 59.0, 55.0, 42.0, 45.0, 27.0, 31.0, 25.0, 14.0, 11.0, 11.0, 8.0, 5.0, 7.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33771640062332153, -0.3237507939338684, -0.3097851574420929, -0.29581955075263977, -0.28185394406318665, -0.26788830757141113, -0.253922700881958, -0.2399570792913437, -0.22599145770072937, -0.21202583611011505, -0.19806022942066193, -0.1840946078300476, -0.1701289862394333, -0.15616336464881897, -0.14219775795936584, -0.12823213636875153, -0.1142665296792984, -0.10030091553926468, -0.08633529394865036, -0.07236967980861664, -0.05840406194329262, -0.0444384440779686, -0.030472829937934875, -0.016507208347320557, -0.0025415942072868347, 0.011424022726714611, 0.025389639660716057, 0.03935525566339493, 0.05332087352871895, 0.06728649139404297, 0.08125210553407669, 0.09521772712469101, 0.10918334126472473, 0.12314895540475845, 0.13711456954479218, 0.1510801911354065, 0.1650458127260208, 0.17901143431663513, 0.19297704100608826, 0.20694266259670258, 0.2209082841873169, 0.2348739057779312, 0.24883951246738434, 0.26280513405799866, 0.2767707407474518, 0.2907363772392273, 0.3047019839286804, 0.31866759061813354, 0.33263319730758667, 0.3465988039970398, 0.3605644404888153, 0.37453004717826843, 0.38849565386772156, 0.40246129035949707, 0.4164268970489502, 0.4303925037384033, 0.44435814023017883, 0.45832374691963196, 0.47228938341140747, 0.4862549901008606, 0.5002205967903137, 0.5141862034797668, 0.5281518697738647, 0.5421174764633179, 0.556083083152771]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 9.0, 9.0, 8.0, 13.0, 20.0, 28.0, 29.0, 71.0, 115.0, 246.0, 507.0, 1105.0, 2566.0, 6931.0, 19736.0, 60241.0, 214003.0, 509889.0, 160342.0, 47311.0, 15757.0, 5564.0, 2153.0, 938.0, 425.0, 224.0, 112.0, 78.0, 40.0, 25.0, 14.0, 14.0, 9.0, 4.0, 7.0, 7.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.282958984375, -0.27518463134765625, -0.2674102783203125, -0.25963592529296875, -0.251861572265625, -0.24408721923828125, -0.2363128662109375, -0.22853851318359375, -0.22076416015625, -0.21298980712890625, -0.2052154541015625, -0.19744110107421875, -0.189666748046875, -0.18189239501953125, -0.1741180419921875, -0.16634368896484375, -0.1585693359375, -0.15079498291015625, -0.1430206298828125, -0.13524627685546875, -0.127471923828125, -0.11969757080078125, -0.1119232177734375, -0.10414886474609375, -0.09637451171875, -0.08860015869140625, -0.0808258056640625, -0.07305145263671875, -0.065277099609375, -0.05750274658203125, -0.0497283935546875, -0.04195404052734375, -0.0341796875, -0.02640533447265625, -0.0186309814453125, -0.01085662841796875, -0.003082275390625, 0.00469207763671875, 0.0124664306640625, 0.02024078369140625, 0.02801513671875, 0.03578948974609375, 0.0435638427734375, 0.05133819580078125, 0.059112548828125, 0.06688690185546875, 0.0746612548828125, 0.08243560791015625, 0.0902099609375, 0.09798431396484375, 0.1057586669921875, 0.11353302001953125, 0.121307373046875, 0.12908172607421875, 0.1368560791015625, 0.14463043212890625, 0.15240478515625, 0.16017913818359375, 0.1679534912109375, 0.17572784423828125, 0.183502197265625, 0.19127655029296875, 0.1990509033203125, 0.20682525634765625, 0.214599609375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 6.0, 5.0, 5.0, 9.0, 8.0, 16.0, 18.0, 17.0, 23.0, 23.0, 35.0, 51.0, 43.0, 46.0, 67.0, 52.0, 57.0, 56.0, 49.0, 60.0, 46.0, 52.0, 42.0, 43.0, 30.0, 29.0, 24.0, 19.0, 13.0, 13.0, 9.0, 11.0, 9.0, 1.0, 5.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.040313720703125, -0.03907442092895508, -0.037835121154785156, -0.036595821380615234, -0.03535652160644531, -0.03411722183227539, -0.03287792205810547, -0.03163862228393555, -0.030399322509765625, -0.029160022735595703, -0.02792072296142578, -0.02668142318725586, -0.025442123413085938, -0.024202823638916016, -0.022963523864746094, -0.021724224090576172, -0.02048492431640625, -0.019245624542236328, -0.018006324768066406, -0.016767024993896484, -0.015527725219726562, -0.01428842544555664, -0.013049125671386719, -0.011809825897216797, -0.010570526123046875, -0.009331226348876953, -0.008091926574707031, -0.006852626800537109, -0.0056133270263671875, -0.004374027252197266, -0.0031347274780273438, -0.0018954277038574219, -0.0006561279296875, 0.0005831718444824219, 0.0018224716186523438, 0.0030617713928222656, 0.0043010711669921875, 0.005540370941162109, 0.006779670715332031, 0.008018970489501953, 0.009258270263671875, 0.010497570037841797, 0.011736869812011719, 0.01297616958618164, 0.014215469360351562, 0.015454769134521484, 0.016694068908691406, 0.017933368682861328, 0.01917266845703125, 0.020411968231201172, 0.021651268005371094, 0.022890567779541016, 0.024129867553710938, 0.02536916732788086, 0.02660846710205078, 0.027847766876220703, 0.029087066650390625, 0.030326366424560547, 0.03156566619873047, 0.03280496597290039, 0.03404426574707031, 0.035283565521240234, 0.036522865295410156, 0.03776216506958008, 0.03900146484375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 8.0, 6.0, 11.0, 12.0, 14.0, 25.0, 28.0, 52.0, 68.0, 94.0, 117.0, 219.0, 299.0, 541.0, 951.0, 1774.0, 4279.0, 12392.0, 44266.0, 185362.0, 553509.0, 180843.0, 43112.0, 12178.0, 4251.0, 1796.0, 900.0, 501.0, 284.0, 210.0, 150.0, 89.0, 48.0, 46.0, 32.0, 25.0, 21.0, 11.0, 9.0, 6.0, 3.0, 2.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2159423828125, -0.2088603973388672, -0.20177841186523438, -0.19469642639160156, -0.18761444091796875, -0.18053245544433594, -0.17345046997070312, -0.1663684844970703, -0.1592864990234375, -0.1522045135498047, -0.14512252807617188, -0.13804054260253906, -0.13095855712890625, -0.12387657165527344, -0.11679458618164062, -0.10971260070800781, -0.102630615234375, -0.09554862976074219, -0.08846664428710938, -0.08138465881347656, -0.07430267333984375, -0.06722068786621094, -0.060138702392578125, -0.05305671691894531, -0.0459747314453125, -0.03889274597167969, -0.031810760498046875, -0.024728775024414062, -0.01764678955078125, -0.010564804077148438, -0.003482818603515625, 0.0035991668701171875, 0.01068115234375, 0.017763137817382812, 0.024845123291015625, 0.03192710876464844, 0.03900909423828125, 0.04609107971191406, 0.053173065185546875, 0.06025505065917969, 0.0673370361328125, 0.07441902160644531, 0.08150100708007812, 0.08858299255371094, 0.09566497802734375, 0.10274696350097656, 0.10982894897460938, 0.11691093444824219, 0.123992919921875, 0.1310749053955078, 0.13815689086914062, 0.14523887634277344, 0.15232086181640625, 0.15940284729003906, 0.16648483276367188, 0.1735668182373047, 0.1806488037109375, 0.1877307891845703, 0.19481277465820312, 0.20189476013183594, 0.20897674560546875, 0.21605873107910156, 0.22314071655273438, 0.2302227020263672, 0.2373046875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 3.0, 2.0, 6.0, 5.0, 9.0, 7.0, 13.0, 10.0, 10.0, 15.0, 22.0, 24.0, 13.0, 24.0, 24.0, 22.0, 34.0, 24.0, 33.0, 41.0, 32.0, 41.0, 43.0, 53.0, 37.0, 37.0, 34.0, 46.0, 33.0, 33.0, 40.0, 37.0, 24.0, 18.0, 27.0, 15.0, 24.0, 15.0, 8.0, 13.0, 9.0, 9.0, 11.0, 6.0, 8.0, 2.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.162841796875, -0.15799713134765625, -0.1531524658203125, -0.14830780029296875, -0.143463134765625, -0.13861846923828125, -0.1337738037109375, -0.12892913818359375, -0.12408447265625, -0.11923980712890625, -0.1143951416015625, -0.10955047607421875, -0.104705810546875, -0.09986114501953125, -0.0950164794921875, -0.09017181396484375, -0.0853271484375, -0.08048248291015625, -0.0756378173828125, -0.07079315185546875, -0.065948486328125, -0.06110382080078125, -0.0562591552734375, -0.05141448974609375, -0.04656982421875, -0.04172515869140625, -0.0368804931640625, -0.03203582763671875, -0.027191162109375, -0.02234649658203125, -0.0175018310546875, -0.01265716552734375, -0.0078125, -0.00296783447265625, 0.0018768310546875, 0.00672149658203125, 0.011566162109375, 0.01641082763671875, 0.0212554931640625, 0.02610015869140625, 0.03094482421875, 0.03578948974609375, 0.0406341552734375, 0.04547882080078125, 0.050323486328125, 0.05516815185546875, 0.0600128173828125, 0.06485748291015625, 0.0697021484375, 0.07454681396484375, 0.0793914794921875, 0.08423614501953125, 0.089080810546875, 0.09392547607421875, 0.0987701416015625, 0.10361480712890625, 0.10845947265625, 0.11330413818359375, 0.1181488037109375, 0.12299346923828125, 0.127838134765625, 0.13268280029296875, 0.1375274658203125, 0.14237213134765625, 0.147216796875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 9.0, 6.0, 11.0, 19.0, 22.0, 33.0, 38.0, 72.0, 135.0, 236.0, 379.0, 834.0, 2468.0, 8476.0, 40733.0, 376184.0, 548576.0, 54579.0, 10622.0, 2994.0, 1069.0, 462.0, 223.0, 129.0, 78.0, 48.0, 32.0, 37.0, 18.0, 15.0, 2.0, 4.0, 5.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.263671875, -0.2570934295654297, -0.2505149841308594, -0.24393653869628906, -0.23735809326171875, -0.23077964782714844, -0.22420120239257812, -0.2176227569580078, -0.2110443115234375, -0.2044658660888672, -0.19788742065429688, -0.19130897521972656, -0.18473052978515625, -0.17815208435058594, -0.17157363891601562, -0.1649951934814453, -0.158416748046875, -0.1518383026123047, -0.14525985717773438, -0.13868141174316406, -0.13210296630859375, -0.12552452087402344, -0.11894607543945312, -0.11236763000488281, -0.1057891845703125, -0.09921073913574219, -0.09263229370117188, -0.08605384826660156, -0.07947540283203125, -0.07289695739746094, -0.06631851196289062, -0.05974006652832031, -0.05316162109375, -0.04658317565917969, -0.040004730224609375, -0.03342628479003906, -0.02684783935546875, -0.020269393920898438, -0.013690948486328125, -0.0071125030517578125, -0.0005340576171875, 0.0060443878173828125, 0.012622833251953125, 0.019201278686523438, 0.02577972412109375, 0.03235816955566406, 0.038936614990234375, 0.04551506042480469, 0.052093505859375, 0.05867195129394531, 0.06525039672851562, 0.07182884216308594, 0.07840728759765625, 0.08498573303222656, 0.09156417846679688, 0.09814262390136719, 0.1047210693359375, 0.11129951477050781, 0.11787796020507812, 0.12445640563964844, 0.13103485107421875, 0.13761329650878906, 0.14419174194335938, 0.1507701873779297, 0.1573486328125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 6.0, 5.0, 9.0, 12.0, 26.0, 45.0, 52.0, 95.0, 100.0, 106.0, 117.0, 114.0, 81.0, 75.0, 39.0, 31.0, 33.0, 18.0, 8.0, 10.0, 10.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0001481771469116211, -0.00014439597725868225, -0.0001406148076057434, -0.00013683363795280457, -0.00013305246829986572, -0.00012927129864692688, -0.00012549012899398804, -0.0001217089593410492, -0.00011792778968811035, -0.00011414662003517151, -0.00011036545038223267, -0.00010658428072929382, -0.00010280311107635498, -9.902194142341614e-05, -9.52407717704773e-05, -9.145960211753845e-05, -8.767843246459961e-05, -8.389726281166077e-05, -8.011609315872192e-05, -7.633492350578308e-05, -7.255375385284424e-05, -6.87725841999054e-05, -6.499141454696655e-05, -6.121024489402771e-05, -5.742907524108887e-05, -5.3647905588150024e-05, -4.986673593521118e-05, -4.608556628227234e-05, -4.2304396629333496e-05, -3.852322697639465e-05, -3.474205732345581e-05, -3.096088767051697e-05, -2.7179718017578125e-05, -2.3398548364639282e-05, -1.961737871170044e-05, -1.5836209058761597e-05, -1.2055039405822754e-05, -8.273869752883911e-06, -4.492700099945068e-06, -7.115304470062256e-07, 3.069639205932617e-06, 6.85080885887146e-06, 1.0631978511810303e-05, 1.4413148164749146e-05, 1.8194317817687988e-05, 2.197548747062683e-05, 2.5756657123565674e-05, 2.9537826776504517e-05, 3.331899642944336e-05, 3.71001660823822e-05, 4.0881335735321045e-05, 4.466250538825989e-05, 4.844367504119873e-05, 5.222484469413757e-05, 5.6006014347076416e-05, 5.978718400001526e-05, 6.35683536529541e-05, 6.734952330589294e-05, 7.113069295883179e-05, 7.491186261177063e-05, 7.869303226470947e-05, 8.247420191764832e-05, 8.625537157058716e-05, 9.0036541223526e-05, 9.381771087646484e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 3.0, 2.0, 8.0, 3.0, 7.0, 7.0, 15.0, 14.0, 13.0, 21.0, 33.0, 46.0, 91.0, 100.0, 179.0, 331.0, 577.0, 1237.0, 2894.0, 8454.0, 31411.0, 176072.0, 672187.0, 119429.0, 23825.0, 6719.0, 2371.0, 1132.0, 550.0, 292.0, 181.0, 111.0, 74.0, 56.0, 32.0, 22.0, 13.0, 13.0, 8.0, 2.0, 8.0, 6.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1781005859375, -0.17292404174804688, -0.16774749755859375, -0.16257095336914062, -0.1573944091796875, -0.15221786499023438, -0.14704132080078125, -0.14186477661132812, -0.136688232421875, -0.13151168823242188, -0.12633514404296875, -0.12115859985351562, -0.1159820556640625, -0.11080551147460938, -0.10562896728515625, -0.10045242309570312, -0.09527587890625, -0.09009933471679688, -0.08492279052734375, -0.07974624633789062, -0.0745697021484375, -0.06939315795898438, -0.06421661376953125, -0.059040069580078125, -0.053863525390625, -0.048686981201171875, -0.04351043701171875, -0.038333892822265625, -0.0331573486328125, -0.027980804443359375, -0.02280426025390625, -0.017627716064453125, -0.012451171875, -0.007274627685546875, -0.00209808349609375, 0.003078460693359375, 0.0082550048828125, 0.013431549072265625, 0.01860809326171875, 0.023784637451171875, 0.028961181640625, 0.034137725830078125, 0.03931427001953125, 0.044490814208984375, 0.0496673583984375, 0.054843902587890625, 0.06002044677734375, 0.06519699096679688, 0.07037353515625, 0.07555007934570312, 0.08072662353515625, 0.08590316772460938, 0.0910797119140625, 0.09625625610351562, 0.10143280029296875, 0.10660934448242188, 0.111785888671875, 0.11696243286132812, 0.12213897705078125, 0.12731552124023438, 0.1324920654296875, 0.13766860961914062, 0.14284515380859375, 0.14802169799804688, 0.1531982421875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 2.0, 5.0, 4.0, 9.0, 8.0, 12.0, 15.0, 24.0, 29.0, 36.0, 58.0, 84.0, 120.0, 131.0, 141.0, 66.0, 77.0, 55.0, 29.0, 14.0, 15.0, 19.0, 11.0, 3.0, 6.0, 6.0, 7.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.11083984375, -0.10721302032470703, -0.10358619689941406, -0.0999593734741211, -0.09633255004882812, -0.09270572662353516, -0.08907890319824219, -0.08545207977294922, -0.08182525634765625, -0.07819843292236328, -0.07457160949707031, -0.07094478607177734, -0.06731796264648438, -0.0636911392211914, -0.06006431579589844, -0.05643749237060547, -0.0528106689453125, -0.04918384552001953, -0.04555702209472656, -0.041930198669433594, -0.038303375244140625, -0.034676551818847656, -0.031049728393554688, -0.02742290496826172, -0.02379608154296875, -0.02016925811767578, -0.016542434692382812, -0.012915611267089844, -0.009288787841796875, -0.005661964416503906, -0.0020351409912109375, 0.0015916824340820312, 0.005218505859375, 0.008845329284667969, 0.012472152709960938, 0.016098976135253906, 0.019725799560546875, 0.023352622985839844, 0.026979446411132812, 0.03060626983642578, 0.03423309326171875, 0.03785991668701172, 0.04148674011230469, 0.045113563537597656, 0.048740386962890625, 0.052367210388183594, 0.05599403381347656, 0.05962085723876953, 0.0632476806640625, 0.06687450408935547, 0.07050132751464844, 0.0741281509399414, 0.07775497436523438, 0.08138179779052734, 0.08500862121582031, 0.08863544464111328, 0.09226226806640625, 0.09588909149169922, 0.09951591491699219, 0.10314273834228516, 0.10676956176757812, 0.1103963851928711, 0.11402320861816406, 0.11765003204345703, 0.12127685546875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 8.0, 9.0, 21.0, 25.0, 44.0, 74.0, 112.0, 152.0, 130.0, 134.0, 107.0, 73.0, 61.0, 24.0, 20.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.013060450553894, -0.9616141319274902, -0.9101678133010864, -0.8587214946746826, -0.8072751760482788, -0.755828857421875, -0.704382598400116, -0.6529362797737122, -0.6014899611473083, -0.5500436425209045, -0.49859732389450073, -0.4471510350704193, -0.3957047164440155, -0.3442583978176117, -0.2928121089935303, -0.24136579036712646, -0.18991947174072266, -0.13847315311431885, -0.08702684938907623, -0.03558054566383362, 0.01586577296257019, 0.067312091588974, 0.11875838041305542, 0.17020469903945923, 0.22165101766586304, 0.27309733629226685, 0.32454365491867065, 0.3759899437427521, 0.4274362623691559, 0.4788825809955597, 0.5303288698196411, 0.5817751884460449, 0.6332216262817383, 0.6846679449081421, 0.7361142635345459, 0.7875605821609497, 0.8390069007873535, 0.8904532194137573, 0.9418994784355164, 0.9933457970619202, 1.0447921752929688, 1.0962384939193726, 1.1476848125457764, 1.1991311311721802, 1.250577449798584, 1.3020237684249878, 1.3534700870513916, 1.4049162864685059, 1.4563626050949097, 1.5078089237213135, 1.5592552423477173, 1.610701560974121, 1.662147879600525, 1.7135941982269287, 1.765040397644043, 1.8164868354797363, 1.8679330348968506, 1.9193793535232544, 1.9708256721496582, 2.0222718715667725, 2.073718309402466, 2.12516450881958, 2.1766109466552734, 2.2280571460723877, 2.279503583908081]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 7.0, 6.0, 9.0, 7.0, 19.0, 13.0, 22.0, 22.0, 26.0, 24.0, 25.0, 35.0, 48.0, 45.0, 42.0, 42.0, 46.0, 45.0, 42.0, 53.0, 48.0, 44.0, 41.0, 43.0, 33.0, 34.0, 20.0, 20.0, 27.0, 26.0, 14.0, 19.0, 8.0, 7.0, 8.0, 5.0, 4.0, 3.0, 6.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.1023151874542236, -1.0700024366378784, -1.0376896858215332, -1.005376935005188, -0.9730641841888428, -0.9407514333724976, -0.9084386825561523, -0.8761259317398071, -0.8438131809234619, -0.8115004301071167, -0.7791876792907715, -0.7468749284744263, -0.714562177658081, -0.6822494268417358, -0.6499366760253906, -0.6176239252090454, -0.5853111743927002, -0.552998423576355, -0.5206856727600098, -0.48837292194366455, -0.45606017112731934, -0.4237474203109741, -0.3914346694946289, -0.3591219186782837, -0.3268091678619385, -0.29449641704559326, -0.26218366622924805, -0.22987091541290283, -0.19755816459655762, -0.1652454137802124, -0.1329326629638672, -0.10061991214752197, -0.06830722093582153, -0.03599447011947632, -0.0036817193031311035, 0.02863103151321411, 0.060943782329559326, 0.09325653314590454, 0.12556928396224976, 0.15788203477859497, 0.19019478559494019, 0.2225075364112854, 0.2548202872276306, 0.28713303804397583, 0.31944578886032104, 0.35175853967666626, 0.3840712904930115, 0.4163840413093567, 0.4486967921257019, 0.4810095429420471, 0.5133222937583923, 0.5456350445747375, 0.5779477953910828, 0.610260546207428, 0.6425732970237732, 0.6748860478401184, 0.7071987986564636, 0.7395115494728088, 0.771824300289154, 0.8041370511054993, 0.8364498019218445, 0.8687625527381897, 0.9010753035545349, 0.9333880543708801, 0.9657008051872253]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 5.0, 17.0, 17.0, 32.0, 60.0, 96.0, 175.0, 310.0, 517.0, 1014.0, 2019.0, 4515.0, 11522.0, 32203.0, 123558.0, 2606621.0, 1257733.0, 105081.0, 29285.0, 10506.0, 4404.0, 2023.0, 1083.0, 593.0, 313.0, 200.0, 129.0, 62.0, 57.0, 36.0, 25.0, 13.0, 18.0, 10.0, 7.0, 7.0, 5.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1392822265625, -0.1334667205810547, -0.12765121459960938, -0.12183570861816406, -0.11602020263671875, -0.11020469665527344, -0.10438919067382812, -0.09857368469238281, -0.0927581787109375, -0.08694267272949219, -0.08112716674804688, -0.07531166076660156, -0.06949615478515625, -0.06368064880371094, -0.057865142822265625, -0.05204963684082031, -0.046234130859375, -0.04041862487792969, -0.034603118896484375, -0.028787612915039062, -0.02297210693359375, -0.017156600952148438, -0.011341094970703125, -0.0055255889892578125, 0.0002899169921875, 0.0061054229736328125, 0.011920928955078125, 0.017736434936523438, 0.02355194091796875, 0.029367446899414062, 0.035182952880859375, 0.04099845886230469, 0.04681396484375, 0.05262947082519531, 0.058444976806640625, 0.06426048278808594, 0.07007598876953125, 0.07589149475097656, 0.08170700073242188, 0.08752250671386719, 0.0933380126953125, 0.09915351867675781, 0.10496902465820312, 0.11078453063964844, 0.11660003662109375, 0.12241554260253906, 0.12823104858398438, 0.1340465545654297, 0.139862060546875, 0.1456775665283203, 0.15149307250976562, 0.15730857849121094, 0.16312408447265625, 0.16893959045410156, 0.17475509643554688, 0.1805706024169922, 0.1863861083984375, 0.1922016143798828, 0.19801712036132812, 0.20383262634277344, 0.20964813232421875, 0.21546363830566406, 0.22127914428710938, 0.2270946502685547, 0.23291015625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 5.0, 5.0, 6.0, 12.0, 17.0, 23.0, 21.0, 30.0, 32.0, 39.0, 33.0, 43.0, 47.0, 44.0, 44.0, 63.0, 51.0, 51.0, 51.0, 52.0, 59.0, 57.0, 33.0, 23.0, 32.0, 25.0, 28.0, 11.0, 17.0, 6.0, 8.0, 7.0, 5.0, 4.0, 2.0, 2.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.038116455078125, -0.0368194580078125, -0.0355224609375, -0.0342254638671875, -0.032928466796875, -0.0316314697265625, -0.03033447265625, -0.0290374755859375, -0.027740478515625, -0.0264434814453125, -0.025146484375, -0.0238494873046875, -0.022552490234375, -0.0212554931640625, -0.01995849609375, -0.0186614990234375, -0.017364501953125, -0.0160675048828125, -0.0147705078125, -0.0134735107421875, -0.012176513671875, -0.0108795166015625, -0.00958251953125, -0.0082855224609375, -0.006988525390625, -0.0056915283203125, -0.00439453125, -0.0030975341796875, -0.001800537109375, -0.0005035400390625, 0.00079345703125, 0.0020904541015625, 0.003387451171875, 0.0046844482421875, 0.0059814453125, 0.0072784423828125, 0.008575439453125, 0.0098724365234375, 0.01116943359375, 0.0124664306640625, 0.013763427734375, 0.0150604248046875, 0.016357421875, 0.0176544189453125, 0.018951416015625, 0.0202484130859375, 0.02154541015625, 0.0228424072265625, 0.024139404296875, 0.0254364013671875, 0.0267333984375, 0.0280303955078125, 0.029327392578125, 0.0306243896484375, 0.03192138671875, 0.0332183837890625, 0.034515380859375, 0.0358123779296875, 0.037109375, 0.0384063720703125, 0.039703369140625, 0.0410003662109375, 0.04229736328125, 0.0435943603515625, 0.044891357421875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 3.0, 7.0, 8.0, 9.0, 20.0, 37.0, 42.0, 58.0, 122.0, 179.0, 372.0, 674.0, 1322.0, 3025.0, 7970.0, 23750.0, 89832.0, 661728.0, 3130213.0, 207699.0, 44761.0, 13497.0, 4926.0, 2022.0, 909.0, 473.0, 244.0, 145.0, 75.0, 63.0, 37.0, 20.0, 14.0, 6.0, 7.0, 7.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.305908203125, -0.2983074188232422, -0.2907066345214844, -0.28310585021972656, -0.27550506591796875, -0.26790428161621094, -0.2603034973144531, -0.2527027130126953, -0.2451019287109375, -0.2375011444091797, -0.22990036010742188, -0.22229957580566406, -0.21469879150390625, -0.20709800720214844, -0.19949722290039062, -0.1918964385986328, -0.184295654296875, -0.1766948699951172, -0.16909408569335938, -0.16149330139160156, -0.15389251708984375, -0.14629173278808594, -0.13869094848632812, -0.1310901641845703, -0.1234893798828125, -0.11588859558105469, -0.10828781127929688, -0.10068702697753906, -0.09308624267578125, -0.08548545837402344, -0.07788467407226562, -0.07028388977050781, -0.06268310546875, -0.05508232116699219, -0.047481536865234375, -0.03988075256347656, -0.03227996826171875, -0.024679183959960938, -0.017078399658203125, -0.009477615356445312, -0.0018768310546875, 0.0057239532470703125, 0.013324737548828125, 0.020925521850585938, 0.02852630615234375, 0.03612709045410156, 0.043727874755859375, 0.05132865905761719, 0.058929443359375, 0.06653022766113281, 0.07413101196289062, 0.08173179626464844, 0.08933258056640625, 0.09693336486816406, 0.10453414916992188, 0.11213493347167969, 0.1197357177734375, 0.1273365020751953, 0.13493728637695312, 0.14253807067871094, 0.15013885498046875, 0.15773963928222656, 0.16534042358398438, 0.1729412078857422, 0.1805419921875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 8.0, 4.0, 12.0, 15.0, 17.0, 15.0, 26.0, 32.0, 53.0, 58.0, 120.0, 189.0, 328.0, 793.0, 1243.0, 421.0, 241.0, 144.0, 96.0, 57.0, 42.0, 48.0, 24.0, 25.0, 17.0, 12.0, 5.0, 5.0, 4.0, 4.0, 6.0, 6.0, 0.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.1080322265625, -0.10540962219238281, -0.10278701782226562, -0.10016441345214844, -0.09754180908203125, -0.09491920471191406, -0.09229660034179688, -0.08967399597167969, -0.0870513916015625, -0.08442878723144531, -0.08180618286132812, -0.07918357849121094, -0.07656097412109375, -0.07393836975097656, -0.07131576538085938, -0.06869316101074219, -0.066070556640625, -0.06344795227050781, -0.060825347900390625, -0.05820274353027344, -0.05558013916015625, -0.05295753479003906, -0.050334930419921875, -0.04771232604980469, -0.0450897216796875, -0.04246711730957031, -0.039844512939453125, -0.03722190856933594, -0.03459930419921875, -0.03197669982910156, -0.029354095458984375, -0.026731491088867188, -0.02410888671875, -0.021486282348632812, -0.018863677978515625, -0.016241073608398438, -0.01361846923828125, -0.010995864868164062, -0.008373260498046875, -0.0057506561279296875, -0.0031280517578125, -0.0005054473876953125, 0.002117156982421875, 0.0047397613525390625, 0.00736236572265625, 0.009984970092773438, 0.012607574462890625, 0.015230178833007812, 0.017852783203125, 0.020475387573242188, 0.023097991943359375, 0.025720596313476562, 0.02834320068359375, 0.030965805053710938, 0.033588409423828125, 0.03621101379394531, 0.0388336181640625, 0.04145622253417969, 0.044078826904296875, 0.04670143127441406, 0.04932403564453125, 0.05194664001464844, 0.054569244384765625, 0.05719184875488281, 0.059814453125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 8.0, 18.0, 37.0, 40.0, 133.0, 123.0, 155.0, 204.0, 134.0, 80.0, 48.0, 18.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9848441481590271, -0.9579969048500061, -0.9311496615409851, -0.9043024182319641, -0.8774551153182983, -0.8506078720092773, -0.8237606287002563, -0.7969133853912354, -0.7700661420822144, -0.7432188987731934, -0.7163716554641724, -0.6895244121551514, -0.6626771688461304, -0.6358299255371094, -0.6089826226234436, -0.5821353793144226, -0.5552881360054016, -0.5284408926963806, -0.5015936493873596, -0.47474637627601624, -0.44789913296699524, -0.42105188965797424, -0.39420461654663086, -0.36735737323760986, -0.34051012992858887, -0.31366288661956787, -0.2868156433105469, -0.2599683701992035, -0.2331211268901825, -0.2062738835811615, -0.1794266253709793, -0.15257936716079712, -0.12573206424713135, -0.09888481348752975, -0.07203756272792816, -0.04519031196832657, -0.018343061208724976, 0.00850418210029602, 0.03535144031047821, 0.0621986985206604, 0.0890459418296814, 0.11589319258928299, 0.14274044334888458, 0.16958770155906677, 0.19643494486808777, 0.22328218817710876, 0.25012946128845215, 0.27697670459747314, 0.30382394790649414, 0.33067119121551514, 0.35751843452453613, 0.3843657076358795, 0.4112129509449005, 0.4380601942539215, 0.4649074673652649, 0.4917547106742859, 0.5186019539833069, 0.5454491972923279, 0.5722964406013489, 0.5991436839103699, 0.6259909868240356, 0.6528382301330566, 0.6796854734420776, 0.7065327167510986, 0.7333799600601196]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 1.0, 10.0, 8.0, 10.0, 6.0, 6.0, 11.0, 12.0, 10.0, 20.0, 20.0, 19.0, 24.0, 24.0, 39.0, 37.0, 40.0, 36.0, 41.0, 39.0, 44.0, 44.0, 46.0, 44.0, 28.0, 36.0, 40.0, 30.0, 28.0, 38.0, 32.0, 21.0, 30.0, 24.0, 19.0, 15.0, 16.0, 12.0, 9.0, 9.0, 6.0, 7.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.3551933765411377, -0.3455606698989868, -0.3359279930591583, -0.32629528641700745, -0.31666260957717896, -0.3070299029350281, -0.2973972260951996, -0.2877645194530487, -0.2781318426132202, -0.26849913597106934, -0.25886645913124084, -0.24923376739025116, -0.23960107564926147, -0.2299683839082718, -0.2203356921672821, -0.21070298552513123, -0.20107029378414154, -0.19143760204315186, -0.18180491030216217, -0.17217221856117249, -0.1625395268201828, -0.15290683507919312, -0.14327412843704224, -0.13364145159721375, -0.12400875240564346, -0.11437606066465378, -0.10474336892366409, -0.09511066973209381, -0.08547797799110413, -0.07584528625011444, -0.06621259450912476, -0.05657990276813507, -0.046947211027145386, -0.0373145192861557, -0.027681825682520866, -0.018049132078886032, -0.008416440337896347, 0.001216251403093338, 0.010848946869373322, 0.020481638610363007, 0.03011433035135269, 0.03974702209234238, 0.04937971383333206, 0.059012409299612045, 0.06864510476589203, 0.07827779650688171, 0.0879104882478714, 0.09754317998886108, 0.10717587172985077, 0.11680856347084045, 0.12644125521183014, 0.13607394695281982, 0.1457066386938095, 0.1553393304347992, 0.16497203707695007, 0.17460471391677856, 0.18423742055892944, 0.19387011229991913, 0.2035028040409088, 0.2131354957818985, 0.22276818752288818, 0.23240087926387787, 0.24203357100486755, 0.25166627764701843, 0.2612989544868469]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 9.0, 10.0, 21.0, 22.0, 30.0, 46.0, 96.0, 129.0, 215.0, 378.0, 783.0, 1488.0, 3091.0, 6498.0, 13837.0, 29629.0, 63806.0, 140470.0, 323180.0, 259379.0, 109656.0, 51087.0, 23532.0, 10886.0, 5183.0, 2428.0, 1173.0, 620.0, 311.0, 207.0, 127.0, 77.0, 46.0, 37.0, 19.0, 11.0, 12.0, 8.0, 5.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0], "bins": [-0.20068359375, -0.19538116455078125, -0.1900787353515625, -0.18477630615234375, -0.179473876953125, -0.17417144775390625, -0.1688690185546875, -0.16356658935546875, -0.15826416015625, -0.15296173095703125, -0.1476593017578125, -0.14235687255859375, -0.137054443359375, -0.13175201416015625, -0.1264495849609375, -0.12114715576171875, -0.1158447265625, -0.11054229736328125, -0.1052398681640625, -0.09993743896484375, -0.094635009765625, -0.08933258056640625, -0.0840301513671875, -0.07872772216796875, -0.07342529296875, -0.06812286376953125, -0.0628204345703125, -0.05751800537109375, -0.052215576171875, -0.04691314697265625, -0.0416107177734375, -0.03630828857421875, -0.031005859375, -0.02570343017578125, -0.0204010009765625, -0.01509857177734375, -0.009796142578125, -0.00449371337890625, 0.0008087158203125, 0.00611114501953125, 0.01141357421875, 0.01671600341796875, 0.0220184326171875, 0.02732086181640625, 0.032623291015625, 0.03792572021484375, 0.0432281494140625, 0.04853057861328125, 0.0538330078125, 0.05913543701171875, 0.0644378662109375, 0.06974029541015625, 0.075042724609375, 0.08034515380859375, 0.0856475830078125, 0.09095001220703125, 0.09625244140625, 0.10155487060546875, 0.1068572998046875, 0.11215972900390625, 0.117462158203125, 0.12276458740234375, 0.1280670166015625, 0.13336944580078125, 0.138671875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 1.0, 1.0, 6.0, 6.0, 10.0, 4.0, 12.0, 16.0, 14.0, 25.0, 32.0, 35.0, 41.0, 39.0, 41.0, 37.0, 43.0, 54.0, 47.0, 52.0, 51.0, 54.0, 67.0, 59.0, 37.0, 38.0, 36.0, 28.0, 24.0, 26.0, 21.0, 6.0, 16.0, 6.0, 4.0, 3.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036956787109375, -0.03560924530029297, -0.03426170349121094, -0.032914161682128906, -0.031566619873046875, -0.030219078063964844, -0.028871536254882812, -0.02752399444580078, -0.02617645263671875, -0.02482891082763672, -0.023481369018554688, -0.022133827209472656, -0.020786285400390625, -0.019438743591308594, -0.018091201782226562, -0.01674365997314453, -0.0153961181640625, -0.014048576354980469, -0.012701034545898438, -0.011353492736816406, -0.010005950927734375, -0.008658409118652344, -0.0073108673095703125, -0.005963325500488281, -0.00461578369140625, -0.0032682418823242188, -0.0019207000732421875, -0.0005731582641601562, 0.000774383544921875, 0.0021219253540039062, 0.0034694671630859375, 0.004817008972167969, 0.00616455078125, 0.007512092590332031, 0.008859634399414062, 0.010207176208496094, 0.011554718017578125, 0.012902259826660156, 0.014249801635742188, 0.015597343444824219, 0.01694488525390625, 0.01829242706298828, 0.019639968872070312, 0.020987510681152344, 0.022335052490234375, 0.023682594299316406, 0.025030136108398438, 0.02637767791748047, 0.0277252197265625, 0.02907276153564453, 0.030420303344726562, 0.031767845153808594, 0.033115386962890625, 0.034462928771972656, 0.03581047058105469, 0.03715801239013672, 0.03850555419921875, 0.03985309600830078, 0.04120063781738281, 0.042548179626464844, 0.043895721435546875, 0.045243263244628906, 0.04659080505371094, 0.04793834686279297, 0.049285888671875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 6.0, 5.0, 3.0, 9.0, 11.0, 10.0, 20.0, 29.0, 57.0, 77.0, 104.0, 154.0, 218.0, 366.0, 603.0, 1075.0, 2766.0, 10626.0, 64564.0, 483514.0, 415087.0, 54553.0, 9413.0, 2575.0, 1084.0, 532.0, 350.0, 253.0, 172.0, 97.0, 49.0, 51.0, 39.0, 16.0, 23.0, 16.0, 12.0, 4.0, 2.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30322265625, -0.2923774719238281, -0.28153228759765625, -0.2706871032714844, -0.2598419189453125, -0.24899673461914062, -0.23815155029296875, -0.22730636596679688, -0.216461181640625, -0.20561599731445312, -0.19477081298828125, -0.18392562866210938, -0.1730804443359375, -0.16223526000976562, -0.15139007568359375, -0.14054489135742188, -0.12969970703125, -0.11885452270507812, -0.10800933837890625, -0.09716415405273438, -0.0863189697265625, -0.07547378540039062, -0.06462860107421875, -0.053783416748046875, -0.042938232421875, -0.032093048095703125, -0.02124786376953125, -0.010402679443359375, 0.0004425048828125, 0.011287689208984375, 0.02213287353515625, 0.032978057861328125, 0.0438232421875, 0.054668426513671875, 0.06551361083984375, 0.07635879516601562, 0.0872039794921875, 0.09804916381835938, 0.10889434814453125, 0.11973953247070312, 0.130584716796875, 0.14142990112304688, 0.15227508544921875, 0.16312026977539062, 0.1739654541015625, 0.18481063842773438, 0.19565582275390625, 0.20650100708007812, 0.21734619140625, 0.22819137573242188, 0.23903656005859375, 0.24988174438476562, 0.2607269287109375, 0.2715721130371094, 0.28241729736328125, 0.2932624816894531, 0.304107666015625, 0.3149528503417969, 0.32579803466796875, 0.3366432189941406, 0.3474884033203125, 0.3583335876464844, 0.36917877197265625, 0.3800239562988281, 0.390869140625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 0.0, 11.0, 9.0, 13.0, 9.0, 13.0, 15.0, 12.0, 17.0, 9.0, 20.0, 28.0, 34.0, 23.0, 32.0, 41.0, 40.0, 33.0, 24.0, 38.0, 39.0, 50.0, 35.0, 32.0, 32.0, 39.0, 42.0, 29.0, 30.0, 34.0, 33.0, 24.0, 25.0, 30.0, 25.0, 19.0, 14.0, 8.0, 10.0, 9.0, 6.0, 2.0, 4.0, 1.0, 2.0, 5.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1571044921875, -0.1520843505859375, -0.147064208984375, -0.1420440673828125, -0.13702392578125, -0.1320037841796875, -0.126983642578125, -0.1219635009765625, -0.116943359375, -0.1119232177734375, -0.106903076171875, -0.1018829345703125, -0.09686279296875, -0.0918426513671875, -0.086822509765625, -0.0818023681640625, -0.0767822265625, -0.0717620849609375, -0.066741943359375, -0.0617218017578125, -0.05670166015625, -0.0516815185546875, -0.046661376953125, -0.0416412353515625, -0.03662109375, -0.0316009521484375, -0.026580810546875, -0.0215606689453125, -0.01654052734375, -0.0115203857421875, -0.006500244140625, -0.0014801025390625, 0.0035400390625, 0.0085601806640625, 0.013580322265625, 0.0186004638671875, 0.02362060546875, 0.0286407470703125, 0.033660888671875, 0.0386810302734375, 0.043701171875, 0.0487213134765625, 0.053741455078125, 0.0587615966796875, 0.06378173828125, 0.0688018798828125, 0.073822021484375, 0.0788421630859375, 0.0838623046875, 0.0888824462890625, 0.093902587890625, 0.0989227294921875, 0.10394287109375, 0.1089630126953125, 0.113983154296875, 0.1190032958984375, 0.1240234375, 0.1290435791015625, 0.134063720703125, 0.1390838623046875, 0.14410400390625, 0.1491241455078125, 0.154144287109375, 0.1591644287109375, 0.1641845703125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 9.0, 3.0, 6.0, 12.0, 24.0, 33.0, 51.0, 89.0, 145.0, 221.0, 433.0, 907.0, 1894.0, 5959.0, 26107.0, 275447.0, 673728.0, 49345.0, 9153.0, 2664.0, 1096.0, 515.0, 267.0, 144.0, 93.0, 58.0, 41.0, 39.0, 21.0, 11.0, 14.0, 8.0, 2.0, 3.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.309326171875, -0.30052947998046875, -0.2917327880859375, -0.28293609619140625, -0.274139404296875, -0.26534271240234375, -0.2565460205078125, -0.24774932861328125, -0.23895263671875, -0.23015594482421875, -0.2213592529296875, -0.21256256103515625, -0.203765869140625, -0.19496917724609375, -0.1861724853515625, -0.17737579345703125, -0.1685791015625, -0.15978240966796875, -0.1509857177734375, -0.14218902587890625, -0.133392333984375, -0.12459564208984375, -0.1157989501953125, -0.10700225830078125, -0.09820556640625, -0.08940887451171875, -0.0806121826171875, -0.07181549072265625, -0.063018798828125, -0.05422210693359375, -0.0454254150390625, -0.03662872314453125, -0.02783203125, -0.01903533935546875, -0.0102386474609375, -0.00144195556640625, 0.007354736328125, 0.01615142822265625, 0.0249481201171875, 0.03374481201171875, 0.04254150390625, 0.05133819580078125, 0.0601348876953125, 0.06893157958984375, 0.077728271484375, 0.08652496337890625, 0.0953216552734375, 0.10411834716796875, 0.1129150390625, 0.12171173095703125, 0.1305084228515625, 0.13930511474609375, 0.148101806640625, 0.15689849853515625, 0.1656951904296875, 0.17449188232421875, 0.18328857421875, 0.19208526611328125, 0.2008819580078125, 0.20967864990234375, 0.218475341796875, 0.22727203369140625, 0.2360687255859375, 0.24486541748046875, 0.253662109375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 10.0, 6.0, 9.0, 9.0, 7.0, 13.0, 21.0, 36.0, 42.0, 42.0, 60.0, 69.0, 88.0, 94.0, 86.0, 81.0, 71.0, 58.0, 50.0, 35.0, 27.0, 22.0, 24.0, 12.0, 7.0, 6.0, 4.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.052587509155273e-05, -7.756520062685013e-05, -7.460452616214752e-05, -7.164385169744492e-05, -6.868317723274231e-05, -6.57225027680397e-05, -6.27618283033371e-05, -5.980115383863449e-05, -5.6840479373931885e-05, -5.387980490922928e-05, -5.091913044452667e-05, -4.7958455979824066e-05, -4.499778151512146e-05, -4.2037107050418854e-05, -3.907643258571625e-05, -3.611575812101364e-05, -3.3155083656311035e-05, -3.019440919160843e-05, -2.7233734726905823e-05, -2.4273060262203217e-05, -2.131238579750061e-05, -1.8351711332798004e-05, -1.5391036868095398e-05, -1.2430362403392792e-05, -9.469687938690186e-06, -6.509013473987579e-06, -3.548339009284973e-06, -5.876645445823669e-07, 2.3730099201202393e-06, 5.3336843848228455e-06, 8.294358849525452e-06, 1.1255033314228058e-05, 1.4215707778930664e-05, 1.717638224363327e-05, 2.0137056708335876e-05, 2.3097731173038483e-05, 2.605840563774109e-05, 2.9019080102443695e-05, 3.19797545671463e-05, 3.494042903184891e-05, 3.7901103496551514e-05, 4.086177796125412e-05, 4.3822452425956726e-05, 4.678312689065933e-05, 4.974380135536194e-05, 5.2704475820064545e-05, 5.566515028476715e-05, 5.862582474946976e-05, 6.158649921417236e-05, 6.454717367887497e-05, 6.750784814357758e-05, 7.046852260828018e-05, 7.342919707298279e-05, 7.63898715376854e-05, 7.9350546002388e-05, 8.23112204670906e-05, 8.527189493179321e-05, 8.823256939649582e-05, 9.119324386119843e-05, 9.415391832590103e-05, 9.711459279060364e-05, 0.00010007526725530624, 0.00010303594172000885, 0.00010599661618471146, 0.00010895729064941406]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 7.0, 9.0, 8.0, 13.0, 23.0, 31.0, 27.0, 58.0, 100.0, 214.0, 377.0, 1031.0, 3249.0, 11973.0, 88676.0, 847839.0, 78721.0, 11229.0, 3043.0, 992.0, 432.0, 196.0, 105.0, 66.0, 34.0, 30.0, 18.0, 12.0, 9.0, 7.0, 7.0, 1.0, 5.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30322265625, -0.29327392578125, -0.2833251953125, -0.27337646484375, -0.263427734375, -0.25347900390625, -0.2435302734375, -0.23358154296875, -0.2236328125, -0.21368408203125, -0.2037353515625, -0.19378662109375, -0.183837890625, -0.17388916015625, -0.1639404296875, -0.15399169921875, -0.14404296875, -0.13409423828125, -0.1241455078125, -0.11419677734375, -0.104248046875, -0.09429931640625, -0.0843505859375, -0.07440185546875, -0.064453125, -0.05450439453125, -0.0445556640625, -0.03460693359375, -0.024658203125, -0.01470947265625, -0.0047607421875, 0.00518798828125, 0.01513671875, 0.02508544921875, 0.0350341796875, 0.04498291015625, 0.054931640625, 0.06488037109375, 0.0748291015625, 0.08477783203125, 0.0947265625, 0.10467529296875, 0.1146240234375, 0.12457275390625, 0.134521484375, 0.14447021484375, 0.1544189453125, 0.16436767578125, 0.17431640625, 0.18426513671875, 0.1942138671875, 0.20416259765625, 0.214111328125, 0.22406005859375, 0.2340087890625, 0.24395751953125, 0.25390625, 0.26385498046875, 0.2738037109375, 0.28375244140625, 0.293701171875, 0.30364990234375, 0.3135986328125, 0.32354736328125, 0.33349609375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 2.0, 5.0, 7.0, 5.0, 3.0, 9.0, 13.0, 27.0, 34.0, 43.0, 79.0, 149.0, 219.0, 147.0, 77.0, 58.0, 37.0, 34.0, 10.0, 7.0, 4.0, 10.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2342529296875, -0.22802162170410156, -0.22179031372070312, -0.2155590057373047, -0.20932769775390625, -0.2030963897705078, -0.19686508178710938, -0.19063377380371094, -0.1844024658203125, -0.17817115783691406, -0.17193984985351562, -0.1657085418701172, -0.15947723388671875, -0.1532459259033203, -0.14701461791992188, -0.14078330993652344, -0.134552001953125, -0.12832069396972656, -0.12208938598632812, -0.11585807800292969, -0.10962677001953125, -0.10339546203613281, -0.09716415405273438, -0.09093284606933594, -0.0847015380859375, -0.07847023010253906, -0.07223892211914062, -0.06600761413574219, -0.05977630615234375, -0.05354499816894531, -0.047313690185546875, -0.04108238220214844, -0.03485107421875, -0.028619766235351562, -0.022388458251953125, -0.016157150268554688, -0.00992584228515625, -0.0036945343017578125, 0.002536773681640625, 0.008768081665039062, 0.0149993896484375, 0.021230697631835938, 0.027462005615234375, 0.03369331359863281, 0.03992462158203125, 0.04615592956542969, 0.052387237548828125, 0.05861854553222656, 0.064849853515625, 0.07108116149902344, 0.07731246948242188, 0.08354377746582031, 0.08977508544921875, 0.09600639343261719, 0.10223770141601562, 0.10846900939941406, 0.1147003173828125, 0.12093162536621094, 0.12716293334960938, 0.1333942413330078, 0.13962554931640625, 0.1458568572998047, 0.15208816528320312, 0.15831947326660156, 0.16455078125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 9.0, 32.0, 76.0, 101.0, 173.0, 172.0, 188.0, 111.0, 66.0, 39.0, 21.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.488983631134033, -3.4050533771514893, -3.3211233615875244, -3.2371931076049805, -3.1532630920410156, -3.0693328380584717, -2.9854025840759277, -2.901472568511963, -2.817542552947998, -2.733612298965454, -2.6496822834014893, -2.5657520294189453, -2.4818220138549805, -2.3978917598724365, -2.3139615058898926, -2.2300314903259277, -2.146101236343384, -2.06217098236084, -1.978240966796875, -1.894310712814331, -1.8103806972503662, -1.7264504432678223, -1.6425203084945679, -1.5585901737213135, -1.474660038948059, -1.3907299041748047, -1.3067997694015503, -1.222869634628296, -1.138939380645752, -1.055009365081787, -0.9710791110992432, -0.8871489763259888, -0.8032190799713135, -0.7192889451980591, -0.6353588104248047, -0.5514286160469055, -0.4674984812736511, -0.38356834650039673, -0.29963815212249756, -0.21570801734924316, -0.13177788257598877, -0.04784773290157318, 0.03608241677284241, 0.12001258134841919, 0.20394271612167358, 0.287872850894928, 0.37180304527282715, 0.45573318004608154, 0.5396633148193359, 0.6235934495925903, 0.7075235843658447, 0.7914537787437439, 0.8753839135169983, 0.9593140482902527, 1.0432442426681519, 1.1271743774414062, 1.2111045122146606, 1.295034646987915, 1.3789647817611694, 1.4628949165344238, 1.5468251705169678, 1.6307551860809326, 1.7146854400634766, 1.798615574836731, 1.8825457096099854]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [5.0, 0.0, 2.0, 0.0, 4.0, 1.0, 0.0, 3.0, 5.0, 8.0, 4.0, 5.0, 3.0, 15.0, 13.0, 21.0, 19.0, 17.0, 23.0, 25.0, 29.0, 28.0, 35.0, 29.0, 31.0, 38.0, 37.0, 44.0, 40.0, 51.0, 41.0, 31.0, 33.0, 38.0, 35.0, 30.0, 30.0, 25.0, 26.0, 26.0, 23.0, 20.0, 16.0, 11.0, 14.0, 17.0, 8.0, 8.0, 6.0, 11.0, 9.0, 10.0, 7.0, 2.0, 3.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8400186896324158, -0.8119205832481384, -0.7838225364685059, -0.7557244300842285, -0.7276263236999512, -0.6995282173156738, -0.6714301705360413, -0.6433320641517639, -0.6152340173721313, -0.587135910987854, -0.5590378642082214, -0.5309397578239441, -0.5028416514396667, -0.4747435748577118, -0.44664549827575684, -0.4185473918914795, -0.39044928550720215, -0.3623512089252472, -0.33425310254096985, -0.3061550259590149, -0.27805691957473755, -0.2499588429927826, -0.22186076641082764, -0.1937626749277115, -0.16566458344459534, -0.1375664919614792, -0.10946840792894363, -0.08137032389640808, -0.05327223241329193, -0.02517414093017578, 0.002923935651779175, 0.031022027134895325, 0.05912017822265625, 0.0872182697057724, 0.11531635373830795, 0.1434144377708435, 0.17151252925395966, 0.1996106207370758, 0.22770869731903076, 0.2558068037033081, 0.28390488028526306, 0.312002956867218, 0.34010106325149536, 0.3681991398334503, 0.3962972164154053, 0.4243953227996826, 0.4524933993816376, 0.48059147596359253, 0.5086895823478699, 0.5367876887321472, 0.5648857355117798, 0.5929838418960571, 0.6210819482803345, 0.6491800546646118, 0.6772781014442444, 0.7053762078285217, 0.7334742546081543, 0.7615723609924316, 0.7896704077720642, 0.8177685141563416, 0.8458666205406189, 0.8739646673202515, 0.9020627737045288, 0.9301608800888062, 0.9582589864730835]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 8.0, 7.0, 13.0, 24.0, 30.0, 40.0, 71.0, 109.0, 186.0, 292.0, 445.0, 731.0, 1297.0, 2356.0, 4433.0, 9154.0, 20311.0, 52235.0, 174134.0, 2199799.0, 1485832.0, 157193.0, 48157.0, 18876.0, 8702.0, 4254.0, 2220.0, 1256.0, 739.0, 447.0, 316.0, 173.0, 146.0, 92.0, 55.0, 50.0, 22.0, 23.0, 18.0, 7.0, 7.0, 2.0, 6.0, 5.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.137939453125, -0.13300704956054688, -0.12807464599609375, -0.12314224243164062, -0.1182098388671875, -0.11327743530273438, -0.10834503173828125, -0.10341262817382812, -0.098480224609375, -0.09354782104492188, -0.08861541748046875, -0.08368301391601562, -0.0787506103515625, -0.07381820678710938, -0.06888580322265625, -0.06395339965820312, -0.05902099609375, -0.054088592529296875, -0.04915618896484375, -0.044223785400390625, -0.0392913818359375, -0.034358978271484375, -0.02942657470703125, -0.024494171142578125, -0.019561767578125, -0.014629364013671875, -0.00969696044921875, -0.004764556884765625, 0.0001678466796875, 0.005100250244140625, 0.01003265380859375, 0.014965057373046875, 0.0198974609375, 0.024829864501953125, 0.02976226806640625, 0.034694671630859375, 0.0396270751953125, 0.044559478759765625, 0.04949188232421875, 0.054424285888671875, 0.059356689453125, 0.06428909301757812, 0.06922149658203125, 0.07415390014648438, 0.0790863037109375, 0.08401870727539062, 0.08895111083984375, 0.09388351440429688, 0.09881591796875, 0.10374832153320312, 0.10868072509765625, 0.11361312866210938, 0.1185455322265625, 0.12347793579101562, 0.12841033935546875, 0.13334274291992188, 0.138275146484375, 0.14320755004882812, 0.14813995361328125, 0.15307235717773438, 0.1580047607421875, 0.16293716430664062, 0.16786956787109375, 0.17280197143554688, 0.177734375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 7.0, 2.0, 9.0, 10.0, 6.0, 15.0, 12.0, 18.0, 17.0, 39.0, 35.0, 41.0, 48.0, 46.0, 65.0, 53.0, 57.0, 50.0, 55.0, 55.0, 62.0, 47.0, 54.0, 35.0, 34.0, 33.0, 22.0, 16.0, 16.0, 13.0, 13.0, 6.0, 1.0, 2.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.04644775390625, -0.04492473602294922, -0.04340171813964844, -0.041878700256347656, -0.040355682373046875, -0.038832664489746094, -0.03730964660644531, -0.03578662872314453, -0.03426361083984375, -0.03274059295654297, -0.031217575073242188, -0.029694557189941406, -0.028171539306640625, -0.026648521423339844, -0.025125503540039062, -0.02360248565673828, -0.0220794677734375, -0.02055644989013672, -0.019033432006835938, -0.017510414123535156, -0.015987396240234375, -0.014464378356933594, -0.012941360473632812, -0.011418342590332031, -0.00989532470703125, -0.008372306823730469, -0.0068492889404296875, -0.005326271057128906, -0.003803253173828125, -0.0022802352905273438, -0.0007572174072265625, 0.0007658004760742188, 0.002288818359375, 0.0038118362426757812, 0.0053348541259765625, 0.006857872009277344, 0.008380889892578125, 0.009903907775878906, 0.011426925659179688, 0.012949943542480469, 0.01447296142578125, 0.01599597930908203, 0.017518997192382812, 0.019042015075683594, 0.020565032958984375, 0.022088050842285156, 0.023611068725585938, 0.02513408660888672, 0.0266571044921875, 0.02818012237548828, 0.029703140258789062, 0.031226158142089844, 0.032749176025390625, 0.034272193908691406, 0.03579521179199219, 0.03731822967529297, 0.03884124755859375, 0.04036426544189453, 0.04188728332519531, 0.043410301208496094, 0.044933319091796875, 0.046456336975097656, 0.04797935485839844, 0.04950237274169922, 0.051025390625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 3.0, 5.0, 10.0, 16.0, 24.0, 33.0, 47.0, 69.0, 114.0, 162.0, 247.0, 379.0, 580.0, 1051.0, 1938.0, 3489.0, 6767.0, 14498.0, 33964.0, 95275.0, 374369.0, 2804256.0, 640749.0, 134993.0, 45317.0, 18445.0, 8201.0, 3977.0, 2213.0, 1171.0, 699.0, 440.0, 267.0, 183.0, 100.0, 84.0, 47.0, 27.0, 12.0, 20.0, 12.0, 16.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.179931640625, -0.17441940307617188, -0.16890716552734375, -0.16339492797851562, -0.1578826904296875, -0.15237045288085938, -0.14685821533203125, -0.14134597778320312, -0.135833740234375, -0.13032150268554688, -0.12480926513671875, -0.11929702758789062, -0.1137847900390625, -0.10827255249023438, -0.10276031494140625, -0.09724807739257812, -0.09173583984375, -0.08622360229492188, -0.08071136474609375, -0.07519912719726562, -0.0696868896484375, -0.06417465209960938, -0.05866241455078125, -0.053150177001953125, -0.047637939453125, -0.042125701904296875, -0.03661346435546875, -0.031101226806640625, -0.0255889892578125, -0.020076751708984375, -0.01456451416015625, -0.009052276611328125, -0.0035400390625, 0.001972198486328125, 0.00748443603515625, 0.012996673583984375, 0.0185089111328125, 0.024021148681640625, 0.02953338623046875, 0.035045623779296875, 0.040557861328125, 0.046070098876953125, 0.05158233642578125, 0.057094573974609375, 0.0626068115234375, 0.06811904907226562, 0.07363128662109375, 0.07914352416992188, 0.08465576171875, 0.09016799926757812, 0.09568023681640625, 0.10119247436523438, 0.1067047119140625, 0.11221694946289062, 0.11772918701171875, 0.12324142456054688, 0.128753662109375, 0.13426589965820312, 0.13977813720703125, 0.14529037475585938, 0.1508026123046875, 0.15631484985351562, 0.16182708740234375, 0.16733932495117188, 0.1728515625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 3.0, 4.0, 10.0, 5.0, 5.0, 11.0, 10.0, 14.0, 23.0, 24.0, 25.0, 59.0, 88.0, 101.0, 178.0, 238.0, 487.0, 1068.0, 700.0, 360.0, 195.0, 124.0, 90.0, 54.0, 46.0, 37.0, 24.0, 22.0, 18.0, 15.0, 13.0, 3.0, 4.0, 7.0, 4.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11700439453125, -0.11390399932861328, -0.11080360412597656, -0.10770320892333984, -0.10460281372070312, -0.1015024185180664, -0.09840202331542969, -0.09530162811279297, -0.09220123291015625, -0.08910083770751953, -0.08600044250488281, -0.0829000473022461, -0.07979965209960938, -0.07669925689697266, -0.07359886169433594, -0.07049846649169922, -0.0673980712890625, -0.06429767608642578, -0.06119728088378906, -0.058096885681152344, -0.054996490478515625, -0.051896095275878906, -0.04879570007324219, -0.04569530487060547, -0.04259490966796875, -0.03949451446533203, -0.03639411926269531, -0.033293724060058594, -0.030193328857421875, -0.027092933654785156, -0.023992538452148438, -0.02089214324951172, -0.017791748046875, -0.014691352844238281, -0.011590957641601562, -0.008490562438964844, -0.005390167236328125, -0.0022897720336914062, 0.0008106231689453125, 0.003911018371582031, 0.00701141357421875, 0.010111808776855469, 0.013212203979492188, 0.016312599182128906, 0.019412994384765625, 0.022513389587402344, 0.025613784790039062, 0.02871417999267578, 0.0318145751953125, 0.03491497039794922, 0.03801536560058594, 0.041115760803222656, 0.044216156005859375, 0.047316551208496094, 0.05041694641113281, 0.05351734161376953, 0.05661773681640625, 0.05971813201904297, 0.06281852722167969, 0.0659189224243164, 0.06901931762695312, 0.07211971282958984, 0.07522010803222656, 0.07832050323486328, 0.0814208984375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 4.0, 3.0, 11.0, 12.0, 30.0, 38.0, 61.0, 86.0, 110.0, 125.0, 117.0, 117.0, 98.0, 66.0, 43.0, 28.0, 19.0, 14.0, 11.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6959151029586792, -0.6721333265304565, -0.6483514904975891, -0.6245697140693665, -0.600787878036499, -0.5770061016082764, -0.5532243251800537, -0.5294424891471863, -0.5056606531143188, -0.4818788468837738, -0.45809704065322876, -0.4343152642250061, -0.41053342819213867, -0.386751651763916, -0.36296984553337097, -0.3391880393028259, -0.31540626287460327, -0.2916244566440582, -0.2678426504135132, -0.24406085908412933, -0.2202790528535843, -0.19649724662303925, -0.1727154552936554, -0.14893364906311035, -0.1251518428325653, -0.10137003660202026, -0.07758823782205582, -0.05380643904209137, -0.030024632811546326, -0.006242826581001282, 0.01753896474838257, 0.04132077097892761, 0.06510257720947266, 0.0888843834400177, 0.11266618221998215, 0.1364479809999466, 0.16022978723049164, 0.18401159346103668, 0.20779338479042053, 0.23157519102096558, 0.2553569972515106, 0.27913880348205566, 0.3029206097126007, 0.32670241594314575, 0.3504841923713684, 0.37426602840423584, 0.3980478048324585, 0.42182961106300354, 0.4456114172935486, 0.46939322352409363, 0.49317502975463867, 0.5169568061828613, 0.5407386422157288, 0.5645204186439514, 0.5883022546768188, 0.6120840311050415, 0.6358658075332642, 0.6596475839614868, 0.6834294199943542, 0.7072111964225769, 0.7309930324554443, 0.754774808883667, 0.7785565853118896, 0.8023384213447571, 0.8261202573776245]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 6.0, 7.0, 8.0, 9.0, 11.0, 19.0, 18.0, 11.0, 24.0, 22.0, 37.0, 39.0, 41.0, 35.0, 56.0, 52.0, 52.0, 46.0, 55.0, 54.0, 55.0, 54.0, 45.0, 53.0, 34.0, 34.0, 24.0, 17.0, 17.0, 17.0, 15.0, 14.0, 8.0, 5.0, 7.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5075972676277161, -0.49290984869003296, -0.47822245955467224, -0.4635350704193115, -0.4488476514816284, -0.4341602325439453, -0.4194728434085846, -0.4047854542732239, -0.39009803533554077, -0.37541061639785767, -0.36072322726249695, -0.34603583812713623, -0.3313484191894531, -0.31666100025177, -0.3019736111164093, -0.2872862219810486, -0.2725988030433655, -0.2579113841056824, -0.24322399497032166, -0.22853659093379974, -0.21384918689727783, -0.19916178286075592, -0.184474378824234, -0.1697869747877121, -0.15509957075119019, -0.14041216671466827, -0.12572476267814636, -0.11103735864162445, -0.09634995460510254, -0.08166255056858063, -0.06697514653205872, -0.052287742495536804, -0.03760033845901489, -0.02291293442249298, -0.00822553038597107, 0.006461873650550842, 0.021149277687072754, 0.035836681723594666, 0.05052408576011658, 0.06521148979663849, 0.0798988938331604, 0.09458629786968231, 0.10927370190620422, 0.12396110594272614, 0.13864850997924805, 0.15333591401576996, 0.16802331805229187, 0.18271072208881378, 0.1973981261253357, 0.2120855301618576, 0.22677293419837952, 0.24146033823490143, 0.25614774227142334, 0.27083516120910645, 0.28552255034446716, 0.3002099394798279, 0.314897358417511, 0.3295847773551941, 0.3442721664905548, 0.3589595556259155, 0.37364697456359863, 0.38833439350128174, 0.40302178263664246, 0.4177091717720032, 0.4323965907096863]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 4.0, 8.0, 10.0, 17.0, 22.0, 37.0, 37.0, 59.0, 107.0, 190.0, 293.0, 436.0, 759.0, 1302.0, 2238.0, 4201.0, 7451.0, 14096.0, 27677.0, 54913.0, 140837.0, 518185.0, 156178.0, 57785.0, 29010.0, 14815.0, 7989.0, 4213.0, 2317.0, 1312.0, 808.0, 427.0, 277.0, 185.0, 122.0, 67.0, 51.0, 32.0, 20.0, 14.0, 15.0, 11.0, 9.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.1690673828125, -0.1635303497314453, -0.15799331665039062, -0.15245628356933594, -0.14691925048828125, -0.14138221740722656, -0.13584518432617188, -0.1303081512451172, -0.1247711181640625, -0.11923408508300781, -0.11369705200195312, -0.10816001892089844, -0.10262298583984375, -0.09708595275878906, -0.09154891967773438, -0.08601188659667969, -0.080474853515625, -0.07493782043457031, -0.06940078735351562, -0.06386375427246094, -0.05832672119140625, -0.05278968811035156, -0.047252655029296875, -0.04171562194824219, -0.0361785888671875, -0.030641555786132812, -0.025104522705078125, -0.019567489624023438, -0.01403045654296875, -0.008493423461914062, -0.002956390380859375, 0.0025806427001953125, 0.00811767578125, 0.013654708862304688, 0.019191741943359375, 0.024728775024414062, 0.03026580810546875, 0.03580284118652344, 0.041339874267578125, 0.04687690734863281, 0.0524139404296875, 0.05795097351074219, 0.06348800659179688, 0.06902503967285156, 0.07456207275390625, 0.08009910583496094, 0.08563613891601562, 0.09117317199707031, 0.096710205078125, 0.10224723815917969, 0.10778427124023438, 0.11332130432128906, 0.11885833740234375, 0.12439537048339844, 0.12993240356445312, 0.1354694366455078, 0.1410064697265625, 0.1465435028076172, 0.15208053588867188, 0.15761756896972656, 0.16315460205078125, 0.16869163513183594, 0.17422866821289062, 0.1797657012939453, 0.185302734375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 8.0, 5.0, 10.0, 15.0, 8.0, 24.0, 24.0, 20.0, 33.0, 41.0, 51.0, 37.0, 37.0, 57.0, 58.0, 65.0, 40.0, 40.0, 44.0, 60.0, 44.0, 45.0, 45.0, 38.0, 22.0, 24.0, 23.0, 16.0, 16.0, 6.0, 16.0, 6.0, 8.0, 3.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.044403076171875, -0.042989253997802734, -0.04157543182373047, -0.0401616096496582, -0.03874778747558594, -0.03733396530151367, -0.035920143127441406, -0.03450632095336914, -0.033092498779296875, -0.03167867660522461, -0.030264854431152344, -0.028851032257080078, -0.027437210083007812, -0.026023387908935547, -0.02460956573486328, -0.023195743560791016, -0.02178192138671875, -0.020368099212646484, -0.01895427703857422, -0.017540454864501953, -0.016126632690429688, -0.014712810516357422, -0.013298988342285156, -0.01188516616821289, -0.010471343994140625, -0.00905752182006836, -0.007643699645996094, -0.006229877471923828, -0.0048160552978515625, -0.003402233123779297, -0.0019884109497070312, -0.0005745887756347656, 0.0008392333984375, 0.0022530555725097656, 0.0036668777465820312, 0.005080699920654297, 0.0064945220947265625, 0.007908344268798828, 0.009322166442871094, 0.01073598861694336, 0.012149810791015625, 0.01356363296508789, 0.014977455139160156, 0.016391277313232422, 0.017805099487304688, 0.019218921661376953, 0.02063274383544922, 0.022046566009521484, 0.02346038818359375, 0.024874210357666016, 0.02628803253173828, 0.027701854705810547, 0.029115676879882812, 0.030529499053955078, 0.031943321228027344, 0.03335714340209961, 0.034770965576171875, 0.03618478775024414, 0.037598609924316406, 0.03901243209838867, 0.04042625427246094, 0.0418400764465332, 0.04325389862060547, 0.044667720794677734, 0.04608154296875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 2.0, 5.0, 3.0, 6.0, 4.0, 13.0, 18.0, 18.0, 20.0, 18.0, 37.0, 67.0, 61.0, 102.0, 112.0, 155.0, 219.0, 296.0, 459.0, 654.0, 1327.0, 2888.0, 8874.0, 33353.0, 132045.0, 694673.0, 126066.0, 32365.0, 8432.0, 2861.0, 1212.0, 663.0, 416.0, 270.0, 205.0, 165.0, 118.0, 81.0, 62.0, 47.0, 48.0, 29.0, 22.0, 18.0, 8.0, 12.0, 7.0, 7.0, 3.0, 8.0, 4.0, 5.0, 1.0, 1.0, 2.0], "bins": [-0.29052734375, -0.2821025848388672, -0.2736778259277344, -0.26525306701660156, -0.25682830810546875, -0.24840354919433594, -0.23997879028320312, -0.2315540313720703, -0.2231292724609375, -0.2147045135498047, -0.20627975463867188, -0.19785499572753906, -0.18943023681640625, -0.18100547790527344, -0.17258071899414062, -0.1641559600830078, -0.155731201171875, -0.1473064422607422, -0.13888168334960938, -0.13045692443847656, -0.12203216552734375, -0.11360740661621094, -0.10518264770507812, -0.09675788879394531, -0.0883331298828125, -0.07990837097167969, -0.07148361206054688, -0.06305885314941406, -0.05463409423828125, -0.04620933532714844, -0.037784576416015625, -0.029359817504882812, -0.02093505859375, -0.012510299682617188, -0.004085540771484375, 0.0043392181396484375, 0.01276397705078125, 0.021188735961914062, 0.029613494873046875, 0.03803825378417969, 0.0464630126953125, 0.05488777160644531, 0.06331253051757812, 0.07173728942871094, 0.08016204833984375, 0.08858680725097656, 0.09701156616210938, 0.10543632507324219, 0.113861083984375, 0.12228584289550781, 0.13071060180664062, 0.13913536071777344, 0.14756011962890625, 0.15598487854003906, 0.16440963745117188, 0.1728343963623047, 0.1812591552734375, 0.1896839141845703, 0.19810867309570312, 0.20653343200683594, 0.21495819091796875, 0.22338294982910156, 0.23180770874023438, 0.2402324676513672, 0.2486572265625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 5.0, 6.0, 10.0, 9.0, 11.0, 12.0, 18.0, 19.0, 24.0, 24.0, 38.0, 37.0, 37.0, 49.0, 41.0, 42.0, 51.0, 65.0, 52.0, 48.0, 55.0, 33.0, 47.0, 38.0, 35.0, 30.0, 22.0, 25.0, 28.0, 23.0, 10.0, 16.0, 8.0, 7.0, 5.0, 5.0, 5.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.216552734375, -0.2099895477294922, -0.20342636108398438, -0.19686317443847656, -0.19029998779296875, -0.18373680114746094, -0.17717361450195312, -0.1706104278564453, -0.1640472412109375, -0.1574840545654297, -0.15092086791992188, -0.14435768127441406, -0.13779449462890625, -0.13123130798339844, -0.12466812133789062, -0.11810493469238281, -0.111541748046875, -0.10497856140136719, -0.09841537475585938, -0.09185218811035156, -0.08528900146484375, -0.07872581481933594, -0.07216262817382812, -0.06559944152832031, -0.0590362548828125, -0.05247306823730469, -0.045909881591796875, -0.03934669494628906, -0.03278350830078125, -0.026220321655273438, -0.019657135009765625, -0.013093948364257812, -0.00653076171875, 3.24249267578125e-05, 0.006595611572265625, 0.013158798217773438, 0.01972198486328125, 0.026285171508789062, 0.032848358154296875, 0.03941154479980469, 0.0459747314453125, 0.05253791809082031, 0.059101104736328125, 0.06566429138183594, 0.07222747802734375, 0.07879066467285156, 0.08535385131835938, 0.09191703796386719, 0.098480224609375, 0.10504341125488281, 0.11160659790039062, 0.11816978454589844, 0.12473297119140625, 0.13129615783691406, 0.13785934448242188, 0.1444225311279297, 0.1509857177734375, 0.1575489044189453, 0.16411209106445312, 0.17067527770996094, 0.17723846435546875, 0.18380165100097656, 0.19036483764648438, 0.1969280242919922, 0.2034912109375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 5.0, 10.0, 24.0, 40.0, 55.0, 89.0, 180.0, 350.0, 949.0, 3227.0, 16051.0, 133826.0, 837273.0, 46200.0, 7371.0, 1766.0, 582.0, 248.0, 115.0, 64.0, 42.0, 32.0, 27.0, 11.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31201171875, -0.30170440673828125, -0.2913970947265625, -0.28108978271484375, -0.270782470703125, -0.26047515869140625, -0.2501678466796875, -0.23986053466796875, -0.22955322265625, -0.21924591064453125, -0.2089385986328125, -0.19863128662109375, -0.188323974609375, -0.17801666259765625, -0.1677093505859375, -0.15740203857421875, -0.1470947265625, -0.13678741455078125, -0.1264801025390625, -0.11617279052734375, -0.105865478515625, -0.09555816650390625, -0.0852508544921875, -0.07494354248046875, -0.06463623046875, -0.05432891845703125, -0.0440216064453125, -0.03371429443359375, -0.023406982421875, -0.01309967041015625, -0.0027923583984375, 0.00751495361328125, 0.017822265625, 0.02812957763671875, 0.0384368896484375, 0.04874420166015625, 0.059051513671875, 0.06935882568359375, 0.0796661376953125, 0.08997344970703125, 0.10028076171875, 0.11058807373046875, 0.1208953857421875, 0.13120269775390625, 0.141510009765625, 0.15181732177734375, 0.1621246337890625, 0.17243194580078125, 0.1827392578125, 0.19304656982421875, 0.2033538818359375, 0.21366119384765625, 0.223968505859375, 0.23427581787109375, 0.2445831298828125, 0.25489044189453125, 0.26519775390625, 0.27550506591796875, 0.2858123779296875, 0.29611968994140625, 0.306427001953125, 0.31673431396484375, 0.3270416259765625, 0.33734893798828125, 0.34765625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 3.0, 8.0, 6.0, 15.0, 11.0, 27.0, 38.0, 49.0, 62.0, 105.0, 121.0, 114.0, 106.0, 85.0, 60.0, 52.0, 28.0, 29.0, 19.0, 10.0, 11.0, 3.0, 4.0, 3.0, 9.0, 3.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0], "bins": [-0.00013780593872070312, -0.00013447925448417664, -0.00013115257024765015, -0.00012782588601112366, -0.00012449920177459717, -0.00012117251753807068, -0.00011784583330154419, -0.0001145191490650177, -0.00011119246482849121, -0.00010786578059196472, -0.00010453909635543823, -0.00010121241211891174, -9.788572788238525e-05, -9.455904364585876e-05, -9.123235940933228e-05, -8.790567517280579e-05, -8.45789909362793e-05, -8.125230669975281e-05, -7.792562246322632e-05, -7.459893822669983e-05, -7.127225399017334e-05, -6.794556975364685e-05, -6.461888551712036e-05, -6.129220128059387e-05, -5.796551704406738e-05, -5.4638832807540894e-05, -5.1312148571014404e-05, -4.7985464334487915e-05, -4.4658780097961426e-05, -4.1332095861434937e-05, -3.800541162490845e-05, -3.467872738838196e-05, -3.135204315185547e-05, -2.802535891532898e-05, -2.469867467880249e-05, -2.1371990442276e-05, -1.8045306205749512e-05, -1.4718621969223022e-05, -1.1391937732696533e-05, -8.065253496170044e-06, -4.738569259643555e-06, -1.4118850231170654e-06, 1.914799213409424e-06, 5.241483449935913e-06, 8.568167686462402e-06, 1.1894851922988892e-05, 1.5221536159515381e-05, 1.854822039604187e-05, 2.187490463256836e-05, 2.520158886909485e-05, 2.8528273105621338e-05, 3.185495734214783e-05, 3.5181641578674316e-05, 3.8508325815200806e-05, 4.1835010051727295e-05, 4.5161694288253784e-05, 4.8488378524780273e-05, 5.181506276130676e-05, 5.514174699783325e-05, 5.846843123435974e-05, 6.179511547088623e-05, 6.512179970741272e-05, 6.844848394393921e-05, 7.17751681804657e-05, 7.510185241699219e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 8.0, 9.0, 13.0, 14.0, 30.0, 29.0, 51.0, 64.0, 102.0, 173.0, 274.0, 454.0, 980.0, 2424.0, 7281.0, 27906.0, 221879.0, 724612.0, 45629.0, 10617.0, 3331.0, 1265.0, 546.0, 308.0, 184.0, 118.0, 64.0, 50.0, 46.0, 31.0, 16.0, 12.0, 11.0, 8.0, 7.0, 2.0, 1.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2093505859375, -0.20191383361816406, -0.19447708129882812, -0.1870403289794922, -0.17960357666015625, -0.1721668243408203, -0.16473007202148438, -0.15729331970214844, -0.1498565673828125, -0.14241981506347656, -0.13498306274414062, -0.1275463104248047, -0.12010955810546875, -0.11267280578613281, -0.10523605346679688, -0.09779930114746094, -0.090362548828125, -0.08292579650878906, -0.07548904418945312, -0.06805229187011719, -0.06061553955078125, -0.05317878723144531, -0.045742034912109375, -0.03830528259277344, -0.0308685302734375, -0.023431777954101562, -0.015995025634765625, -0.008558273315429688, -0.00112152099609375, 0.0063152313232421875, 0.013751983642578125, 0.021188735961914062, 0.02862548828125, 0.03606224060058594, 0.043498992919921875, 0.05093574523925781, 0.05837249755859375, 0.06580924987792969, 0.07324600219726562, 0.08068275451660156, 0.0881195068359375, 0.09555625915527344, 0.10299301147460938, 0.11042976379394531, 0.11786651611328125, 0.1253032684326172, 0.13274002075195312, 0.14017677307128906, 0.147613525390625, 0.15505027770996094, 0.16248703002929688, 0.1699237823486328, 0.17736053466796875, 0.1847972869873047, 0.19223403930664062, 0.19967079162597656, 0.2071075439453125, 0.21454429626464844, 0.22198104858398438, 0.2294178009033203, 0.23685455322265625, 0.2442913055419922, 0.2517280578613281, 0.25916481018066406, 0.2666015625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 7.0, 3.0, 7.0, 4.0, 14.0, 15.0, 13.0, 16.0, 25.0, 33.0, 52.0, 107.0, 161.0, 157.0, 129.0, 67.0, 41.0, 23.0, 17.0, 25.0, 11.0, 12.0, 9.0, 10.0, 5.0, 5.0, 4.0, 3.0, 4.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.10833740234375, -0.10475635528564453, -0.10117530822753906, -0.0975942611694336, -0.09401321411132812, -0.09043216705322266, -0.08685111999511719, -0.08327007293701172, -0.07968902587890625, -0.07610797882080078, -0.07252693176269531, -0.06894588470458984, -0.06536483764648438, -0.061783790588378906, -0.05820274353027344, -0.05462169647216797, -0.0510406494140625, -0.04745960235595703, -0.04387855529785156, -0.040297508239746094, -0.036716461181640625, -0.033135414123535156, -0.029554367065429688, -0.02597332000732422, -0.02239227294921875, -0.01881122589111328, -0.015230178833007812, -0.011649131774902344, -0.008068084716796875, -0.004487037658691406, -0.0009059906005859375, 0.0026750564575195312, 0.006256103515625, 0.009837150573730469, 0.013418197631835938, 0.016999244689941406, 0.020580291748046875, 0.024161338806152344, 0.027742385864257812, 0.03132343292236328, 0.03490447998046875, 0.03848552703857422, 0.04206657409667969, 0.045647621154785156, 0.049228668212890625, 0.052809715270996094, 0.05639076232910156, 0.05997180938720703, 0.0635528564453125, 0.06713390350341797, 0.07071495056152344, 0.0742959976196289, 0.07787704467773438, 0.08145809173583984, 0.08503913879394531, 0.08862018585205078, 0.09220123291015625, 0.09578227996826172, 0.09936332702636719, 0.10294437408447266, 0.10652542114257812, 0.1101064682006836, 0.11368751525878906, 0.11726856231689453, 0.120849609375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 7.0, 6.0, 15.0, 37.0, 65.0, 121.0, 204.0, 199.0, 165.0, 90.0, 59.0, 17.0, 13.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7364709377288818, -1.6499820947647095, -1.563493251800537, -1.4770045280456543, -1.390515685081482, -1.3040268421173096, -1.2175381183624268, -1.1310492753982544, -1.044560432434082, -0.9580715894699097, -0.8715828061103821, -0.7850940227508545, -0.6986051797866821, -0.6121163368225098, -0.5256275534629822, -0.4391387701034546, -0.3526499271392822, -0.26616111397743225, -0.17967230081558228, -0.0931834876537323, -0.006694674491882324, 0.07979413866996765, 0.16628295183181763, 0.2527717351913452, 0.3392605781555176, 0.42574939131736755, 0.5122382044792175, 0.5987269878387451, 0.6852158308029175, 0.7717046737670898, 0.8581934571266174, 0.944682240486145, 1.0311708450317383, 1.1176596879959106, 1.204148530960083, 1.2906372547149658, 1.3771260976791382, 1.4636149406433105, 1.5501036643981934, 1.6365925073623657, 1.723081350326538, 1.8095701932907104, 1.8960590362548828, 1.9825477600097656, 2.0690364837646484, 2.1555254459381104, 2.242014169692993, 2.328503131866455, 2.414991855621338, 2.5014805793762207, 2.5879695415496826, 2.6744582653045654, 2.7609472274780273, 2.84743595123291, 2.933924674987793, 3.020413398742676, 3.1069023609161377, 3.1933910846710205, 3.2798800468444824, 3.3663687705993652, 3.452857494354248, 3.53934645652771, 3.6258351802825928, 3.7123241424560547, 3.7988128662109375]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 0.0, 5.0, 6.0, 6.0, 12.0, 14.0, 9.0, 10.0, 23.0, 23.0, 18.0, 22.0, 21.0, 24.0, 30.0, 34.0, 45.0, 40.0, 28.0, 43.0, 48.0, 50.0, 26.0, 38.0, 23.0, 41.0, 34.0, 38.0, 26.0, 26.0, 28.0, 26.0, 22.0, 16.0, 23.0, 24.0, 15.0, 9.0, 14.0, 10.0, 7.0, 11.0, 7.0, 5.0, 6.0, 4.0, 2.0, 4.0, 3.0, 3.0, 2.0, 0.0, 3.0], "bins": [-0.8749426603317261, -0.8487026691436768, -0.8224627375602722, -0.7962227463722229, -0.7699827551841736, -0.743742823600769, -0.7175028324127197, -0.6912628412246704, -0.6650228500366211, -0.6387828588485718, -0.6125429272651672, -0.5863029360771179, -0.5600629448890686, -0.5338230133056641, -0.5075830221176147, -0.48134303092956543, -0.4551030993461609, -0.42886313796043396, -0.40262314677238464, -0.3763831853866577, -0.3501431941986084, -0.32390323281288147, -0.29766327142715454, -0.2714232802391052, -0.2451833188533783, -0.21894334256649017, -0.19270336627960205, -0.16646340489387512, -0.140223428606987, -0.11398345232009888, -0.08774349093437195, -0.061503514647483826, -0.03526347875595093, -0.009023506194353104, 0.01721646636724472, 0.043456435203552246, 0.06969641149044037, 0.09593638777732849, 0.12217634916305542, 0.14841632544994354, 0.17465630173683167, 0.2008962780237198, 0.2271362543106079, 0.25337621569633484, 0.27961617708206177, 0.3058561682701111, 0.332096129655838, 0.35833609104156494, 0.38457608222961426, 0.4108160436153412, 0.4370560348033905, 0.46329599618911743, 0.48953598737716675, 0.5157759189605713, 0.5420159101486206, 0.5682559013366699, 0.5944958925247192, 0.6207358837127686, 0.6469758152961731, 0.6732158064842224, 0.6994557976722717, 0.7256957292556763, 0.7519357204437256, 0.7781757116317749, 0.8044156432151794]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 8.0, 4.0, 8.0, 19.0, 29.0, 59.0, 86.0, 156.0, 278.0, 560.0, 1190.0, 2407.0, 5528.0, 13296.0, 36141.0, 136115.0, 2906313.0, 942090.0, 99955.0, 29485.0, 11089.0, 4745.0, 2293.0, 1111.0, 570.0, 295.0, 176.0, 117.0, 66.0, 32.0, 22.0, 12.0, 13.0, 7.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2164306640625, -0.20919227600097656, -0.20195388793945312, -0.1947154998779297, -0.18747711181640625, -0.1802387237548828, -0.17300033569335938, -0.16576194763183594, -0.1585235595703125, -0.15128517150878906, -0.14404678344726562, -0.1368083953857422, -0.12957000732421875, -0.12233161926269531, -0.11509323120117188, -0.10785484313964844, -0.100616455078125, -0.09337806701660156, -0.08613967895507812, -0.07890129089355469, -0.07166290283203125, -0.06442451477050781, -0.057186126708984375, -0.04994773864746094, -0.0427093505859375, -0.03547096252441406, -0.028232574462890625, -0.020994186401367188, -0.01375579833984375, -0.0065174102783203125, 0.000720977783203125, 0.007959365844726562, 0.01519775390625, 0.022436141967773438, 0.029674530029296875, 0.03691291809082031, 0.04415130615234375, 0.05138969421386719, 0.058628082275390625, 0.06586647033691406, 0.0731048583984375, 0.08034324645996094, 0.08758163452148438, 0.09482002258300781, 0.10205841064453125, 0.10929679870605469, 0.11653518676757812, 0.12377357482910156, 0.131011962890625, 0.13825035095214844, 0.14548873901367188, 0.1527271270751953, 0.15996551513671875, 0.1672039031982422, 0.17444229125976562, 0.18168067932128906, 0.1889190673828125, 0.19615745544433594, 0.20339584350585938, 0.2106342315673828, 0.21787261962890625, 0.2251110076904297, 0.23234939575195312, 0.23958778381347656, 0.246826171875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 6.0, 5.0, 5.0, 7.0, 9.0, 12.0, 11.0, 8.0, 14.0, 14.0, 25.0, 21.0, 23.0, 37.0, 47.0, 48.0, 56.0, 55.0, 45.0, 50.0, 44.0, 48.0, 43.0, 48.0, 42.0, 41.0, 29.0, 39.0, 38.0, 45.0, 14.0, 11.0, 21.0, 14.0, 8.0, 8.0, 6.0, 4.0, 3.0, 5.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.045928955078125, -0.04445981979370117, -0.042990684509277344, -0.041521549224853516, -0.04005241394042969, -0.03858327865600586, -0.03711414337158203, -0.0356450080871582, -0.034175872802734375, -0.03270673751831055, -0.03123760223388672, -0.02976846694946289, -0.028299331665039062, -0.026830196380615234, -0.025361061096191406, -0.023891925811767578, -0.02242279052734375, -0.020953655242919922, -0.019484519958496094, -0.018015384674072266, -0.016546249389648438, -0.01507711410522461, -0.013607978820800781, -0.012138843536376953, -0.010669708251953125, -0.009200572967529297, -0.007731437683105469, -0.006262302398681641, -0.0047931671142578125, -0.0033240318298339844, -0.0018548965454101562, -0.0003857612609863281, 0.0010833740234375, 0.002552509307861328, 0.004021644592285156, 0.005490779876708984, 0.0069599151611328125, 0.00842905044555664, 0.009898185729980469, 0.011367321014404297, 0.012836456298828125, 0.014305591583251953, 0.01577472686767578, 0.01724386215209961, 0.018712997436523438, 0.020182132720947266, 0.021651268005371094, 0.023120403289794922, 0.02458953857421875, 0.026058673858642578, 0.027527809143066406, 0.028996944427490234, 0.030466079711914062, 0.03193521499633789, 0.03340435028076172, 0.03487348556518555, 0.036342620849609375, 0.0378117561340332, 0.03928089141845703, 0.04075002670288086, 0.04221916198730469, 0.043688297271728516, 0.045157432556152344, 0.04662656784057617, 0.048095703125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 5.0, 2.0, 5.0, 9.0, 14.0, 24.0, 33.0, 45.0, 66.0, 101.0, 204.0, 384.0, 819.0, 1944.0, 5764.0, 20423.0, 111546.0, 3244837.0, 726777.0, 60989.0, 13334.0, 4006.0, 1525.0, 666.0, 280.0, 180.0, 96.0, 62.0, 57.0, 21.0, 18.0, 15.0, 7.0, 13.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.300537109375, -0.2884368896484375, -0.276336669921875, -0.2642364501953125, -0.25213623046875, -0.2400360107421875, -0.227935791015625, -0.2158355712890625, -0.2037353515625, -0.1916351318359375, -0.179534912109375, -0.1674346923828125, -0.15533447265625, -0.1432342529296875, -0.131134033203125, -0.1190338134765625, -0.10693359375, -0.0948333740234375, -0.082733154296875, -0.0706329345703125, -0.05853271484375, -0.0464324951171875, -0.034332275390625, -0.0222320556640625, -0.0101318359375, 0.0019683837890625, 0.014068603515625, 0.0261688232421875, 0.03826904296875, 0.0503692626953125, 0.062469482421875, 0.0745697021484375, 0.086669921875, 0.0987701416015625, 0.110870361328125, 0.1229705810546875, 0.13507080078125, 0.1471710205078125, 0.159271240234375, 0.1713714599609375, 0.1834716796875, 0.1955718994140625, 0.207672119140625, 0.2197723388671875, 0.23187255859375, 0.2439727783203125, 0.256072998046875, 0.2681732177734375, 0.2802734375, 0.2923736572265625, 0.304473876953125, 0.3165740966796875, 0.32867431640625, 0.3407745361328125, 0.352874755859375, 0.3649749755859375, 0.3770751953125, 0.3891754150390625, 0.401275634765625, 0.4133758544921875, 0.42547607421875, 0.4375762939453125, 0.449676513671875, 0.4617767333984375, 0.473876953125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 8.0, 3.0, 4.0, 7.0, 12.0, 22.0, 27.0, 48.0, 87.0, 161.0, 303.0, 1015.0, 1556.0, 366.0, 186.0, 92.0, 65.0, 28.0, 31.0, 19.0, 15.0, 7.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11920166015625, -0.1142587661743164, -0.10931587219238281, -0.10437297821044922, -0.09943008422851562, -0.09448719024658203, -0.08954429626464844, -0.08460140228271484, -0.07965850830078125, -0.07471561431884766, -0.06977272033691406, -0.06482982635498047, -0.059886932373046875, -0.05494403839111328, -0.05000114440917969, -0.045058250427246094, -0.0401153564453125, -0.035172462463378906, -0.030229568481445312, -0.02528667449951172, -0.020343780517578125, -0.015400886535644531, -0.010457992553710938, -0.005515098571777344, -0.00057220458984375, 0.004370689392089844, 0.009313583374023438, 0.014256477355957031, 0.019199371337890625, 0.02414226531982422, 0.029085159301757812, 0.034028053283691406, 0.038970947265625, 0.043913841247558594, 0.04885673522949219, 0.05379962921142578, 0.058742523193359375, 0.06368541717529297, 0.06862831115722656, 0.07357120513916016, 0.07851409912109375, 0.08345699310302734, 0.08839988708496094, 0.09334278106689453, 0.09828567504882812, 0.10322856903076172, 0.10817146301269531, 0.1131143569946289, 0.1180572509765625, 0.1230001449584961, 0.1279430389404297, 0.13288593292236328, 0.13782882690429688, 0.14277172088623047, 0.14771461486816406, 0.15265750885009766, 0.15760040283203125, 0.16254329681396484, 0.16748619079589844, 0.17242908477783203, 0.17737197875976562, 0.18231487274169922, 0.1872577667236328, 0.1922006607055664, 0.1971435546875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 11.0, 27.0, 54.0, 115.0, 166.0, 207.0, 162.0, 130.0, 70.0, 41.0, 15.0, 7.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2911453247070312, -1.2512078285217285, -1.2112702131271362, -1.1713327169418335, -1.1313951015472412, -1.0914576053619385, -1.0515199899673462, -1.0115824937820435, -0.971644937992096, -0.9317073822021484, -0.8917698264122009, -0.8518322706222534, -0.8118947744369507, -0.7719571590423584, -0.7320196628570557, -0.6920821070671082, -0.6521445512771606, -0.6122069954872131, -0.5722694396972656, -0.5323318839073181, -0.492394357919693, -0.4524568021297455, -0.41251927614212036, -0.37258172035217285, -0.33264416456222534, -0.29270660877227783, -0.2527690529823303, -0.2128315269947052, -0.1728939712047577, -0.13295641541481018, -0.09301887452602386, -0.05308133363723755, -0.013143777847290039, 0.026793770492076874, 0.06673131883144379, 0.1066688671708107, 0.1466064155101776, 0.18654397130012512, 0.22648151218891144, 0.26641905307769775, 0.30635660886764526, 0.3462941646575928, 0.3862317204475403, 0.4261692464351654, 0.4661068022251129, 0.5060443878173828, 0.5459818840026855, 0.5859194397926331, 0.6258569955825806, 0.6657945513725281, 0.7057321071624756, 0.7456696629524231, 0.7856072187423706, 0.8255447149276733, 0.8654822707176208, 0.9054198265075684, 0.9453573822975159, 0.9852949380874634, 1.0252324342727661, 1.0651700496673584, 1.1051075458526611, 1.1450451612472534, 1.1849826574325562, 1.2249202728271484, 1.2648577690124512]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 5.0, 1.0, 5.0, 7.0, 6.0, 4.0, 5.0, 8.0, 11.0, 3.0, 12.0, 15.0, 15.0, 14.0, 14.0, 22.0, 14.0, 26.0, 24.0, 24.0, 30.0, 33.0, 37.0, 36.0, 34.0, 19.0, 27.0, 43.0, 41.0, 27.0, 54.0, 32.0, 29.0, 36.0, 22.0, 30.0, 27.0, 30.0, 32.0, 17.0, 21.0, 18.0, 10.0, 14.0, 13.0, 7.0, 10.0, 10.0, 9.0, 8.0, 3.0, 5.0, 7.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.33279120922088623, -0.3222312331199646, -0.31167125701904297, -0.30111128091812134, -0.2905513048171997, -0.2799912989139557, -0.26943132281303406, -0.2588713467121124, -0.2483113706111908, -0.23775139451026917, -0.22719141840934753, -0.2166314274072647, -0.20607145130634308, -0.19551147520542145, -0.18495148420333862, -0.174391508102417, -0.16383153200149536, -0.15327155590057373, -0.1427115797996521, -0.13215158879756927, -0.12159161269664764, -0.11103163659572601, -0.10047165304422379, -0.08991166949272156, -0.07935169339179993, -0.0687917172908783, -0.05823173373937607, -0.04767175391316414, -0.03711177408695221, -0.02655179426074028, -0.01599181443452835, -0.005431830883026123, 0.005128145217895508, 0.015688125044107437, 0.026248104870319366, 0.036808084696531296, 0.047368064522743225, 0.057928044348955154, 0.06848802417516708, 0.07904800772666931, 0.08960798382759094, 0.10016795992851257, 0.1107279434800148, 0.12128792703151703, 0.13184790313243866, 0.1424078792333603, 0.15296787023544312, 0.16352784633636475, 0.17408782243728638, 0.184647798538208, 0.19520777463912964, 0.20576776564121246, 0.2163277417421341, 0.22688771784305573, 0.23744770884513855, 0.24800768494606018, 0.2585676610469818, 0.26912763714790344, 0.2796876132488251, 0.2902475893497467, 0.3008075952529907, 0.31136757135391235, 0.321927547454834, 0.3324875235557556, 0.34304749965667725]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 7.0, 3.0, 6.0, 4.0, 3.0, 12.0, 13.0, 22.0, 33.0, 33.0, 57.0, 104.0, 151.0, 290.0, 580.0, 1090.0, 2317.0, 4703.0, 9492.0, 18947.0, 37169.0, 105279.0, 528488.0, 234875.0, 53932.0, 25254.0, 12956.0, 6298.0, 3260.0, 1511.0, 703.0, 401.0, 201.0, 134.0, 75.0, 38.0, 27.0, 26.0, 15.0, 18.0, 6.0, 9.0, 4.0, 8.0, 2.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.1798095703125, -0.1743144989013672, -0.16881942749023438, -0.16332435607910156, -0.15782928466796875, -0.15233421325683594, -0.14683914184570312, -0.1413440704345703, -0.1358489990234375, -0.1303539276123047, -0.12485885620117188, -0.11936378479003906, -0.11386871337890625, -0.10837364196777344, -0.10287857055664062, -0.09738349914550781, -0.091888427734375, -0.08639335632324219, -0.08089828491210938, -0.07540321350097656, -0.06990814208984375, -0.06441307067871094, -0.058917999267578125, -0.05342292785644531, -0.0479278564453125, -0.04243278503417969, -0.036937713623046875, -0.03144264221191406, -0.02594757080078125, -0.020452499389648438, -0.014957427978515625, -0.009462356567382812, -0.00396728515625, 0.0015277862548828125, 0.007022857666015625, 0.012517929077148438, 0.01801300048828125, 0.023508071899414062, 0.029003143310546875, 0.03449821472167969, 0.0399932861328125, 0.04548835754394531, 0.050983428955078125, 0.05647850036621094, 0.06197357177734375, 0.06746864318847656, 0.07296371459960938, 0.07845878601074219, 0.083953857421875, 0.08944892883300781, 0.09494400024414062, 0.10043907165527344, 0.10593414306640625, 0.11142921447753906, 0.11692428588867188, 0.12241935729980469, 0.1279144287109375, 0.1334095001220703, 0.13890457153320312, 0.14439964294433594, 0.14989471435546875, 0.15538978576660156, 0.16088485717773438, 0.1663799285888672, 0.171875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 6.0, 9.0, 16.0, 12.0, 13.0, 17.0, 18.0, 25.0, 25.0, 23.0, 36.0, 43.0, 45.0, 42.0, 47.0, 60.0, 69.0, 37.0, 42.0, 48.0, 50.0, 37.0, 39.0, 42.0, 31.0, 25.0, 24.0, 18.0, 18.0, 15.0, 18.0, 7.0, 12.0, 7.0, 5.0, 2.0, 8.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.052490234375, -0.05099678039550781, -0.049503326416015625, -0.04800987243652344, -0.04651641845703125, -0.04502296447753906, -0.043529510498046875, -0.04203605651855469, -0.0405426025390625, -0.03904914855957031, -0.037555694580078125, -0.03606224060058594, -0.03456878662109375, -0.03307533264160156, -0.031581878662109375, -0.030088424682617188, -0.028594970703125, -0.027101516723632812, -0.025608062744140625, -0.024114608764648438, -0.02262115478515625, -0.021127700805664062, -0.019634246826171875, -0.018140792846679688, -0.0166473388671875, -0.015153884887695312, -0.013660430908203125, -0.012166976928710938, -0.01067352294921875, -0.009180068969726562, -0.007686614990234375, -0.0061931610107421875, -0.00469970703125, -0.0032062530517578125, -0.001712799072265625, -0.0002193450927734375, 0.00127410888671875, 0.0027675628662109375, 0.004261016845703125, 0.0057544708251953125, 0.0072479248046875, 0.008741378784179688, 0.010234832763671875, 0.011728286743164062, 0.01322174072265625, 0.014715194702148438, 0.016208648681640625, 0.017702102661132812, 0.019195556640625, 0.020689010620117188, 0.022182464599609375, 0.023675918579101562, 0.02516937255859375, 0.026662826538085938, 0.028156280517578125, 0.029649734497070312, 0.0311431884765625, 0.03263664245605469, 0.034130096435546875, 0.03562355041503906, 0.03711700439453125, 0.03861045837402344, 0.040103912353515625, 0.04159736633300781, 0.0430908203125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0, 2.0, 5.0, 6.0, 10.0, 6.0, 12.0, 22.0, 26.0, 31.0, 46.0, 63.0, 75.0, 104.0, 173.0, 282.0, 555.0, 1313.0, 2872.0, 7346.0, 18918.0, 45951.0, 259189.0, 603094.0, 65032.0, 25785.0, 10310.0, 3907.0, 1623.0, 776.0, 350.0, 206.0, 139.0, 88.0, 53.0, 48.0, 41.0, 24.0, 17.0, 19.0, 6.0, 8.0, 7.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.232421875, -0.22496604919433594, -0.21751022338867188, -0.2100543975830078, -0.20259857177734375, -0.1951427459716797, -0.18768692016601562, -0.18023109436035156, -0.1727752685546875, -0.16531944274902344, -0.15786361694335938, -0.1504077911376953, -0.14295196533203125, -0.1354961395263672, -0.12804031372070312, -0.12058448791503906, -0.113128662109375, -0.10567283630371094, -0.09821701049804688, -0.09076118469238281, -0.08330535888671875, -0.07584953308105469, -0.06839370727539062, -0.06093788146972656, -0.0534820556640625, -0.04602622985839844, -0.038570404052734375, -0.031114578247070312, -0.02365875244140625, -0.016202926635742188, -0.008747100830078125, -0.0012912750244140625, 0.00616455078125, 0.013620376586914062, 0.021076202392578125, 0.028532028198242188, 0.03598785400390625, 0.04344367980957031, 0.050899505615234375, 0.05835533142089844, 0.0658111572265625, 0.07326698303222656, 0.08072280883789062, 0.08817863464355469, 0.09563446044921875, 0.10309028625488281, 0.11054611206054688, 0.11800193786621094, 0.125457763671875, 0.13291358947753906, 0.14036941528320312, 0.1478252410888672, 0.15528106689453125, 0.1627368927001953, 0.17019271850585938, 0.17764854431152344, 0.1851043701171875, 0.19256019592285156, 0.20001602172851562, 0.2074718475341797, 0.21492767333984375, 0.2223834991455078, 0.22983932495117188, 0.23729515075683594, 0.2447509765625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 5.0, 3.0, 2.0, 4.0, 12.0, 16.0, 16.0, 18.0, 26.0, 38.0, 38.0, 41.0, 44.0, 53.0, 56.0, 70.0, 69.0, 59.0, 62.0, 69.0, 52.0, 43.0, 36.0, 36.0, 33.0, 21.0, 19.0, 16.0, 12.0, 5.0, 3.0, 6.0, 8.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.28271484375, -0.2740974426269531, -0.26548004150390625, -0.2568626403808594, -0.2482452392578125, -0.23962783813476562, -0.23101043701171875, -0.22239303588867188, -0.213775634765625, -0.20515823364257812, -0.19654083251953125, -0.18792343139648438, -0.1793060302734375, -0.17068862915039062, -0.16207122802734375, -0.15345382690429688, -0.14483642578125, -0.13621902465820312, -0.12760162353515625, -0.11898422241210938, -0.1103668212890625, -0.10174942016601562, -0.09313201904296875, -0.08451461791992188, -0.075897216796875, -0.06727981567382812, -0.05866241455078125, -0.050045013427734375, -0.0414276123046875, -0.032810211181640625, -0.02419281005859375, -0.015575408935546875, -0.0069580078125, 0.001659393310546875, 0.01027679443359375, 0.018894195556640625, 0.0275115966796875, 0.036128997802734375, 0.04474639892578125, 0.053363800048828125, 0.061981201171875, 0.07059860229492188, 0.07921600341796875, 0.08783340454101562, 0.0964508056640625, 0.10506820678710938, 0.11368560791015625, 0.12230300903320312, 0.13092041015625, 0.13953781127929688, 0.14815521240234375, 0.15677261352539062, 0.1653900146484375, 0.17400741577148438, 0.18262481689453125, 0.19124221801757812, 0.199859619140625, 0.20847702026367188, 0.21709442138671875, 0.22571182250976562, 0.2343292236328125, 0.24294662475585938, 0.25156402587890625, 0.2601814270019531, 0.268798828125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 6.0, 6.0, 5.0, 10.0, 23.0, 17.0, 43.0, 41.0, 86.0, 102.0, 138.0, 233.0, 280.0, 438.0, 712.0, 1173.0, 2030.0, 3761.0, 8052.0, 21196.0, 62676.0, 608965.0, 266452.0, 42903.0, 15290.0, 6278.0, 2992.0, 1671.0, 1000.0, 684.0, 429.0, 280.0, 177.0, 107.0, 85.0, 74.0, 46.0, 30.0, 19.0, 11.0, 9.0, 9.0, 6.0, 4.0, 5.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.125732421875, -0.12151908874511719, -0.11730575561523438, -0.11309242248535156, -0.10887908935546875, -0.10466575622558594, -0.10045242309570312, -0.09623908996582031, -0.0920257568359375, -0.08781242370605469, -0.08359909057617188, -0.07938575744628906, -0.07517242431640625, -0.07095909118652344, -0.06674575805664062, -0.06253242492675781, -0.058319091796875, -0.05410575866699219, -0.049892425537109375, -0.04567909240722656, -0.04146575927734375, -0.03725242614746094, -0.033039093017578125, -0.028825759887695312, -0.0246124267578125, -0.020399093627929688, -0.016185760498046875, -0.011972427368164062, -0.00775909423828125, -0.0035457611083984375, 0.000667572021484375, 0.0048809051513671875, 0.00909423828125, 0.013307571411132812, 0.017520904541015625, 0.021734237670898438, 0.02594757080078125, 0.030160903930664062, 0.034374237060546875, 0.03858757019042969, 0.0428009033203125, 0.04701423645019531, 0.051227569580078125, 0.05544090270996094, 0.05965423583984375, 0.06386756896972656, 0.06808090209960938, 0.07229423522949219, 0.076507568359375, 0.08072090148925781, 0.08493423461914062, 0.08914756774902344, 0.09336090087890625, 0.09757423400878906, 0.10178756713867188, 0.10600090026855469, 0.1102142333984375, 0.11442756652832031, 0.11864089965820312, 0.12285423278808594, 0.12706756591796875, 0.13128089904785156, 0.13549423217773438, 0.1397075653076172, 0.1439208984375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 1.0, 0.0, 2.0, 2.0, 6.0, 2.0, 3.0, 4.0, 2.0, 6.0, 5.0, 8.0, 5.0, 9.0, 1.0, 8.0, 7.0, 24.0, 27.0, 18.0, 43.0, 53.0, 65.0, 80.0, 96.0, 86.0, 94.0, 76.0, 63.0, 43.0, 44.0, 21.0, 19.0, 16.0, 15.0, 11.0, 7.0, 9.0, 5.0, 4.0, 2.0, 6.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.204843521118164e-05, -5.9856101870536804e-05, -5.766376852989197e-05, -5.547143518924713e-05, -5.3279101848602295e-05, -5.108676850795746e-05, -4.889443516731262e-05, -4.6702101826667786e-05, -4.450976848602295e-05, -4.231743514537811e-05, -4.0125101804733276e-05, -3.793276846408844e-05, -3.5740435123443604e-05, -3.354810178279877e-05, -3.135576844215393e-05, -2.9163435101509094e-05, -2.6971101760864258e-05, -2.477876842021942e-05, -2.2586435079574585e-05, -2.039410173892975e-05, -1.8201768398284912e-05, -1.6009435057640076e-05, -1.381710171699524e-05, -1.1624768376350403e-05, -9.432435035705566e-06, -7.24010169506073e-06, -5.0477683544158936e-06, -2.855435013771057e-06, -6.631016731262207e-07, 1.5292316675186157e-06, 3.721565008163452e-06, 5.9138983488082886e-06, 8.106231689453125e-06, 1.0298565030097961e-05, 1.2490898370742798e-05, 1.4683231711387634e-05, 1.687556505203247e-05, 1.9067898392677307e-05, 2.1260231733322144e-05, 2.345256507396698e-05, 2.5644898414611816e-05, 2.7837231755256653e-05, 3.002956509590149e-05, 3.2221898436546326e-05, 3.441423177719116e-05, 3.6606565117836e-05, 3.8798898458480835e-05, 4.099123179912567e-05, 4.318356513977051e-05, 4.5375898480415344e-05, 4.756823182106018e-05, 4.976056516170502e-05, 5.1952898502349854e-05, 5.414523184299469e-05, 5.6337565183639526e-05, 5.852989852428436e-05, 6.07222318649292e-05, 6.291456520557404e-05, 6.510689854621887e-05, 6.729923188686371e-05, 6.949156522750854e-05, 7.168389856815338e-05, 7.387623190879822e-05, 7.606856524944305e-05, 7.826089859008789e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 7.0, 5.0, 7.0, 7.0, 14.0, 9.0, 33.0, 41.0, 72.0, 75.0, 154.0, 276.0, 428.0, 768.0, 1584.0, 3019.0, 7579.0, 23173.0, 92868.0, 781752.0, 98416.0, 23646.0, 7862.0, 3265.0, 1561.0, 810.0, 447.0, 270.0, 154.0, 91.0, 55.0, 40.0, 23.0, 18.0, 10.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.1810302734375, -0.17578506469726562, -0.17053985595703125, -0.16529464721679688, -0.1600494384765625, -0.15480422973632812, -0.14955902099609375, -0.14431381225585938, -0.139068603515625, -0.13382339477539062, -0.12857818603515625, -0.12333297729492188, -0.1180877685546875, -0.11284255981445312, -0.10759735107421875, -0.10235214233398438, -0.09710693359375, -0.09186172485351562, -0.08661651611328125, -0.08137130737304688, -0.0761260986328125, -0.07088088989257812, -0.06563568115234375, -0.060390472412109375, -0.055145263671875, -0.049900054931640625, -0.04465484619140625, -0.039409637451171875, -0.0341644287109375, -0.028919219970703125, -0.02367401123046875, -0.018428802490234375, -0.01318359375, -0.007938385009765625, -0.00269317626953125, 0.002552032470703125, 0.0077972412109375, 0.013042449951171875, 0.01828765869140625, 0.023532867431640625, 0.028778076171875, 0.034023284912109375, 0.03926849365234375, 0.044513702392578125, 0.0497589111328125, 0.055004119873046875, 0.06024932861328125, 0.06549453735351562, 0.07073974609375, 0.07598495483398438, 0.08123016357421875, 0.08647537231445312, 0.0917205810546875, 0.09696578979492188, 0.10221099853515625, 0.10745620727539062, 0.112701416015625, 0.11794662475585938, 0.12319183349609375, 0.12843704223632812, 0.1336822509765625, 0.13892745971679688, 0.14417266845703125, 0.14941787719726562, 0.1546630859375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 5.0, 11.0, 6.0, 15.0, 8.0, 18.0, 20.0, 19.0, 39.0, 88.0, 233.0, 259.0, 124.0, 46.0, 28.0, 18.0, 15.0, 11.0, 9.0, 3.0, 5.0, 8.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2208251953125, -0.2150249481201172, -0.20922470092773438, -0.20342445373535156, -0.19762420654296875, -0.19182395935058594, -0.18602371215820312, -0.1802234649658203, -0.1744232177734375, -0.1686229705810547, -0.16282272338867188, -0.15702247619628906, -0.15122222900390625, -0.14542198181152344, -0.13962173461914062, -0.1338214874267578, -0.128021240234375, -0.12222099304199219, -0.11642074584960938, -0.11062049865722656, -0.10482025146484375, -0.09902000427246094, -0.09321975708007812, -0.08741950988769531, -0.0816192626953125, -0.07581901550292969, -0.07001876831054688, -0.06421852111816406, -0.05841827392578125, -0.05261802673339844, -0.046817779541015625, -0.04101753234863281, -0.03521728515625, -0.029417037963867188, -0.023616790771484375, -0.017816543579101562, -0.01201629638671875, -0.0062160491943359375, -0.000415802001953125, 0.0053844451904296875, 0.0111846923828125, 0.016984939575195312, 0.022785186767578125, 0.028585433959960938, 0.03438568115234375, 0.04018592834472656, 0.045986175537109375, 0.05178642272949219, 0.057586669921875, 0.06338691711425781, 0.06918716430664062, 0.07498741149902344, 0.08078765869140625, 0.08658790588378906, 0.09238815307617188, 0.09818840026855469, 0.1039886474609375, 0.10978889465332031, 0.11558914184570312, 0.12138938903808594, 0.12718963623046875, 0.13298988342285156, 0.13879013061523438, 0.1445903778076172, 0.150390625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 4.0, 9.0, 31.0, 77.0, 137.0, 206.0, 217.0, 154.0, 91.0, 57.0, 11.0, 16.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9053446054458618, -0.815235435962677, -0.7251262664794922, -0.6350170969963074, -0.5449079275131226, -0.45479875802993774, -0.36468958854675293, -0.2745804190635681, -0.1844712495803833, -0.09436208009719849, -0.004252910614013672, 0.08585625886917114, 0.17596542835235596, 0.26607459783554077, 0.3561837673187256, 0.4462929368019104, 0.5364021062850952, 0.62651127576828, 0.7166204452514648, 0.8067296147346497, 0.8968387842178345, 0.9869479537010193, 1.077057123184204, 1.1671662330627441, 1.2572754621505737, 1.3473846912384033, 1.4374938011169434, 1.5276029109954834, 1.617712140083313, 1.7078213691711426, 1.7979304790496826, 1.8880395889282227, 1.9781489372253418, 2.068258047103882, 2.158367156982422, 2.248476505279541, 2.338585615158081, 2.428694725036621, 2.5188040733337402, 2.6089131832122803, 2.6990222930908203, 2.7891314029693604, 2.8792405128479004, 2.9693498611450195, 3.0594589710235596, 3.1495680809020996, 3.2396774291992188, 3.329786539077759, 3.419895648956299, 3.510004758834839, 3.600113868713379, 3.690223217010498, 3.780332326889038, 3.870441436767578, 3.9605507850646973, 4.050659656524658, 4.140769004821777, 4.2308783531188965, 4.320987224578857, 4.411096572875977, 4.5012054443359375, 4.591314792633057, 4.681424140930176, 4.771533012390137, 4.861642360687256]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 6.0, 5.0, 4.0, 3.0, 14.0, 6.0, 9.0, 7.0, 6.0, 18.0, 14.0, 15.0, 19.0, 30.0, 30.0, 18.0, 35.0, 34.0, 36.0, 31.0, 41.0, 33.0, 46.0, 52.0, 32.0, 43.0, 37.0, 33.0, 36.0, 28.0, 32.0, 36.0, 21.0, 27.0, 22.0, 18.0, 22.0, 21.0, 13.0, 15.0, 12.0, 9.0, 14.0, 7.0, 9.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-1.0460615158081055, -1.0176987648010254, -0.9893359541893005, -0.9609732031822205, -0.9326103925704956, -0.9042476415634155, -0.8758848905563354, -0.8475220799446106, -0.8191593289375305, -0.7907965779304504, -0.7624337673187256, -0.7340710163116455, -0.7057082056999207, -0.6773454546928406, -0.6489826440811157, -0.6206198930740356, -0.5922571420669556, -0.5638943910598755, -0.5355315804481506, -0.5071688294410706, -0.4788060486316681, -0.4504432678222656, -0.42208048701286316, -0.3937177062034607, -0.36535489559173584, -0.3369921147823334, -0.3086293339729309, -0.28026658296585083, -0.25190380215644836, -0.2235410213470459, -0.19517824053764343, -0.16681547462940216, -0.1384527087211609, -0.11008993536233902, -0.08172716200351715, -0.053364381194114685, -0.025001607835292816, 0.0033611655235290527, 0.03172394633293152, 0.06008671224117279, 0.08844949305057526, 0.11681226640939713, 0.145175039768219, 0.17353782057762146, 0.20190060138702393, 0.2302633672952652, 0.25862616300582886, 0.28698891401290894, 0.3153516948223114, 0.34371447563171387, 0.37207725644111633, 0.4004400372505188, 0.4288027882575989, 0.45716556906700134, 0.4855283498764038, 0.5138911008834839, 0.5422539114952087, 0.5706166625022888, 0.5989794731140137, 0.6273422241210938, 0.6557050347328186, 0.6840677857398987, 0.7124305963516235, 0.7407933473587036, 0.7691560983657837]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 7.0, 7.0, 12.0, 10.0, 37.0, 46.0, 75.0, 119.0, 186.0, 332.0, 580.0, 1087.0, 2152.0, 4182.0, 8643.0, 19959.0, 52269.0, 213105.0, 3411347.0, 364186.0, 70298.0, 24489.0, 10452.0, 5023.0, 2510.0, 1364.0, 707.0, 387.0, 255.0, 167.0, 109.0, 57.0, 40.0, 27.0, 20.0, 10.0, 8.0, 11.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.222900390625, -0.214202880859375, -0.20550537109375, -0.196807861328125, -0.1881103515625, -0.179412841796875, -0.17071533203125, -0.162017822265625, -0.1533203125, -0.144622802734375, -0.13592529296875, -0.127227783203125, -0.1185302734375, -0.109832763671875, -0.10113525390625, -0.092437744140625, -0.083740234375, -0.075042724609375, -0.06634521484375, -0.057647705078125, -0.0489501953125, -0.040252685546875, -0.03155517578125, -0.022857666015625, -0.01416015625, -0.005462646484375, 0.00323486328125, 0.011932373046875, 0.0206298828125, 0.029327392578125, 0.03802490234375, 0.046722412109375, 0.055419921875, 0.064117431640625, 0.07281494140625, 0.081512451171875, 0.0902099609375, 0.098907470703125, 0.10760498046875, 0.116302490234375, 0.125, 0.133697509765625, 0.14239501953125, 0.151092529296875, 0.1597900390625, 0.168487548828125, 0.17718505859375, 0.185882568359375, 0.194580078125, 0.203277587890625, 0.21197509765625, 0.220672607421875, 0.2293701171875, 0.238067626953125, 0.24676513671875, 0.255462646484375, 0.26416015625, 0.272857666015625, 0.28155517578125, 0.290252685546875, 0.2989501953125, 0.307647705078125, 0.31634521484375, 0.325042724609375, 0.333740234375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 2.0, 1.0, 5.0, 3.0, 5.0, 11.0, 7.0, 9.0, 9.0, 15.0, 13.0, 21.0, 13.0, 23.0, 28.0, 37.0, 27.0, 30.0, 44.0, 39.0, 52.0, 47.0, 51.0, 54.0, 47.0, 42.0, 46.0, 32.0, 35.0, 36.0, 36.0, 26.0, 23.0, 22.0, 23.0, 20.0, 15.0, 10.0, 9.0, 4.0, 9.0, 6.0, 5.0, 3.0, 5.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.048583984375, -0.04720878601074219, -0.045833587646484375, -0.04445838928222656, -0.04308319091796875, -0.04170799255371094, -0.040332794189453125, -0.03895759582519531, -0.0375823974609375, -0.03620719909667969, -0.034832000732421875, -0.03345680236816406, -0.03208160400390625, -0.030706405639648438, -0.029331207275390625, -0.027956008911132812, -0.026580810546875, -0.025205612182617188, -0.023830413818359375, -0.022455215454101562, -0.02108001708984375, -0.019704818725585938, -0.018329620361328125, -0.016954421997070312, -0.0155792236328125, -0.014204025268554688, -0.012828826904296875, -0.011453628540039062, -0.01007843017578125, -0.008703231811523438, -0.007328033447265625, -0.0059528350830078125, -0.00457763671875, -0.0032024383544921875, -0.001827239990234375, -0.0004520416259765625, 0.00092315673828125, 0.0022983551025390625, 0.003673553466796875, 0.0050487518310546875, 0.0064239501953125, 0.0077991485595703125, 0.009174346923828125, 0.010549545288085938, 0.01192474365234375, 0.013299942016601562, 0.014675140380859375, 0.016050338745117188, 0.017425537109375, 0.018800735473632812, 0.020175933837890625, 0.021551132202148438, 0.02292633056640625, 0.024301528930664062, 0.025676727294921875, 0.027051925659179688, 0.0284271240234375, 0.029802322387695312, 0.031177520751953125, 0.03255271911621094, 0.03392791748046875, 0.03530311584472656, 0.036678314208984375, 0.03805351257324219, 0.0394287109375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 7.0, 14.0, 11.0, 30.0, 23.0, 36.0, 46.0, 58.0, 129.0, 221.0, 449.0, 1084.0, 3324.0, 12413.0, 67241.0, 3108118.0, 937155.0, 49369.0, 9814.0, 2830.0, 963.0, 404.0, 198.0, 98.0, 86.0, 51.0, 26.0, 22.0, 15.0, 12.0, 4.0, 3.0, 7.0, 6.0, 3.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6640625, -0.6455764770507812, -0.6270904541015625, -0.6086044311523438, -0.590118408203125, -0.5716323852539062, -0.5531463623046875, -0.5346603393554688, -0.51617431640625, -0.49768829345703125, -0.4792022705078125, -0.46071624755859375, -0.442230224609375, -0.42374420166015625, -0.4052581787109375, -0.38677215576171875, -0.3682861328125, -0.34980010986328125, -0.3313140869140625, -0.31282806396484375, -0.294342041015625, -0.27585601806640625, -0.2573699951171875, -0.23888397216796875, -0.22039794921875, -0.20191192626953125, -0.1834259033203125, -0.16493988037109375, -0.146453857421875, -0.12796783447265625, -0.1094818115234375, -0.09099578857421875, -0.072509765625, -0.05402374267578125, -0.0355377197265625, -0.01705169677734375, 0.001434326171875, 0.01992034912109375, 0.0384063720703125, 0.05689239501953125, 0.07537841796875, 0.09386444091796875, 0.1123504638671875, 0.13083648681640625, 0.149322509765625, 0.16780853271484375, 0.1862945556640625, 0.20478057861328125, 0.2232666015625, 0.24175262451171875, 0.2602386474609375, 0.27872467041015625, 0.297210693359375, 0.31569671630859375, 0.3341827392578125, 0.35266876220703125, 0.37115478515625, 0.38964080810546875, 0.4081268310546875, 0.42661285400390625, 0.445098876953125, 0.46358489990234375, 0.4820709228515625, 0.5005569458007812, 0.51904296875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 7.0, 15.0, 17.0, 18.0, 27.0, 53.0, 107.0, 230.0, 866.0, 2064.0, 349.0, 147.0, 74.0, 48.0, 15.0, 16.0, 7.0, 9.0, 4.0, 4.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27978515625, -0.2724609375, -0.26513671875, -0.2578125, -0.25048828125, -0.2431640625, -0.23583984375, -0.228515625, -0.22119140625, -0.2138671875, -0.20654296875, -0.19921875, -0.19189453125, -0.1845703125, -0.17724609375, -0.169921875, -0.16259765625, -0.1552734375, -0.14794921875, -0.140625, -0.13330078125, -0.1259765625, -0.11865234375, -0.111328125, -0.10400390625, -0.0966796875, -0.08935546875, -0.08203125, -0.07470703125, -0.0673828125, -0.06005859375, -0.052734375, -0.04541015625, -0.0380859375, -0.03076171875, -0.0234375, -0.01611328125, -0.0087890625, -0.00146484375, 0.005859375, 0.01318359375, 0.0205078125, 0.02783203125, 0.03515625, 0.04248046875, 0.0498046875, 0.05712890625, 0.064453125, 0.07177734375, 0.0791015625, 0.08642578125, 0.09375, 0.10107421875, 0.1083984375, 0.11572265625, 0.123046875, 0.13037109375, 0.1376953125, 0.14501953125, 0.15234375, 0.15966796875, 0.1669921875, 0.17431640625, 0.181640625, 0.18896484375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 30.0, 52.0, 146.0, 234.0, 259.0, 162.0, 76.0, 34.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5402299165725708, -1.4762042760849, -1.4121785163879395, -1.3481528759002686, -1.2841272354125977, -1.2201015949249268, -1.1560758352279663, -1.0920501947402954, -1.028024435043335, -0.9639987349510193, -0.8999730944633484, -0.8359473943710327, -0.7719217538833618, -0.7078960537910461, -0.6438703536987305, -0.5798447132110596, -0.5158190727233887, -0.4517934024333954, -0.3877677321434021, -0.3237420320510864, -0.25971636176109314, -0.19569069147109985, -0.13166499137878418, -0.0676393210887909, -0.0036136507987976074, 0.060412026941776276, 0.12443770468235016, 0.18846338987350464, 0.2524890601634979, 0.3165147304534912, 0.3805404305458069, 0.44456610083580017, 0.508591890335083, 0.5726175904273987, 0.6366432309150696, 0.7006689310073853, 0.7646945714950562, 0.8287202715873718, 0.8927459716796875, 0.9567716121673584, 1.0207972526550293, 1.0848228931427002, 1.1488486528396606, 1.2128742933273315, 1.2768999338150024, 1.340925693511963, 1.4049513339996338, 1.4689769744873047, 1.5330027341842651, 1.597028374671936, 1.6610541343688965, 1.7250797748565674, 1.7891054153442383, 1.8531310558319092, 1.9171568155288696, 1.9811824560165405, 2.045208215713501, 2.109233856201172, 2.1732594966888428, 2.2372851371765137, 2.3013110160827637, 2.3653366565704346, 2.4293622970581055, 2.4933879375457764, 2.5574135780334473]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 1.0, 7.0, 5.0, 7.0, 6.0, 7.0, 11.0, 14.0, 17.0, 19.0, 21.0, 26.0, 26.0, 33.0, 44.0, 44.0, 38.0, 40.0, 36.0, 46.0, 33.0, 55.0, 37.0, 45.0, 32.0, 31.0, 40.0, 37.0, 22.0, 27.0, 29.0, 28.0, 17.0, 16.0, 16.0, 14.0, 13.0, 12.0, 8.0, 11.0, 7.0, 9.0, 6.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4492684602737427, -0.435070663690567, -0.42087286710739136, -0.4066750705242157, -0.39247727394104004, -0.37827950716018677, -0.3640817105770111, -0.34988391399383545, -0.3356861174106598, -0.32148832082748413, -0.30729052424430847, -0.2930927276611328, -0.27889496088027954, -0.2646971344947815, -0.2504993677139282, -0.23630157113075256, -0.2221037745475769, -0.20790597796440125, -0.19370818138122559, -0.17951039969921112, -0.16531260311603546, -0.1511148065328598, -0.13691702485084534, -0.12271922826766968, -0.10852143168449402, -0.09432363510131836, -0.0801258459687233, -0.06592805683612823, -0.051730260252952576, -0.037532463669776917, -0.023334674537181854, -0.009136885404586792, 0.005060911178588867, 0.019258704036474228, 0.03345649689435959, 0.04765428975224495, 0.06185208261013031, 0.07604987919330597, 0.09024766832590103, 0.1044454574584961, 0.11864325404167175, 0.1328410506248474, 0.14703884720802307, 0.16123662889003754, 0.1754344254732132, 0.18963222205638885, 0.20383000373840332, 0.21802780032157898, 0.23222559690475464, 0.2464233934879303, 0.26062119007110596, 0.2748189866542816, 0.2890167832374573, 0.30321455001831055, 0.3174123466014862, 0.33161014318466187, 0.3458079397678375, 0.3600057363510132, 0.37420353293418884, 0.3884013295173645, 0.4025990962982178, 0.4167969226837158, 0.4309946894645691, 0.44519248604774475, 0.4593902826309204]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 11.0, 6.0, 8.0, 13.0, 11.0, 15.0, 33.0, 39.0, 63.0, 82.0, 107.0, 174.0, 259.0, 416.0, 647.0, 1110.0, 1980.0, 3226.0, 5651.0, 9819.0, 16639.0, 28372.0, 47405.0, 78956.0, 138817.0, 255778.0, 200036.0, 105649.0, 61966.0, 37586.0, 22025.0, 13205.0, 7503.0, 4392.0, 2602.0, 1493.0, 890.0, 543.0, 353.0, 216.0, 138.0, 86.0, 74.0, 49.0, 32.0, 26.0, 14.0, 13.0, 15.0, 6.0, 5.0, 7.0, 1.0, 4.0], "bins": [-0.1546630859375, -0.15033912658691406, -0.14601516723632812, -0.1416912078857422, -0.13736724853515625, -0.1330432891845703, -0.12871932983398438, -0.12439537048339844, -0.1200714111328125, -0.11574745178222656, -0.11142349243164062, -0.10709953308105469, -0.10277557373046875, -0.09845161437988281, -0.09412765502929688, -0.08980369567871094, -0.085479736328125, -0.08115577697753906, -0.07683181762695312, -0.07250785827636719, -0.06818389892578125, -0.06385993957519531, -0.059535980224609375, -0.05521202087402344, -0.0508880615234375, -0.04656410217285156, -0.042240142822265625, -0.03791618347167969, -0.03359222412109375, -0.029268264770507812, -0.024944305419921875, -0.020620346069335938, -0.01629638671875, -0.011972427368164062, -0.007648468017578125, -0.0033245086669921875, 0.00099945068359375, 0.0053234100341796875, 0.009647369384765625, 0.013971328735351562, 0.0182952880859375, 0.022619247436523438, 0.026943206787109375, 0.03126716613769531, 0.03559112548828125, 0.03991508483886719, 0.044239044189453125, 0.04856300354003906, 0.052886962890625, 0.05721092224121094, 0.061534881591796875, 0.06585884094238281, 0.07018280029296875, 0.07450675964355469, 0.07883071899414062, 0.08315467834472656, 0.0874786376953125, 0.09180259704589844, 0.09612655639648438, 0.10045051574707031, 0.10477447509765625, 0.10909843444824219, 0.11342239379882812, 0.11774635314941406, 0.1220703125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 6.0, 4.0, 7.0, 9.0, 9.0, 14.0, 17.0, 8.0, 19.0, 22.0, 25.0, 25.0, 29.0, 22.0, 40.0, 36.0, 34.0, 53.0, 44.0, 39.0, 52.0, 49.0, 47.0, 43.0, 39.0, 32.0, 34.0, 32.0, 27.0, 32.0, 22.0, 25.0, 24.0, 15.0, 14.0, 9.0, 10.0, 9.0, 8.0, 8.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05560302734375, -0.0540013313293457, -0.052399635314941406, -0.05079793930053711, -0.04919624328613281, -0.047594547271728516, -0.04599285125732422, -0.04439115524291992, -0.042789459228515625, -0.04118776321411133, -0.03958606719970703, -0.037984371185302734, -0.03638267517089844, -0.03478097915649414, -0.033179283142089844, -0.03157758712768555, -0.02997589111328125, -0.028374195098876953, -0.026772499084472656, -0.02517080307006836, -0.023569107055664062, -0.021967411041259766, -0.02036571502685547, -0.018764019012451172, -0.017162322998046875, -0.015560626983642578, -0.013958930969238281, -0.012357234954833984, -0.010755538940429688, -0.00915384292602539, -0.007552146911621094, -0.005950450897216797, -0.0043487548828125, -0.002747058868408203, -0.0011453628540039062, 0.0004563331604003906, 0.0020580291748046875, 0.0036597251892089844, 0.005261421203613281, 0.006863117218017578, 0.008464813232421875, 0.010066509246826172, 0.011668205261230469, 0.013269901275634766, 0.014871597290039062, 0.01647329330444336, 0.018074989318847656, 0.019676685333251953, 0.02127838134765625, 0.022880077362060547, 0.024481773376464844, 0.02608346939086914, 0.027685165405273438, 0.029286861419677734, 0.03088855743408203, 0.03249025344848633, 0.034091949462890625, 0.03569364547729492, 0.03729534149169922, 0.038897037506103516, 0.04049873352050781, 0.04210042953491211, 0.043702125549316406, 0.0453038215637207, 0.046905517578125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 6.0, 14.0, 15.0, 27.0, 33.0, 49.0, 61.0, 79.0, 146.0, 192.0, 285.0, 475.0, 987.0, 2429.0, 9740.0, 76417.0, 708195.0, 218069.0, 23890.0, 4245.0, 1425.0, 674.0, 359.0, 245.0, 151.0, 102.0, 61.0, 53.0, 44.0, 24.0, 12.0, 15.0, 12.0, 13.0, 3.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52685546875, -0.5097122192382812, -0.4925689697265625, -0.47542572021484375, -0.458282470703125, -0.44113922119140625, -0.4239959716796875, -0.40685272216796875, -0.38970947265625, -0.37256622314453125, -0.3554229736328125, -0.33827972412109375, -0.321136474609375, -0.30399322509765625, -0.2868499755859375, -0.26970672607421875, -0.2525634765625, -0.23542022705078125, -0.2182769775390625, -0.20113372802734375, -0.183990478515625, -0.16684722900390625, -0.1497039794921875, -0.13256072998046875, -0.11541748046875, -0.09827423095703125, -0.0811309814453125, -0.06398773193359375, -0.046844482421875, -0.02970123291015625, -0.0125579833984375, 0.00458526611328125, 0.021728515625, 0.03887176513671875, 0.0560150146484375, 0.07315826416015625, 0.090301513671875, 0.10744476318359375, 0.1245880126953125, 0.14173126220703125, 0.15887451171875, 0.17601776123046875, 0.1931610107421875, 0.21030426025390625, 0.227447509765625, 0.24459075927734375, 0.2617340087890625, 0.27887725830078125, 0.2960205078125, 0.31316375732421875, 0.3303070068359375, 0.34745025634765625, 0.364593505859375, 0.38173675537109375, 0.3988800048828125, 0.41602325439453125, 0.43316650390625, 0.45030975341796875, 0.4674530029296875, 0.48459625244140625, 0.501739501953125, 0.5188827514648438, 0.5360260009765625, 0.5531692504882812, 0.5703125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 4.0, 8.0, 10.0, 9.0, 14.0, 17.0, 14.0, 14.0, 25.0, 19.0, 30.0, 33.0, 40.0, 41.0, 48.0, 35.0, 57.0, 45.0, 39.0, 45.0, 59.0, 52.0, 38.0, 40.0, 45.0, 37.0, 24.0, 20.0, 25.0, 25.0, 25.0, 10.0, 14.0, 5.0, 8.0, 2.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2822265625, -0.27355194091796875, -0.2648773193359375, -0.25620269775390625, -0.247528076171875, -0.23885345458984375, -0.2301788330078125, -0.22150421142578125, -0.21282958984375, -0.20415496826171875, -0.1954803466796875, -0.18680572509765625, -0.178131103515625, -0.16945648193359375, -0.1607818603515625, -0.15210723876953125, -0.1434326171875, -0.13475799560546875, -0.1260833740234375, -0.11740875244140625, -0.108734130859375, -0.10005950927734375, -0.0913848876953125, -0.08271026611328125, -0.07403564453125, -0.06536102294921875, -0.0566864013671875, -0.04801177978515625, -0.039337158203125, -0.03066253662109375, -0.0219879150390625, -0.01331329345703125, -0.004638671875, 0.00403594970703125, 0.0127105712890625, 0.02138519287109375, 0.030059814453125, 0.03873443603515625, 0.0474090576171875, 0.05608367919921875, 0.06475830078125, 0.07343292236328125, 0.0821075439453125, 0.09078216552734375, 0.099456787109375, 0.10813140869140625, 0.1168060302734375, 0.12548065185546875, 0.1341552734375, 0.14282989501953125, 0.1515045166015625, 0.16017913818359375, 0.168853759765625, 0.17752838134765625, 0.1862030029296875, 0.19487762451171875, 0.20355224609375, 0.21222686767578125, 0.2209014892578125, 0.22957611083984375, 0.238250732421875, 0.24692535400390625, 0.2555999755859375, 0.26427459716796875, 0.27294921875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 7.0, 18.0, 17.0, 27.0, 51.0, 92.0, 210.0, 565.0, 2295.0, 14587.0, 280624.0, 717363.0, 27875.0, 3448.0, 849.0, 272.0, 106.0, 58.0, 32.0, 20.0, 11.0, 12.0, 5.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26416015625, -0.2503509521484375, -0.236541748046875, -0.2227325439453125, -0.20892333984375, -0.1951141357421875, -0.181304931640625, -0.1674957275390625, -0.1536865234375, -0.1398773193359375, -0.126068115234375, -0.1122589111328125, -0.09844970703125, -0.0846405029296875, -0.070831298828125, -0.0570220947265625, -0.043212890625, -0.0294036865234375, -0.015594482421875, -0.0017852783203125, 0.01202392578125, 0.0258331298828125, 0.039642333984375, 0.0534515380859375, 0.0672607421875, 0.0810699462890625, 0.094879150390625, 0.1086883544921875, 0.12249755859375, 0.1363067626953125, 0.150115966796875, 0.1639251708984375, 0.177734375, 0.1915435791015625, 0.205352783203125, 0.2191619873046875, 0.23297119140625, 0.2467803955078125, 0.260589599609375, 0.2743988037109375, 0.2882080078125, 0.3020172119140625, 0.315826416015625, 0.3296356201171875, 0.34344482421875, 0.3572540283203125, 0.371063232421875, 0.3848724365234375, 0.398681640625, 0.4124908447265625, 0.426300048828125, 0.4401092529296875, 0.45391845703125, 0.4677276611328125, 0.481536865234375, 0.4953460693359375, 0.5091552734375, 0.5229644775390625, 0.536773681640625, 0.5505828857421875, 0.56439208984375, 0.5782012939453125, 0.592010498046875, 0.6058197021484375, 0.61962890625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 8.0, 2.0, 6.0, 6.0, 14.0, 18.0, 15.0, 24.0, 20.0, 23.0, 31.0, 42.0, 50.0, 86.0, 96.0, 80.0, 94.0, 78.0, 58.0, 46.0, 38.0, 32.0, 25.0, 27.0, 11.0, 15.0, 12.0, 11.0, 7.0, 3.0, 6.0, 3.0, 8.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.03010368347168e-05, -8.769892156124115e-05, -8.50968062877655e-05, -8.249469101428986e-05, -7.989257574081421e-05, -7.729046046733856e-05, -7.468834519386292e-05, -7.208622992038727e-05, -6.948411464691162e-05, -6.688199937343597e-05, -6.427988409996033e-05, -6.167776882648468e-05, -5.907565355300903e-05, -5.6473538279533386e-05, -5.387142300605774e-05, -5.126930773258209e-05, -4.8667192459106445e-05, -4.60650771856308e-05, -4.346296191215515e-05, -4.0860846638679504e-05, -3.825873136520386e-05, -3.565661609172821e-05, -3.3054500818252563e-05, -3.0452385544776917e-05, -2.785027027130127e-05, -2.5248154997825623e-05, -2.2646039724349976e-05, -2.004392445087433e-05, -1.744180917739868e-05, -1.4839693903923035e-05, -1.2237578630447388e-05, -9.63546335697174e-06, -7.033348083496094e-06, -4.431232810020447e-06, -1.8291175365447998e-06, 7.729977369308472e-07, 3.375113010406494e-06, 5.977228283882141e-06, 8.579343557357788e-06, 1.1181458830833435e-05, 1.3783574104309082e-05, 1.638568937778473e-05, 1.8987804651260376e-05, 2.1589919924736023e-05, 2.419203519821167e-05, 2.6794150471687317e-05, 2.9396265745162964e-05, 3.199838101863861e-05, 3.460049629211426e-05, 3.7202611565589905e-05, 3.980472683906555e-05, 4.24068421125412e-05, 4.5008957386016846e-05, 4.761107265949249e-05, 5.021318793296814e-05, 5.281530320644379e-05, 5.5417418479919434e-05, 5.801953375339508e-05, 6.062164902687073e-05, 6.322376430034637e-05, 6.582587957382202e-05, 6.842799484729767e-05, 7.103011012077332e-05, 7.363222539424896e-05, 7.623434066772461e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 8.0, 3.0, 6.0, 3.0, 6.0, 8.0, 13.0, 13.0, 12.0, 29.0, 28.0, 51.0, 59.0, 87.0, 147.0, 235.0, 362.0, 673.0, 1309.0, 2999.0, 8834.0, 37561.0, 264803.0, 615896.0, 90226.0, 16170.0, 4896.0, 1901.0, 897.0, 477.0, 294.0, 149.0, 108.0, 86.0, 49.0, 34.0, 32.0, 18.0, 24.0, 17.0, 5.0, 8.0, 8.0, 3.0, 2.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.23193359375, -0.22450828552246094, -0.21708297729492188, -0.2096576690673828, -0.20223236083984375, -0.1948070526123047, -0.18738174438476562, -0.17995643615722656, -0.1725311279296875, -0.16510581970214844, -0.15768051147460938, -0.1502552032470703, -0.14282989501953125, -0.1354045867919922, -0.12797927856445312, -0.12055397033691406, -0.113128662109375, -0.10570335388183594, -0.09827804565429688, -0.09085273742675781, -0.08342742919921875, -0.07600212097167969, -0.06857681274414062, -0.06115150451660156, -0.0537261962890625, -0.04630088806152344, -0.038875579833984375, -0.03145027160644531, -0.02402496337890625, -0.016599655151367188, -0.009174346923828125, -0.0017490386962890625, 0.00567626953125, 0.013101577758789062, 0.020526885986328125, 0.027952194213867188, 0.03537750244140625, 0.04280281066894531, 0.050228118896484375, 0.05765342712402344, 0.0650787353515625, 0.07250404357910156, 0.07992935180664062, 0.08735466003417969, 0.09477996826171875, 0.10220527648925781, 0.10963058471679688, 0.11705589294433594, 0.124481201171875, 0.13190650939941406, 0.13933181762695312, 0.1467571258544922, 0.15418243408203125, 0.1616077423095703, 0.16903305053710938, 0.17645835876464844, 0.1838836669921875, 0.19130897521972656, 0.19873428344726562, 0.2061595916748047, 0.21358489990234375, 0.2210102081298828, 0.22843551635742188, 0.23586082458496094, 0.2432861328125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 5.0, 12.0, 15.0, 11.0, 19.0, 30.0, 40.0, 58.0, 83.0, 98.0, 132.0, 152.0, 81.0, 79.0, 39.0, 33.0, 36.0, 21.0, 11.0, 15.0, 6.0, 0.0, 10.0, 2.0, 5.0, 0.0, 3.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1954345703125, -0.1887035369873047, -0.18197250366210938, -0.17524147033691406, -0.16851043701171875, -0.16177940368652344, -0.15504837036132812, -0.1483173370361328, -0.1415863037109375, -0.1348552703857422, -0.12812423706054688, -0.12139320373535156, -0.11466217041015625, -0.10793113708496094, -0.10120010375976562, -0.09446907043457031, -0.087738037109375, -0.08100700378417969, -0.07427597045898438, -0.06754493713378906, -0.06081390380859375, -0.05408287048339844, -0.047351837158203125, -0.04062080383300781, -0.0338897705078125, -0.027158737182617188, -0.020427703857421875, -0.013696670532226562, -0.00696563720703125, -0.0002346038818359375, 0.006496429443359375, 0.013227462768554688, 0.01995849609375, 0.026689529418945312, 0.033420562744140625, 0.04015159606933594, 0.04688262939453125, 0.05361366271972656, 0.060344696044921875, 0.06707572937011719, 0.0738067626953125, 0.08053779602050781, 0.08726882934570312, 0.09399986267089844, 0.10073089599609375, 0.10746192932128906, 0.11419296264648438, 0.12092399597167969, 0.127655029296875, 0.1343860626220703, 0.14111709594726562, 0.14784812927246094, 0.15457916259765625, 0.16131019592285156, 0.16804122924804688, 0.1747722625732422, 0.1815032958984375, 0.1882343292236328, 0.19496536254882812, 0.20169639587402344, 0.20842742919921875, 0.21515846252441406, 0.22188949584960938, 0.2286205291748047, 0.2353515625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 29.0, 61.0, 141.0, 211.0, 237.0, 175.0, 89.0, 36.0, 17.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.012458324432373, -2.864086151123047, -2.7157137393951416, -2.5673415660858154, -2.41896915435791, -2.270596981048584, -2.122224807739258, -1.973852515220642, -1.8254802227020264, -1.6771079301834106, -1.528735637664795, -1.3803634643554688, -1.231991171836853, -1.0836188793182373, -0.9352466464042664, -0.7868744134902954, -0.6385021209716797, -0.49012985825538635, -0.341757595539093, -0.19338533282279968, -0.04501307010650635, 0.10335922241210938, 0.2517314553260803, 0.40010368824005127, 0.548475980758667, 0.6968482732772827, 0.8452205061912537, 0.9935927391052246, 1.1419650316238403, 1.290337324142456, 1.4387094974517822, 1.587081789970398, 1.7354545593261719, 1.8838268518447876, 2.0321991443634033, 2.1805713176727295, 2.3289437294006348, 2.477315902709961, 2.625688076019287, 2.7740602493286133, 2.9224326610565186, 3.0708048343658447, 3.21917724609375, 3.367549419403076, 3.5159215927124023, 3.6642940044403076, 3.812666177749634, 3.961038589477539, 4.109410762786865, 4.257782936096191, 4.406155109405518, 4.554527759552002, 4.702899932861328, 4.851272106170654, 4.9996442794799805, 5.148016452789307, 5.296388626098633, 5.444760799407959, 5.593132972717285, 5.7415056228637695, 5.889877796173096, 6.038249969482422, 6.186622142791748, 6.334994316101074, 6.483366966247559]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 9.0, 8.0, 10.0, 10.0, 12.0, 14.0, 10.0, 13.0, 20.0, 23.0, 22.0, 32.0, 28.0, 41.0, 35.0, 49.0, 48.0, 35.0, 48.0, 52.0, 35.0, 46.0, 28.0, 37.0, 32.0, 39.0, 36.0, 32.0, 28.0, 28.0, 21.0, 15.0, 19.0, 13.0, 18.0, 13.0, 8.0, 8.0, 2.0, 7.0, 5.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.4552820920944214, -1.4109429121017456, -1.3666038513183594, -1.3222646713256836, -1.2779256105422974, -1.2335864305496216, -1.1892473697662354, -1.1449081897735596, -1.1005690097808838, -1.056229829788208, -1.0118907690048218, -0.967551589012146, -0.9232125282287598, -0.878873348236084, -0.834534227848053, -0.790195107460022, -0.7458560466766357, -0.7015169262886047, -0.6571778059005737, -0.612838625907898, -0.5684995651245117, -0.5241603851318359, -0.47982126474380493, -0.4354821443557739, -0.3911430239677429, -0.3468039035797119, -0.3024647831916809, -0.2581256330013275, -0.2137865126132965, -0.1694473922252655, -0.1251082420349121, -0.0807691216468811, -0.03642988204956055, 0.007909245789051056, 0.05224837362766266, 0.09658750891685486, 0.14092662930488586, 0.18526574969291687, 0.22960489988327026, 0.27394402027130127, 0.3182831406593323, 0.3626222610473633, 0.4069613814353943, 0.4513005316257477, 0.4956396520137787, 0.5399787425994873, 0.5843179225921631, 0.6286570429801941, 0.6729961633682251, 0.7173352837562561, 0.7616744041442871, 0.8060135841369629, 0.8503526449203491, 0.8946918249130249, 0.9390309453010559, 0.9833700656890869, 1.0277092456817627, 1.0720484256744385, 1.1163874864578247, 1.1607266664505005, 1.2050657272338867, 1.2494049072265625, 1.2937440872192383, 1.3380831480026245, 1.3824222087860107]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 1.0, 6.0, 7.0, 6.0, 24.0, 19.0, 29.0, 43.0, 39.0, 75.0, 149.0, 180.0, 293.0, 451.0, 654.0, 1090.0, 1627.0, 2784.0, 4674.0, 8621.0, 16466.0, 35014.0, 87426.0, 312157.0, 2999522.0, 520149.0, 115036.0, 43688.0, 20013.0, 10214.0, 5466.0, 3216.0, 1898.0, 1148.0, 734.0, 427.0, 302.0, 210.0, 152.0, 81.0, 65.0, 33.0, 36.0, 25.0, 12.0, 9.0, 10.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.222900390625, -0.21607017517089844, -0.20923995971679688, -0.2024097442626953, -0.19557952880859375, -0.1887493133544922, -0.18191909790039062, -0.17508888244628906, -0.1682586669921875, -0.16142845153808594, -0.15459823608398438, -0.1477680206298828, -0.14093780517578125, -0.1341075897216797, -0.12727737426757812, -0.12044715881347656, -0.113616943359375, -0.10678672790527344, -0.09995651245117188, -0.09312629699707031, -0.08629608154296875, -0.07946586608886719, -0.07263565063476562, -0.06580543518066406, -0.0589752197265625, -0.05214500427246094, -0.045314788818359375, -0.03848457336425781, -0.03165435791015625, -0.024824142456054688, -0.017993927001953125, -0.011163711547851562, -0.00433349609375, 0.0024967193603515625, 0.009326934814453125, 0.016157150268554688, 0.02298736572265625, 0.029817581176757812, 0.036647796630859375, 0.04347801208496094, 0.0503082275390625, 0.05713844299316406, 0.06396865844726562, 0.07079887390136719, 0.07762908935546875, 0.08445930480957031, 0.09128952026367188, 0.09811973571777344, 0.104949951171875, 0.11178016662597656, 0.11861038208007812, 0.1254405975341797, 0.13227081298828125, 0.1391010284423828, 0.14593124389648438, 0.15276145935058594, 0.1595916748046875, 0.16642189025878906, 0.17325210571289062, 0.1800823211669922, 0.18691253662109375, 0.1937427520751953, 0.20057296752929688, 0.20740318298339844, 0.2142333984375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 9.0, 7.0, 2.0, 5.0, 7.0, 8.0, 13.0, 13.0, 11.0, 13.0, 16.0, 22.0, 19.0, 32.0, 25.0, 29.0, 35.0, 34.0, 22.0, 41.0, 56.0, 36.0, 41.0, 37.0, 35.0, 38.0, 46.0, 37.0, 38.0, 34.0, 33.0, 25.0, 29.0, 24.0, 19.0, 19.0, 15.0, 18.0, 12.0, 7.0, 7.0, 8.0, 10.0, 6.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.05242919921875, -0.05089378356933594, -0.049358367919921875, -0.04782295227050781, -0.04628753662109375, -0.04475212097167969, -0.043216705322265625, -0.04168128967285156, -0.0401458740234375, -0.03861045837402344, -0.037075042724609375, -0.03553962707519531, -0.03400421142578125, -0.03246879577636719, -0.030933380126953125, -0.029397964477539062, -0.027862548828125, -0.026327133178710938, -0.024791717529296875, -0.023256301879882812, -0.02172088623046875, -0.020185470581054688, -0.018650054931640625, -0.017114639282226562, -0.0155792236328125, -0.014043807983398438, -0.012508392333984375, -0.010972976684570312, -0.00943756103515625, -0.007902145385742188, -0.006366729736328125, -0.0048313140869140625, -0.0032958984375, -0.0017604827880859375, -0.000225067138671875, 0.0013103485107421875, 0.00284576416015625, 0.0043811798095703125, 0.005916595458984375, 0.0074520111083984375, 0.0089874267578125, 0.010522842407226562, 0.012058258056640625, 0.013593673706054688, 0.01512908935546875, 0.016664505004882812, 0.018199920654296875, 0.019735336303710938, 0.021270751953125, 0.022806167602539062, 0.024341583251953125, 0.025876998901367188, 0.02741241455078125, 0.028947830200195312, 0.030483245849609375, 0.03201866149902344, 0.0335540771484375, 0.03508949279785156, 0.036624908447265625, 0.03816032409667969, 0.03969573974609375, 0.04123115539550781, 0.042766571044921875, 0.04430198669433594, 0.04583740234375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 4.0, 7.0, 12.0, 12.0, 11.0, 24.0, 24.0, 49.0, 37.0, 67.0, 113.0, 180.0, 333.0, 754.0, 2252.0, 9633.0, 62177.0, 2254977.0, 1790887.0, 59570.0, 9315.0, 2210.0, 745.0, 323.0, 192.0, 104.0, 75.0, 58.0, 39.0, 22.0, 25.0, 15.0, 6.0, 8.0, 7.0, 6.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.8056640625, -0.7826385498046875, -0.759613037109375, -0.7365875244140625, -0.71356201171875, -0.6905364990234375, -0.667510986328125, -0.6444854736328125, -0.6214599609375, -0.5984344482421875, -0.575408935546875, -0.5523834228515625, -0.52935791015625, -0.5063323974609375, -0.483306884765625, -0.4602813720703125, -0.437255859375, -0.4142303466796875, -0.391204833984375, -0.3681793212890625, -0.34515380859375, -0.3221282958984375, -0.299102783203125, -0.2760772705078125, -0.2530517578125, -0.2300262451171875, -0.207000732421875, -0.1839752197265625, -0.16094970703125, -0.1379241943359375, -0.114898681640625, -0.0918731689453125, -0.06884765625, -0.0458221435546875, -0.022796630859375, 0.0002288818359375, 0.02325439453125, 0.0462799072265625, 0.069305419921875, 0.0923309326171875, 0.1153564453125, 0.1383819580078125, 0.161407470703125, 0.1844329833984375, 0.20745849609375, 0.2304840087890625, 0.253509521484375, 0.2765350341796875, 0.299560546875, 0.3225860595703125, 0.345611572265625, 0.3686370849609375, 0.39166259765625, 0.4146881103515625, 0.437713623046875, 0.4607391357421875, 0.4837646484375, 0.5067901611328125, 0.529815673828125, 0.5528411865234375, 0.57586669921875, 0.5988922119140625, 0.621917724609375, 0.6449432373046875, 0.66796875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 2.0, 14.0, 26.0, 35.0, 72.0, 153.0, 285.0, 1118.0, 1689.0, 356.0, 127.0, 96.0, 40.0, 26.0, 17.0, 12.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43798828125, -0.426483154296875, -0.41497802734375, -0.403472900390625, -0.3919677734375, -0.380462646484375, -0.36895751953125, -0.357452392578125, -0.345947265625, -0.334442138671875, -0.32293701171875, -0.311431884765625, -0.2999267578125, -0.288421630859375, -0.27691650390625, -0.265411376953125, -0.25390625, -0.242401123046875, -0.23089599609375, -0.219390869140625, -0.2078857421875, -0.196380615234375, -0.18487548828125, -0.173370361328125, -0.161865234375, -0.150360107421875, -0.13885498046875, -0.127349853515625, -0.1158447265625, -0.104339599609375, -0.09283447265625, -0.081329345703125, -0.06982421875, -0.058319091796875, -0.04681396484375, -0.035308837890625, -0.0238037109375, -0.012298583984375, -0.00079345703125, 0.010711669921875, 0.022216796875, 0.033721923828125, 0.04522705078125, 0.056732177734375, 0.0682373046875, 0.079742431640625, 0.09124755859375, 0.102752685546875, 0.1142578125, 0.125762939453125, 0.13726806640625, 0.148773193359375, 0.1602783203125, 0.171783447265625, 0.18328857421875, 0.194793701171875, 0.206298828125, 0.217803955078125, 0.22930908203125, 0.240814208984375, 0.2523193359375, 0.263824462890625, 0.27532958984375, 0.286834716796875, 0.29833984375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 11.0, 19.0, 47.0, 79.0, 128.0, 206.0, 187.0, 149.0, 99.0, 36.0, 22.0, 16.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.169520854949951, -2.097560167312622, -2.025599241256714, -1.9536384344100952, -1.8816776275634766, -1.8097169399261475, -1.7377561330795288, -1.6657953262329102, -1.5938345193862915, -1.5218737125396729, -1.4499129056930542, -1.3779520988464355, -1.3059914112091064, -1.2340304851531982, -1.1620697975158691, -1.0901089906692505, -1.0181481838226318, -0.9461873769760132, -0.8742265701293945, -0.8022658228874207, -0.730305016040802, -0.6583442091941833, -0.5863834619522095, -0.5144226551055908, -0.44246184825897217, -0.3705010414123535, -0.29854026436805725, -0.2265794724225998, -0.15461868047714233, -0.08265787363052368, -0.010697096586227417, 0.06126368045806885, 0.1332244873046875, 0.20518527925014496, 0.2771460711956024, 0.3491068482398987, 0.42106765508651733, 0.493028461933136, 0.5649892091751099, 0.6369500160217285, 0.7089108228683472, 0.7808716297149658, 0.8528324365615845, 0.9247931838035583, 0.996753990650177, 1.0687148571014404, 1.1406755447387695, 1.2126363515853882, 1.2845971584320068, 1.3565579652786255, 1.4285187721252441, 1.5004795789718628, 1.5724403858184814, 1.6444010734558105, 1.7163618803024292, 1.7883226871490479, 1.8602834939956665, 1.9322443008422852, 2.0042049884796143, 2.0761659145355225, 2.1481266021728516, 2.2200875282287598, 2.292048215866089, 2.364008903503418, 2.435969829559326]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 6.0, 4.0, 2.0, 4.0, 13.0, 10.0, 18.0, 10.0, 18.0, 23.0, 30.0, 26.0, 34.0, 31.0, 31.0, 46.0, 55.0, 59.0, 47.0, 49.0, 43.0, 60.0, 57.0, 57.0, 49.0, 38.0, 37.0, 32.0, 31.0, 15.0, 20.0, 14.0, 11.0, 9.0, 9.0, 4.0, 5.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8771454691886902, -0.8493988513946533, -0.8216522336006165, -0.7939056158065796, -0.7661590576171875, -0.7384123802185059, -0.7106658220291138, -0.6829192042350769, -0.65517258644104, -0.6274259686470032, -0.5996793508529663, -0.5719327330589294, -0.5441861152648926, -0.5164395570755005, -0.4886929392814636, -0.46094632148742676, -0.4331997036933899, -0.405453085899353, -0.37770646810531616, -0.3499598801136017, -0.3222132623195648, -0.29446664452552795, -0.2667200565338135, -0.2389734387397766, -0.21122682094573975, -0.18348020315170288, -0.1557336002588272, -0.12798699736595154, -0.10024037957191467, -0.07249376177787781, -0.044747158885002136, -0.017000555992126465, 0.010746002197265625, 0.03849261254072189, 0.06623922288417816, 0.09398583322763443, 0.1217324435710907, 0.14947906136512756, 0.17722566425800323, 0.2049722671508789, 0.23271888494491577, 0.26046550273895264, 0.2882121205329895, 0.315958708524704, 0.34370532631874084, 0.3714519441127777, 0.3991985321044922, 0.42694514989852905, 0.4546917676925659, 0.4824383854866028, 0.5101850032806396, 0.5379316210746765, 0.5656782388687134, 0.5934247970581055, 0.6211714148521423, 0.6489180326461792, 0.6766646504402161, 0.7044112682342529, 0.7321578860282898, 0.7599045038223267, 0.7876510620117188, 0.8153977394104004, 0.8431442975997925, 0.8708909153938293, 0.8986375331878662]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 18.0, 15.0, 19.0, 41.0, 48.0, 72.0, 96.0, 151.0, 241.0, 345.0, 511.0, 775.0, 1200.0, 1916.0, 2824.0, 4579.0, 7602.0, 12536.0, 21236.0, 36711.0, 62860.0, 104247.0, 158814.0, 194483.0, 164645.0, 109371.0, 66442.0, 39239.0, 22626.0, 13306.0, 8036.0, 4856.0, 2977.0, 2022.0, 1171.0, 867.0, 553.0, 383.0, 241.0, 149.0, 108.0, 63.0, 49.0, 32.0, 21.0, 20.0, 12.0, 11.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.150146484375, -0.14553451538085938, -0.14092254638671875, -0.13631057739257812, -0.1316986083984375, -0.12708663940429688, -0.12247467041015625, -0.11786270141601562, -0.113250732421875, -0.10863876342773438, -0.10402679443359375, -0.09941482543945312, -0.0948028564453125, -0.09019088745117188, -0.08557891845703125, -0.08096694946289062, -0.07635498046875, -0.07174301147460938, -0.06713104248046875, -0.06251907348632812, -0.0579071044921875, -0.053295135498046875, -0.04868316650390625, -0.044071197509765625, -0.039459228515625, -0.034847259521484375, -0.03023529052734375, -0.025623321533203125, -0.0210113525390625, -0.016399383544921875, -0.01178741455078125, -0.007175445556640625, -0.0025634765625, 0.002048492431640625, 0.00666046142578125, 0.011272430419921875, 0.0158843994140625, 0.020496368408203125, 0.02510833740234375, 0.029720306396484375, 0.034332275390625, 0.038944244384765625, 0.04355621337890625, 0.048168182373046875, 0.0527801513671875, 0.057392120361328125, 0.06200408935546875, 0.06661605834960938, 0.07122802734375, 0.07583999633789062, 0.08045196533203125, 0.08506393432617188, 0.0896759033203125, 0.09428787231445312, 0.09889984130859375, 0.10351181030273438, 0.108123779296875, 0.11273574829101562, 0.11734771728515625, 0.12195968627929688, 0.1265716552734375, 0.13118362426757812, 0.13579559326171875, 0.14040756225585938, 0.14501953125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 3.0, 8.0, 3.0, 4.0, 3.0, 5.0, 8.0, 8.0, 11.0, 14.0, 10.0, 14.0, 18.0, 25.0, 30.0, 28.0, 29.0, 29.0, 29.0, 31.0, 39.0, 35.0, 37.0, 54.0, 52.0, 47.0, 41.0, 44.0, 43.0, 42.0, 34.0, 32.0, 19.0, 24.0, 25.0, 12.0, 20.0, 13.0, 13.0, 14.0, 15.0, 8.0, 15.0, 5.0, 6.0, 5.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.057830810546875, -0.05599164962768555, -0.054152488708496094, -0.05231332778930664, -0.05047416687011719, -0.048635005950927734, -0.04679584503173828, -0.04495668411254883, -0.043117523193359375, -0.04127836227416992, -0.03943920135498047, -0.037600040435791016, -0.03576087951660156, -0.03392171859741211, -0.032082557678222656, -0.030243396759033203, -0.02840423583984375, -0.026565074920654297, -0.024725914001464844, -0.02288675308227539, -0.021047592163085938, -0.019208431243896484, -0.01736927032470703, -0.015530109405517578, -0.013690948486328125, -0.011851787567138672, -0.010012626647949219, -0.008173465728759766, -0.0063343048095703125, -0.004495143890380859, -0.0026559829711914062, -0.0008168220520019531, 0.0010223388671875, 0.002861499786376953, 0.004700660705566406, 0.006539821624755859, 0.008378982543945312, 0.010218143463134766, 0.012057304382324219, 0.013896465301513672, 0.015735626220703125, 0.017574787139892578, 0.01941394805908203, 0.021253108978271484, 0.023092269897460938, 0.02493143081665039, 0.026770591735839844, 0.028609752655029297, 0.03044891357421875, 0.0322880744934082, 0.034127235412597656, 0.03596639633178711, 0.03780555725097656, 0.039644718170166016, 0.04148387908935547, 0.04332304000854492, 0.045162200927734375, 0.04700136184692383, 0.04884052276611328, 0.050679683685302734, 0.05251884460449219, 0.05435800552368164, 0.056197166442871094, 0.05803632736206055, 0.05987548828125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 12.0, 11.0, 12.0, 19.0, 15.0, 26.0, 31.0, 34.0, 59.0, 66.0, 112.0, 143.0, 196.0, 290.0, 460.0, 763.0, 1430.0, 3039.0, 7999.0, 30109.0, 155318.0, 563977.0, 224152.0, 42153.0, 10402.0, 3591.0, 1568.0, 887.0, 498.0, 360.0, 219.0, 174.0, 146.0, 67.0, 59.0, 42.0, 40.0, 30.0, 15.0, 12.0, 8.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.419921875, -0.405242919921875, -0.39056396484375, -0.375885009765625, -0.3612060546875, -0.346527099609375, -0.33184814453125, -0.317169189453125, -0.302490234375, -0.287811279296875, -0.27313232421875, -0.258453369140625, -0.2437744140625, -0.229095458984375, -0.21441650390625, -0.199737548828125, -0.18505859375, -0.170379638671875, -0.15570068359375, -0.141021728515625, -0.1263427734375, -0.111663818359375, -0.09698486328125, -0.082305908203125, -0.067626953125, -0.052947998046875, -0.03826904296875, -0.023590087890625, -0.0089111328125, 0.005767822265625, 0.02044677734375, 0.035125732421875, 0.0498046875, 0.064483642578125, 0.07916259765625, 0.093841552734375, 0.1085205078125, 0.123199462890625, 0.13787841796875, 0.152557373046875, 0.167236328125, 0.181915283203125, 0.19659423828125, 0.211273193359375, 0.2259521484375, 0.240631103515625, 0.25531005859375, 0.269989013671875, 0.28466796875, 0.299346923828125, 0.31402587890625, 0.328704833984375, 0.3433837890625, 0.358062744140625, 0.37274169921875, 0.387420654296875, 0.402099609375, 0.416778564453125, 0.43145751953125, 0.446136474609375, 0.4608154296875, 0.475494384765625, 0.49017333984375, 0.504852294921875, 0.51953125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [5.0, 3.0, 2.0, 5.0, 3.0, 2.0, 4.0, 6.0, 4.0, 7.0, 8.0, 14.0, 6.0, 2.0, 9.0, 16.0, 18.0, 18.0, 24.0, 18.0, 24.0, 43.0, 37.0, 41.0, 37.0, 32.0, 32.0, 40.0, 50.0, 37.0, 41.0, 37.0, 47.0, 33.0, 42.0, 30.0, 32.0, 23.0, 22.0, 27.0, 21.0, 20.0, 14.0, 11.0, 14.0, 11.0, 10.0, 10.0, 7.0, 2.0, 4.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.290771484375, -0.2807655334472656, -0.27075958251953125, -0.2607536315917969, -0.2507476806640625, -0.24074172973632812, -0.23073577880859375, -0.22072982788085938, -0.210723876953125, -0.20071792602539062, -0.19071197509765625, -0.18070602416992188, -0.1707000732421875, -0.16069412231445312, -0.15068817138671875, -0.14068222045898438, -0.13067626953125, -0.12067031860351562, -0.11066436767578125, -0.10065841674804688, -0.0906524658203125, -0.08064651489257812, -0.07064056396484375, -0.060634613037109375, -0.050628662109375, -0.040622711181640625, -0.03061676025390625, -0.020610809326171875, -0.0106048583984375, -0.000598907470703125, 0.00940704345703125, 0.019412994384765625, 0.0294189453125, 0.039424896240234375, 0.04943084716796875, 0.059436798095703125, 0.0694427490234375, 0.07944869995117188, 0.08945465087890625, 0.09946060180664062, 0.109466552734375, 0.11947250366210938, 0.12947845458984375, 0.13948440551757812, 0.1494903564453125, 0.15949630737304688, 0.16950225830078125, 0.17950820922851562, 0.18951416015625, 0.19952011108398438, 0.20952606201171875, 0.21953201293945312, 0.2295379638671875, 0.23954391479492188, 0.24954986572265625, 0.2595558166503906, 0.269561767578125, 0.2795677185058594, 0.28957366943359375, 0.2995796203613281, 0.3095855712890625, 0.3195915222167969, 0.32959747314453125, 0.3396034240722656, 0.349609375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 6.0, 5.0, 8.0, 9.0, 16.0, 18.0, 32.0, 30.0, 43.0, 46.0, 86.0, 137.0, 234.0, 457.0, 889.0, 2204.0, 5913.0, 25029.0, 331964.0, 626484.0, 41475.0, 8249.0, 2832.0, 1129.0, 520.0, 276.0, 154.0, 92.0, 59.0, 41.0, 27.0, 28.0, 15.0, 15.0, 12.0, 6.0, 6.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43896484375, -0.42278289794921875, -0.4066009521484375, -0.39041900634765625, -0.374237060546875, -0.35805511474609375, -0.3418731689453125, -0.32569122314453125, -0.30950927734375, -0.29332733154296875, -0.2771453857421875, -0.26096343994140625, -0.244781494140625, -0.22859954833984375, -0.2124176025390625, -0.19623565673828125, -0.1800537109375, -0.16387176513671875, -0.1476898193359375, -0.13150787353515625, -0.115325927734375, -0.09914398193359375, -0.0829620361328125, -0.06678009033203125, -0.05059814453125, -0.03441619873046875, -0.0182342529296875, -0.00205230712890625, 0.014129638671875, 0.03031158447265625, 0.0464935302734375, 0.06267547607421875, 0.078857421875, 0.09503936767578125, 0.1112213134765625, 0.12740325927734375, 0.143585205078125, 0.15976715087890625, 0.1759490966796875, 0.19213104248046875, 0.20831298828125, 0.22449493408203125, 0.2406768798828125, 0.25685882568359375, 0.273040771484375, 0.28922271728515625, 0.3054046630859375, 0.32158660888671875, 0.3377685546875, 0.35395050048828125, 0.3701324462890625, 0.38631439208984375, 0.402496337890625, 0.41867828369140625, 0.4348602294921875, 0.45104217529296875, 0.46722412109375, 0.48340606689453125, 0.4995880126953125, 0.5157699584960938, 0.531951904296875, 0.5481338500976562, 0.5643157958984375, 0.5804977416992188, 0.5966796875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 0.0, 3.0, 4.0, 13.0, 18.0, 14.0, 18.0, 22.0, 39.0, 45.0, 61.0, 96.0, 98.0, 119.0, 100.0, 86.0, 59.0, 65.0, 36.0, 22.0, 22.0, 14.0, 17.0, 17.0, 9.0, 0.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001277923583984375, -0.0001238640397787094, -0.00011993572115898132, -0.00011600740253925323, -0.00011207908391952515, -0.00010815076529979706, -0.00010422244668006897, -0.00010029412806034088, -9.636580944061279e-05, -9.24374908208847e-05, -8.850917220115662e-05, -8.458085358142853e-05, -8.065253496170044e-05, -7.672421634197235e-05, -7.279589772224426e-05, -6.886757910251617e-05, -6.493926048278809e-05, -6.101094186306e-05, -5.708262324333191e-05, -5.315430462360382e-05, -4.922598600387573e-05, -4.5297667384147644e-05, -4.1369348764419556e-05, -3.744103014469147e-05, -3.351271152496338e-05, -2.958439290523529e-05, -2.5656074285507202e-05, -2.1727755665779114e-05, -1.7799437046051025e-05, -1.3871118426322937e-05, -9.942799806594849e-06, -6.01448118686676e-06, -2.086162567138672e-06, 1.8421560525894165e-06, 5.770474672317505e-06, 9.698793292045593e-06, 1.3627111911773682e-05, 1.755543053150177e-05, 2.148374915122986e-05, 2.5412067770957947e-05, 2.9340386390686035e-05, 3.3268705010414124e-05, 3.719702363014221e-05, 4.11253422498703e-05, 4.505366086959839e-05, 4.898197948932648e-05, 5.2910298109054565e-05, 5.6838616728782654e-05, 6.076693534851074e-05, 6.469525396823883e-05, 6.862357258796692e-05, 7.255189120769501e-05, 7.64802098274231e-05, 8.040852844715118e-05, 8.433684706687927e-05, 8.826516568660736e-05, 9.219348430633545e-05, 9.612180292606354e-05, 0.00010005012154579163, 0.00010397844016551971, 0.0001079067587852478, 0.00011183507740497589, 0.00011576339602470398, 0.00011969171464443207, 0.00012362003326416016]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 5.0, 5.0, 3.0, 12.0, 8.0, 17.0, 16.0, 18.0, 40.0, 66.0, 105.0, 188.0, 320.0, 567.0, 1247.0, 2979.0, 9152.0, 46240.0, 692919.0, 262685.0, 22188.0, 5678.0, 2147.0, 870.0, 451.0, 258.0, 111.0, 73.0, 52.0, 39.0, 22.0, 17.0, 10.0, 9.0, 10.0, 3.0, 13.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.451904296875, -0.4350471496582031, -0.41819000244140625, -0.4013328552246094, -0.3844757080078125, -0.3676185607910156, -0.35076141357421875, -0.3339042663574219, -0.317047119140625, -0.3001899719238281, -0.28333282470703125, -0.2664756774902344, -0.2496185302734375, -0.23276138305664062, -0.21590423583984375, -0.19904708862304688, -0.18218994140625, -0.16533279418945312, -0.14847564697265625, -0.13161849975585938, -0.1147613525390625, -0.09790420532226562, -0.08104705810546875, -0.06418991088867188, -0.047332763671875, -0.030475616455078125, -0.01361846923828125, 0.003238677978515625, 0.0200958251953125, 0.036952972412109375, 0.05381011962890625, 0.07066726684570312, 0.0875244140625, 0.10438156127929688, 0.12123870849609375, 0.13809585571289062, 0.1549530029296875, 0.17181015014648438, 0.18866729736328125, 0.20552444458007812, 0.222381591796875, 0.23923873901367188, 0.25609588623046875, 0.2729530334472656, 0.2898101806640625, 0.3066673278808594, 0.32352447509765625, 0.3403816223144531, 0.35723876953125, 0.3740959167480469, 0.39095306396484375, 0.4078102111816406, 0.4246673583984375, 0.4415245056152344, 0.45838165283203125, 0.4752388000488281, 0.492095947265625, 0.5089530944824219, 0.5258102416992188, 0.5426673889160156, 0.5595245361328125, 0.5763816833496094, 0.5932388305664062, 0.6100959777832031, 0.626953125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 11.0, 8.0, 15.0, 21.0, 29.0, 48.0, 81.0, 121.0, 188.0, 171.0, 107.0, 58.0, 44.0, 31.0, 19.0, 8.0, 4.0, 9.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3486328125, -0.33455657958984375, -0.3204803466796875, -0.30640411376953125, -0.292327880859375, -0.27825164794921875, -0.2641754150390625, -0.25009918212890625, -0.23602294921875, -0.22194671630859375, -0.2078704833984375, -0.19379425048828125, -0.179718017578125, -0.16564178466796875, -0.1515655517578125, -0.13748931884765625, -0.1234130859375, -0.10933685302734375, -0.0952606201171875, -0.08118438720703125, -0.067108154296875, -0.05303192138671875, -0.0389556884765625, -0.02487945556640625, -0.01080322265625, 0.00327301025390625, 0.0173492431640625, 0.03142547607421875, 0.045501708984375, 0.05957794189453125, 0.0736541748046875, 0.08773040771484375, 0.101806640625, 0.11588287353515625, 0.1299591064453125, 0.14403533935546875, 0.158111572265625, 0.17218780517578125, 0.1862640380859375, 0.20034027099609375, 0.21441650390625, 0.22849273681640625, 0.2425689697265625, 0.25664520263671875, 0.270721435546875, 0.28479766845703125, 0.2988739013671875, 0.31295013427734375, 0.3270263671875, 0.34110260009765625, 0.3551788330078125, 0.36925506591796875, 0.383331298828125, 0.39740753173828125, 0.4114837646484375, 0.42555999755859375, 0.43963623046875, 0.45371246337890625, 0.4677886962890625, 0.48186492919921875, 0.495941162109375, 0.5100173950195312, 0.5240936279296875, 0.5381698608398438, 0.55224609375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 7.0, 28.0, 81.0, 199.0, 284.0, 241.0, 103.0, 45.0, 12.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.073443412780762, -5.803980827331543, -5.534518241882324, -5.265056133270264, -4.995593547821045, -4.726130962371826, -4.456668853759766, -4.187206268310547, -3.917743682861328, -3.6482810974121094, -3.3788187503814697, -3.10935640335083, -2.8398938179016113, -2.5704312324523926, -2.300968885421753, -2.0315065383911133, -1.7620439529418945, -1.4925814867019653, -1.2231190204620361, -0.9536565542221069, -0.6841940879821777, -0.41473162174224854, -0.14526915550231934, 0.12419331073760986, 0.39365577697753906, 0.6631182432174683, 0.9325807094573975, 1.2020431756973267, 1.4715056419372559, 1.740968108177185, 2.0104305744171143, 2.279892921447754, 2.5493555068969727, 2.8188180923461914, 3.088280439376831, 3.3577427864074707, 3.6272053718566895, 3.896667957305908, 4.166130065917969, 4.4355926513671875, 4.705055236816406, 4.974517822265625, 5.243980407714844, 5.513442516326904, 5.782905101776123, 6.052367687225342, 6.321829795837402, 6.591292381286621, 6.86075496673584, 7.130217552185059, 7.399680137634277, 7.669142246246338, 7.938604831695557, 8.208066940307617, 8.477529525756836, 8.746992111206055, 9.016454696655273, 9.285917282104492, 9.555379867553711, 9.82484245300293, 10.094305038452148, 10.36376667022705, 10.63322925567627, 10.902691841125488, 11.172154426574707]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 4.0, 6.0, 11.0, 11.0, 5.0, 11.0, 17.0, 18.0, 16.0, 21.0, 20.0, 22.0, 26.0, 31.0, 42.0, 35.0, 42.0, 32.0, 32.0, 40.0, 43.0, 51.0, 38.0, 45.0, 33.0, 30.0, 42.0, 37.0, 20.0, 39.0, 27.0, 19.0, 20.0, 18.0, 11.0, 11.0, 10.0, 12.0, 10.0, 11.0, 8.0, 4.0, 7.0, 6.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-1.894853115081787, -1.8376237154006958, -1.780394196510315, -1.7231647968292236, -1.6659353971481323, -1.608705997467041, -1.5514764785766602, -1.4942470788955688, -1.4370176792144775, -1.3797882795333862, -1.3225587606430054, -1.265329360961914, -1.2080999612808228, -1.1508705615997314, -1.0936410427093506, -1.0364116430282593, -0.9791821241378784, -0.9219526648521423, -0.864723265171051, -0.8074938058853149, -0.7502644062042236, -0.6930349469184875, -0.6358054876327515, -0.5785760879516602, -0.5213466286659241, -0.4641171991825104, -0.4068877696990967, -0.3496583104133606, -0.2924288809299469, -0.2351994514465332, -0.17796999216079712, -0.12074056267738342, -0.06351113319396973, -0.006281696259975433, 0.05094774067401886, 0.10817718505859375, 0.16540661454200745, 0.22263604402542114, 0.2798655033111572, 0.3370949327945709, 0.3943243622779846, 0.4515537917613983, 0.508783221244812, 0.5660126805305481, 0.6232421398162842, 0.6804715394973755, 0.7377009987831116, 0.7949304580688477, 0.852159857749939, 0.909389317035675, 0.9666187167167664, 1.0238481760025024, 1.0810775756835938, 1.1383070945739746, 1.195536494255066, 1.2527658939361572, 1.309995412826538, 1.3672248125076294, 1.4244543313980103, 1.4816837310791016, 1.5389131307601929, 1.5961425304412842, 1.653372049331665, 1.7106014490127563, 1.7678308486938477]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 5.0, 4.0, 6.0, 10.0, 15.0, 28.0, 28.0, 59.0, 77.0, 98.0, 133.0, 206.0, 358.0, 571.0, 1099.0, 2436.0, 5815.0, 22564.0, 3668344.0, 463347.0, 19086.0, 5225.0, 2162.0, 1064.0, 529.0, 339.0, 195.0, 156.0, 99.0, 70.0, 45.0, 38.0, 27.0, 14.0, 9.0, 8.0, 7.0, 3.0, 4.0, 3.0, 0.0, 1.0, 4.0], "bins": [-0.92236328125, -0.8992767333984375, -0.876190185546875, -0.8531036376953125, -0.83001708984375, -0.8069305419921875, -0.783843994140625, -0.7607574462890625, -0.7376708984375, -0.7145843505859375, -0.691497802734375, -0.6684112548828125, -0.64532470703125, -0.6222381591796875, -0.599151611328125, -0.5760650634765625, -0.552978515625, -0.5298919677734375, -0.506805419921875, -0.4837188720703125, -0.46063232421875, -0.4375457763671875, -0.414459228515625, -0.3913726806640625, -0.3682861328125, -0.3451995849609375, -0.322113037109375, -0.2990264892578125, -0.27593994140625, -0.2528533935546875, -0.229766845703125, -0.2066802978515625, -0.18359375, -0.1605072021484375, -0.137420654296875, -0.1143341064453125, -0.09124755859375, -0.0681610107421875, -0.045074462890625, -0.0219879150390625, 0.0010986328125, 0.0241851806640625, 0.047271728515625, 0.0703582763671875, 0.09344482421875, 0.1165313720703125, 0.139617919921875, 0.1627044677734375, 0.185791015625, 0.2088775634765625, 0.231964111328125, 0.2550506591796875, 0.27813720703125, 0.3012237548828125, 0.324310302734375, 0.3473968505859375, 0.3704833984375, 0.3935699462890625, 0.416656494140625, 0.4397430419921875, 0.46282958984375, 0.4859161376953125, 0.509002685546875, 0.5320892333984375, 0.55517578125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 9.0, 3.0, 7.0, 6.0, 8.0, 13.0, 16.0, 14.0, 17.0, 25.0, 22.0, 20.0, 32.0, 49.0, 27.0, 23.0, 46.0, 37.0, 43.0, 52.0, 49.0, 45.0, 43.0, 45.0, 34.0, 42.0, 39.0, 30.0, 21.0, 30.0, 22.0, 18.0, 28.0, 17.0, 16.0, 10.0, 11.0, 8.0, 6.0, 3.0, 2.0, 3.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0718994140625, -0.06975078582763672, -0.06760215759277344, -0.06545352935791016, -0.06330490112304688, -0.061156272888183594, -0.05900764465332031, -0.05685901641845703, -0.05471038818359375, -0.05256175994873047, -0.05041313171386719, -0.048264503479003906, -0.046115875244140625, -0.043967247009277344, -0.04181861877441406, -0.03966999053955078, -0.0375213623046875, -0.03537273406982422, -0.03322410583496094, -0.031075477600097656, -0.028926849365234375, -0.026778221130371094, -0.024629592895507812, -0.02248096466064453, -0.02033233642578125, -0.01818370819091797, -0.016035079956054688, -0.013886451721191406, -0.011737823486328125, -0.009589195251464844, -0.0074405670166015625, -0.005291938781738281, -0.003143310546875, -0.0009946823120117188, 0.0011539459228515625, 0.0033025741577148438, 0.005451202392578125, 0.007599830627441406, 0.009748458862304688, 0.011897087097167969, 0.01404571533203125, 0.01619434356689453, 0.018342971801757812, 0.020491600036621094, 0.022640228271484375, 0.024788856506347656, 0.026937484741210938, 0.02908611297607422, 0.0312347412109375, 0.03338336944580078, 0.03553199768066406, 0.037680625915527344, 0.039829254150390625, 0.041977882385253906, 0.04412651062011719, 0.04627513885498047, 0.04842376708984375, 0.05057239532470703, 0.05272102355957031, 0.054869651794433594, 0.057018280029296875, 0.059166908264160156, 0.06131553649902344, 0.06346416473388672, 0.06561279296875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 8.0, 11.0, 12.0, 10.0, 18.0, 28.0, 38.0, 41.0, 42.0, 80.0, 83.0, 130.0, 201.0, 283.0, 564.0, 1053.0, 2331.0, 6725.0, 29851.0, 3927393.0, 200893.0, 16234.0, 4345.0, 1717.0, 784.0, 412.0, 269.0, 211.0, 121.0, 104.0, 64.0, 58.0, 53.0, 39.0, 19.0, 17.0, 13.0, 8.0, 10.0, 5.0, 2.0, 1.0, 7.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9208984375, -0.888946533203125, -0.85699462890625, -0.825042724609375, -0.7930908203125, -0.761138916015625, -0.72918701171875, -0.697235107421875, -0.665283203125, -0.633331298828125, -0.60137939453125, -0.569427490234375, -0.5374755859375, -0.505523681640625, -0.47357177734375, -0.441619873046875, -0.40966796875, -0.377716064453125, -0.34576416015625, -0.313812255859375, -0.2818603515625, -0.249908447265625, -0.21795654296875, -0.186004638671875, -0.154052734375, -0.122100830078125, -0.09014892578125, -0.058197021484375, -0.0262451171875, 0.005706787109375, 0.03765869140625, 0.069610595703125, 0.1015625, 0.133514404296875, 0.16546630859375, 0.197418212890625, 0.2293701171875, 0.261322021484375, 0.29327392578125, 0.325225830078125, 0.357177734375, 0.389129638671875, 0.42108154296875, 0.453033447265625, 0.4849853515625, 0.516937255859375, 0.54888916015625, 0.580841064453125, 0.61279296875, 0.644744873046875, 0.67669677734375, 0.708648681640625, 0.7406005859375, 0.772552490234375, 0.80450439453125, 0.836456298828125, 0.868408203125, 0.900360107421875, 0.93231201171875, 0.964263916015625, 0.9962158203125, 1.028167724609375, 1.06011962890625, 1.092071533203125, 1.1240234375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 6.0, 13.0, 16.0, 25.0, 68.0, 167.0, 3288.0, 333.0, 68.0, 37.0, 16.0, 11.0, 5.0, 5.0, 2.0, 8.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.187255859375, -0.18094825744628906, -0.17464065551757812, -0.1683330535888672, -0.16202545166015625, -0.1557178497314453, -0.14941024780273438, -0.14310264587402344, -0.1367950439453125, -0.13048744201660156, -0.12417984008789062, -0.11787223815917969, -0.11156463623046875, -0.10525703430175781, -0.09894943237304688, -0.09264183044433594, -0.086334228515625, -0.08002662658691406, -0.07371902465820312, -0.06741142272949219, -0.06110382080078125, -0.05479621887207031, -0.048488616943359375, -0.04218101501464844, -0.0358734130859375, -0.029565811157226562, -0.023258209228515625, -0.016950607299804688, -0.01064300537109375, -0.0043354034423828125, 0.001972198486328125, 0.008279800415039062, 0.01458740234375, 0.020895004272460938, 0.027202606201171875, 0.03351020812988281, 0.03981781005859375, 0.04612541198730469, 0.052433013916015625, 0.05874061584472656, 0.0650482177734375, 0.07135581970214844, 0.07766342163085938, 0.08397102355957031, 0.09027862548828125, 0.09658622741699219, 0.10289382934570312, 0.10920143127441406, 0.115509033203125, 0.12181663513183594, 0.12812423706054688, 0.1344318389892578, 0.14073944091796875, 0.1470470428466797, 0.15335464477539062, 0.15966224670410156, 0.1659698486328125, 0.17227745056152344, 0.17858505249023438, 0.1848926544189453, 0.19120025634765625, 0.1975078582763672, 0.20381546020507812, 0.21012306213378906, 0.2164306640625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 8.0, 16.0, 13.0, 29.0, 46.0, 76.0, 92.0, 125.0, 139.0, 122.0, 95.0, 77.0, 66.0, 40.0, 17.0, 16.0, 9.0, 11.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4653366804122925, -0.441852331161499, -0.41836798191070557, -0.3948836326599121, -0.37139928340911865, -0.3479149341583252, -0.3244306147098541, -0.30094626545906067, -0.2774619162082672, -0.25397756695747375, -0.2304932177066803, -0.20700888335704803, -0.18352453410625458, -0.16004018485546112, -0.13655585050582886, -0.1130715012550354, -0.08958715200424194, -0.06610280275344849, -0.042618460953235626, -0.019134119153022766, 0.004350230097770691, 0.027834579348564148, 0.05131891369819641, 0.07480326294898987, 0.09828761219978333, 0.12177196145057678, 0.14525631070137024, 0.1687406450510025, 0.19222499430179596, 0.21570934355258942, 0.23919367790222168, 0.26267802715301514, 0.2861623764038086, 0.30964672565460205, 0.3331310749053955, 0.35661542415618896, 0.3800997734069824, 0.4035841226577759, 0.42706844210624695, 0.4505527913570404, 0.47403714060783386, 0.4975214898586273, 0.5210058093070984, 0.5444901585578918, 0.5679745078086853, 0.5914588570594788, 0.6149432063102722, 0.6384275555610657, 0.6619119048118591, 0.6853962540626526, 0.708880603313446, 0.7323649525642395, 0.755849301815033, 0.7793336510658264, 0.8028179407119751, 0.8263022899627686, 0.849786639213562, 0.8732709884643555, 0.8967553377151489, 0.9202396869659424, 0.9437240362167358, 0.9672083854675293, 0.9906927347183228, 1.0141770839691162, 1.0376614332199097]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 4.0, 4.0, 9.0, 10.0, 7.0, 9.0, 10.0, 13.0, 16.0, 23.0, 20.0, 28.0, 25.0, 36.0, 44.0, 41.0, 34.0, 46.0, 35.0, 55.0, 47.0, 51.0, 37.0, 44.0, 35.0, 37.0, 30.0, 28.0, 32.0, 21.0, 28.0, 25.0, 14.0, 24.0, 16.0, 23.0, 11.0, 9.0, 6.0, 4.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26968783140182495, -0.259859174489975, -0.2500304877758026, -0.24020181596279144, -0.23037314414978027, -0.2205444872379303, -0.21071581542491913, -0.20088714361190796, -0.1910584717988968, -0.18122979998588562, -0.17140112817287445, -0.16157245635986328, -0.1517437994480133, -0.14191511273384094, -0.13208645582199097, -0.1222577840089798, -0.11242911219596863, -0.10260044038295746, -0.09277176856994629, -0.08294310420751572, -0.07311443239450455, -0.06328576058149338, -0.05345709249377251, -0.043628424406051636, -0.033799752593040466, -0.023971082642674446, -0.014142412692308426, -0.004313742741942406, 0.0055149272084236145, 0.015343599021434784, 0.025172267109155655, 0.035000935196876526, 0.044829607009887695, 0.054658278822898865, 0.06448695063591003, 0.0743156149983406, 0.08414428681135178, 0.09397295862436295, 0.10380162298679352, 0.11363029479980469, 0.12345896661281586, 0.13328763842582703, 0.1431163102388382, 0.15294498205184937, 0.16277363896369934, 0.1726023256778717, 0.18243098258972168, 0.19225965440273285, 0.20208832621574402, 0.2119169980287552, 0.22174566984176636, 0.23157434165477753, 0.2414030134677887, 0.25123167037963867, 0.26106035709381104, 0.270889014005661, 0.280717670917511, 0.29054632782936096, 0.3003750145435333, 0.3102036714553833, 0.32003235816955566, 0.32986101508140564, 0.339689701795578, 0.349518358707428, 0.35934704542160034]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 5.0, 4.0, 3.0, 1.0, 6.0, 8.0, 24.0, 26.0, 29.0, 49.0, 65.0, 123.0, 238.0, 365.0, 570.0, 1013.0, 1727.0, 3059.0, 5683.0, 10843.0, 20971.0, 41697.0, 81778.0, 153324.0, 229099.0, 216496.0, 135413.0, 70692.0, 36114.0, 18224.0, 9478.0, 5047.0, 2606.0, 1606.0, 859.0, 491.0, 299.0, 197.0, 99.0, 78.0, 55.0, 29.0, 19.0, 15.0, 13.0, 11.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2093505859375, -0.2029857635498047, -0.19662094116210938, -0.19025611877441406, -0.18389129638671875, -0.17752647399902344, -0.17116165161132812, -0.1647968292236328, -0.1584320068359375, -0.1520671844482422, -0.14570236206054688, -0.13933753967285156, -0.13297271728515625, -0.12660789489746094, -0.12024307250976562, -0.11387825012207031, -0.107513427734375, -0.10114860534667969, -0.09478378295898438, -0.08841896057128906, -0.08205413818359375, -0.07568931579589844, -0.06932449340820312, -0.06295967102050781, -0.0565948486328125, -0.05023002624511719, -0.043865203857421875, -0.03750038146972656, -0.03113555908203125, -0.024770736694335938, -0.018405914306640625, -0.012041091918945312, -0.00567626953125, 0.0006885528564453125, 0.007053375244140625, 0.013418197631835938, 0.01978302001953125, 0.026147842407226562, 0.032512664794921875, 0.03887748718261719, 0.0452423095703125, 0.05160713195800781, 0.057971954345703125, 0.06433677673339844, 0.07070159912109375, 0.07706642150878906, 0.08343124389648438, 0.08979606628417969, 0.096160888671875, 0.10252571105957031, 0.10889053344726562, 0.11525535583496094, 0.12162017822265625, 0.12798500061035156, 0.13434982299804688, 0.1407146453857422, 0.1470794677734375, 0.1534442901611328, 0.15980911254882812, 0.16617393493652344, 0.17253875732421875, 0.17890357971191406, 0.18526840209960938, 0.1916332244873047, 0.197998046875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 6.0, 7.0, 8.0, 12.0, 9.0, 22.0, 12.0, 16.0, 15.0, 26.0, 27.0, 39.0, 36.0, 44.0, 40.0, 41.0, 42.0, 56.0, 43.0, 51.0, 46.0, 48.0, 47.0, 47.0, 44.0, 35.0, 30.0, 31.0, 19.0, 14.0, 17.0, 18.0, 10.0, 14.0, 5.0, 9.0, 8.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.09375, -0.09087657928466797, -0.08800315856933594, -0.0851297378540039, -0.08225631713867188, -0.07938289642333984, -0.07650947570800781, -0.07363605499267578, -0.07076263427734375, -0.06788921356201172, -0.06501579284667969, -0.062142372131347656, -0.059268951416015625, -0.056395530700683594, -0.05352210998535156, -0.05064868927001953, -0.0477752685546875, -0.04490184783935547, -0.04202842712402344, -0.039155006408691406, -0.036281585693359375, -0.033408164978027344, -0.030534744262695312, -0.02766132354736328, -0.02478790283203125, -0.02191448211669922, -0.019041061401367188, -0.016167640686035156, -0.013294219970703125, -0.010420799255371094, -0.0075473785400390625, -0.004673957824707031, -0.001800537109375, 0.0010728836059570312, 0.0039463043212890625, 0.006819725036621094, 0.009693145751953125, 0.012566566467285156, 0.015439987182617188, 0.01831340789794922, 0.02118682861328125, 0.02406024932861328, 0.026933670043945312, 0.029807090759277344, 0.032680511474609375, 0.035553932189941406, 0.03842735290527344, 0.04130077362060547, 0.0441741943359375, 0.04704761505126953, 0.04992103576660156, 0.052794456481933594, 0.055667877197265625, 0.058541297912597656, 0.06141471862792969, 0.06428813934326172, 0.06716156005859375, 0.07003498077392578, 0.07290840148925781, 0.07578182220458984, 0.07865524291992188, 0.0815286636352539, 0.08440208435058594, 0.08727550506591797, 0.09014892578125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 0.0, 1.0, 4.0, 3.0, 7.0, 5.0, 7.0, 12.0, 15.0, 21.0, 26.0, 35.0, 50.0, 66.0, 108.0, 131.0, 193.0, 230.0, 399.0, 648.0, 1027.0, 2175.0, 6023.0, 22617.0, 130454.0, 603618.0, 229236.0, 36424.0, 8515.0, 2905.0, 1359.0, 754.0, 441.0, 304.0, 218.0, 140.0, 115.0, 78.0, 48.0, 37.0, 23.0, 26.0, 12.0, 13.0, 11.0, 5.0, 0.0, 4.0, 2.0, 7.0, 5.0, 2.0, 0.0, 1.0, 2.0, 3.0], "bins": [-0.56884765625, -0.55194091796875, -0.5350341796875, -0.51812744140625, -0.501220703125, -0.48431396484375, -0.4674072265625, -0.45050048828125, -0.43359375, -0.41668701171875, -0.3997802734375, -0.38287353515625, -0.365966796875, -0.34906005859375, -0.3321533203125, -0.31524658203125, -0.29833984375, -0.28143310546875, -0.2645263671875, -0.24761962890625, -0.230712890625, -0.21380615234375, -0.1968994140625, -0.17999267578125, -0.1630859375, -0.14617919921875, -0.1292724609375, -0.11236572265625, -0.095458984375, -0.07855224609375, -0.0616455078125, -0.04473876953125, -0.02783203125, -0.01092529296875, 0.0059814453125, 0.02288818359375, 0.039794921875, 0.05670166015625, 0.0736083984375, 0.09051513671875, 0.107421875, 0.12432861328125, 0.1412353515625, 0.15814208984375, 0.175048828125, 0.19195556640625, 0.2088623046875, 0.22576904296875, 0.24267578125, 0.25958251953125, 0.2764892578125, 0.29339599609375, 0.310302734375, 0.32720947265625, 0.3441162109375, 0.36102294921875, 0.3779296875, 0.39483642578125, 0.4117431640625, 0.42864990234375, 0.445556640625, 0.46246337890625, 0.4793701171875, 0.49627685546875, 0.51318359375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 5.0, 6.0, 2.0, 7.0, 5.0, 7.0, 12.0, 6.0, 25.0, 22.0, 13.0, 16.0, 20.0, 21.0, 24.0, 35.0, 38.0, 30.0, 38.0, 37.0, 39.0, 49.0, 35.0, 32.0, 40.0, 53.0, 32.0, 41.0, 31.0, 39.0, 27.0, 25.0, 31.0, 28.0, 11.0, 20.0, 16.0, 15.0, 13.0, 15.0, 10.0, 9.0, 6.0, 5.0, 7.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.441650390625, -0.42737579345703125, -0.4131011962890625, -0.39882659912109375, -0.384552001953125, -0.37027740478515625, -0.3560028076171875, -0.34172821044921875, -0.32745361328125, -0.31317901611328125, -0.2989044189453125, -0.28462982177734375, -0.270355224609375, -0.25608062744140625, -0.2418060302734375, -0.22753143310546875, -0.2132568359375, -0.19898223876953125, -0.1847076416015625, -0.17043304443359375, -0.156158447265625, -0.14188385009765625, -0.1276092529296875, -0.11333465576171875, -0.09906005859375, -0.08478546142578125, -0.0705108642578125, -0.05623626708984375, -0.041961669921875, -0.02768707275390625, -0.0134124755859375, 0.00086212158203125, 0.01513671875, 0.02941131591796875, 0.0436859130859375, 0.05796051025390625, 0.072235107421875, 0.08650970458984375, 0.1007843017578125, 0.11505889892578125, 0.12933349609375, 0.14360809326171875, 0.1578826904296875, 0.17215728759765625, 0.186431884765625, 0.20070648193359375, 0.2149810791015625, 0.22925567626953125, 0.2435302734375, 0.25780487060546875, 0.2720794677734375, 0.28635406494140625, 0.300628662109375, 0.31490325927734375, 0.3291778564453125, 0.34345245361328125, 0.35772705078125, 0.37200164794921875, 0.3862762451171875, 0.40055084228515625, 0.414825439453125, 0.42910003662109375, 0.4433746337890625, 0.45764923095703125, 0.471923828125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 9.0, 15.0, 18.0, 17.0, 26.0, 37.0, 64.0, 112.0, 174.0, 276.0, 511.0, 1028.0, 2007.0, 4713.0, 13567.0, 48078.0, 226797.0, 544022.0, 154179.0, 34721.0, 10557.0, 3907.0, 1774.0, 791.0, 487.0, 220.0, 147.0, 102.0, 58.0, 47.0, 25.0, 12.0, 11.0, 15.0, 9.0, 6.0, 1.0, 4.0, 7.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2064208984375, -0.19914817810058594, -0.19187545776367188, -0.1846027374267578, -0.17733001708984375, -0.1700572967529297, -0.16278457641601562, -0.15551185607910156, -0.1482391357421875, -0.14096641540527344, -0.13369369506835938, -0.1264209747314453, -0.11914825439453125, -0.11187553405761719, -0.10460281372070312, -0.09733009338378906, -0.090057373046875, -0.08278465270996094, -0.07551193237304688, -0.06823921203613281, -0.06096649169921875, -0.05369377136230469, -0.046421051025390625, -0.03914833068847656, -0.0318756103515625, -0.024602890014648438, -0.017330169677734375, -0.010057449340820312, -0.00278472900390625, 0.0044879913330078125, 0.011760711669921875, 0.019033432006835938, 0.02630615234375, 0.03357887268066406, 0.040851593017578125, 0.04812431335449219, 0.05539703369140625, 0.06266975402832031, 0.06994247436523438, 0.07721519470214844, 0.0844879150390625, 0.09176063537597656, 0.09903335571289062, 0.10630607604980469, 0.11357879638671875, 0.12085151672363281, 0.12812423706054688, 0.13539695739746094, 0.142669677734375, 0.14994239807128906, 0.15721511840820312, 0.1644878387451172, 0.17176055908203125, 0.1790332794189453, 0.18630599975585938, 0.19357872009277344, 0.2008514404296875, 0.20812416076660156, 0.21539688110351562, 0.2226696014404297, 0.22994232177734375, 0.2372150421142578, 0.24448776245117188, 0.25176048278808594, 0.259033203125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 8.0, 4.0, 3.0, 12.0, 14.0, 22.0, 42.0, 65.0, 81.0, 98.0, 101.0, 130.0, 107.0, 89.0, 67.0, 51.0, 47.0, 31.0, 13.0, 8.0, 11.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00023412704467773438, -0.00022896192967891693, -0.0002237968146800995, -0.00021863169968128204, -0.0002134665846824646, -0.00020830146968364716, -0.0002031363546848297, -0.00019797123968601227, -0.00019280612468719482, -0.00018764100968837738, -0.00018247589468955994, -0.0001773107796907425, -0.00017214566469192505, -0.0001669805496931076, -0.00016181543469429016, -0.00015665031969547272, -0.00015148520469665527, -0.00014632008969783783, -0.00014115497469902039, -0.00013598985970020294, -0.0001308247447013855, -0.00012565962970256805, -0.00012049451470375061, -0.00011532939970493317, -0.00011016428470611572, -0.00010499916970729828, -9.983405470848083e-05, -9.466893970966339e-05, -8.950382471084595e-05, -8.43387097120285e-05, -7.917359471321106e-05, -7.400847971439362e-05, -6.884336471557617e-05, -6.367824971675873e-05, -5.8513134717941284e-05, -5.334801971912384e-05, -4.8182904720306396e-05, -4.301778972148895e-05, -3.785267472267151e-05, -3.2687559723854065e-05, -2.752244472503662e-05, -2.2357329726219177e-05, -1.7192214727401733e-05, -1.202709972858429e-05, -6.861984729766846e-06, -1.6968697309494019e-06, 3.468245267868042e-06, 8.633360266685486e-06, 1.379847526550293e-05, 1.8963590264320374e-05, 2.4128705263137817e-05, 2.929382026195526e-05, 3.4458935260772705e-05, 3.962405025959015e-05, 4.478916525840759e-05, 4.995428025722504e-05, 5.511939525604248e-05, 6.0284510254859924e-05, 6.544962525367737e-05, 7.061474025249481e-05, 7.577985525131226e-05, 8.09449702501297e-05, 8.611008524894714e-05, 9.127520024776459e-05, 9.644031524658203e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 13.0, 14.0, 27.0, 34.0, 37.0, 68.0, 124.0, 257.0, 508.0, 1077.0, 2599.0, 8946.0, 51394.0, 512146.0, 417017.0, 42267.0, 7668.0, 2358.0, 948.0, 461.0, 232.0, 152.0, 73.0, 49.0, 30.0, 21.0, 12.0, 9.0, 6.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.335205078125, -0.3243751525878906, -0.31354522705078125, -0.3027153015136719, -0.2918853759765625, -0.2810554504394531, -0.27022552490234375, -0.2593955993652344, -0.248565673828125, -0.23773574829101562, -0.22690582275390625, -0.21607589721679688, -0.2052459716796875, -0.19441604614257812, -0.18358612060546875, -0.17275619506835938, -0.16192626953125, -0.15109634399414062, -0.14026641845703125, -0.12943649291992188, -0.1186065673828125, -0.10777664184570312, -0.09694671630859375, -0.08611679077148438, -0.075286865234375, -0.06445693969726562, -0.05362701416015625, -0.042797088623046875, -0.0319671630859375, -0.021137237548828125, -0.01030731201171875, 0.000522613525390625, 0.0113525390625, 0.022182464599609375, 0.03301239013671875, 0.043842315673828125, 0.0546722412109375, 0.06550216674804688, 0.07633209228515625, 0.08716201782226562, 0.097991943359375, 0.10882186889648438, 0.11965179443359375, 0.13048171997070312, 0.1413116455078125, 0.15214157104492188, 0.16297149658203125, 0.17380142211914062, 0.18463134765625, 0.19546127319335938, 0.20629119873046875, 0.21712112426757812, 0.2279510498046875, 0.23878097534179688, 0.24961090087890625, 0.2604408264160156, 0.271270751953125, 0.2821006774902344, 0.29293060302734375, 0.3037605285644531, 0.3145904541015625, 0.3254203796386719, 0.33625030517578125, 0.3470802307128906, 0.35791015625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 2.0, 1.0, 6.0, 2.0, 11.0, 9.0, 3.0, 11.0, 21.0, 32.0, 42.0, 77.0, 96.0, 104.0, 91.0, 115.0, 78.0, 77.0, 64.0, 42.0, 34.0, 29.0, 14.0, 16.0, 12.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29052734375, -0.2820281982421875, -0.273529052734375, -0.2650299072265625, -0.25653076171875, -0.2480316162109375, -0.239532470703125, -0.2310333251953125, -0.2225341796875, -0.2140350341796875, -0.205535888671875, -0.1970367431640625, -0.18853759765625, -0.1800384521484375, -0.171539306640625, -0.1630401611328125, -0.154541015625, -0.1460418701171875, -0.137542724609375, -0.1290435791015625, -0.12054443359375, -0.1120452880859375, -0.103546142578125, -0.0950469970703125, -0.0865478515625, -0.0780487060546875, -0.069549560546875, -0.0610504150390625, -0.05255126953125, -0.0440521240234375, -0.035552978515625, -0.0270538330078125, -0.0185546875, -0.0100555419921875, -0.001556396484375, 0.0069427490234375, 0.01544189453125, 0.0239410400390625, 0.032440185546875, 0.0409393310546875, 0.0494384765625, 0.0579376220703125, 0.066436767578125, 0.0749359130859375, 0.08343505859375, 0.0919342041015625, 0.100433349609375, 0.1089324951171875, 0.117431640625, 0.1259307861328125, 0.134429931640625, 0.1429290771484375, 0.15142822265625, 0.1599273681640625, 0.168426513671875, 0.1769256591796875, 0.1854248046875, 0.1939239501953125, 0.202423095703125, 0.2109222412109375, 0.21942138671875, 0.2279205322265625, 0.236419677734375, 0.2449188232421875, 0.25341796875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 8.0, 17.0, 66.0, 182.0, 264.0, 264.0, 130.0, 63.0, 10.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.13332748413086, -13.860851287841797, -13.58837604522705, -13.315899848937988, -13.043423652648926, -12.77094841003418, -12.498472213745117, -12.225996017456055, -11.953519821166992, -11.68104362487793, -11.408568382263184, -11.136092185974121, -10.863615989685059, -10.591140747070312, -10.31866455078125, -10.046188354492188, -9.773713111877441, -9.501236915588379, -9.228761672973633, -8.95628547668457, -8.683809280395508, -8.411333084106445, -8.1388578414917, -7.866381645202637, -7.593905925750732, -7.321430206298828, -7.048954010009766, -6.776478290557861, -6.504002571105957, -6.2315263748168945, -5.95905065536499, -5.686574935913086, -5.414098739624023, -5.141623020172119, -4.869146823883057, -4.596671104431152, -4.32419490814209, -4.0517191886901855, -3.7792434692382812, -3.506767511367798, -3.2342917919158936, -2.96181583404541, -2.689340114593506, -2.4168641567230225, -2.144388198852539, -1.8719122409820557, -1.5994364023208618, -1.326960563659668, -1.0544846057891846, -0.782008707523346, -0.5095328092575073, -0.2370569109916687, 0.03541898727416992, 0.3078949451446533, 0.5803707838058472, 0.852846622467041, 1.1253225803375244, 1.3977985382080078, 1.6702743768692017, 1.9427502155303955, 2.215226173400879, 2.4877021312713623, 2.7601780891418457, 3.03265380859375, 3.3051297664642334]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 7.0, 7.0, 6.0, 11.0, 12.0, 10.0, 20.0, 7.0, 21.0, 15.0, 24.0, 24.0, 30.0, 35.0, 42.0, 53.0, 50.0, 54.0, 54.0, 59.0, 44.0, 48.0, 48.0, 47.0, 39.0, 40.0, 29.0, 40.0, 20.0, 25.0, 21.0, 17.0, 15.0, 7.0, 8.0, 4.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.524672031402588, -2.429678440093994, -2.3346848487854004, -2.2396912574768066, -2.144697904586792, -2.0497043132781982, -1.9547107219696045, -1.8597171306610107, -1.764723539352417, -1.6697299480438232, -1.574736475944519, -1.4797428846359253, -1.3847492933273315, -1.2897558212280273, -1.1947622299194336, -1.0997686386108398, -1.0047751665115356, -0.9097816348075867, -0.8147880434989929, -0.719794511795044, -0.6248009204864502, -0.5298073887825012, -0.43481385707855225, -0.3398202657699585, -0.24482673406600952, -0.14983317255973816, -0.05483962595462799, 0.04015392065048218, 0.13514748215675354, 0.2301410436630249, 0.3251345753669739, 0.4201281666755676, 0.5151216983795166, 0.6101152300834656, 0.7051088213920593, 0.8001023530960083, 0.895095944404602, 0.990089476108551, 1.0850830078125, 1.1800765991210938, 1.2750701904296875, 1.3700637817382812, 1.4650572538375854, 1.5600508451461792, 1.655044436454773, 1.7500379085540771, 1.845031499862671, 1.9400250911712646, 2.0350184440612793, 2.130012035369873, 2.225005626678467, 2.3199992179870605, 2.414992570877075, 2.509986162185669, 2.6049797534942627, 2.6999733448028564, 2.79496693611145, 2.889960527420044, 2.9849541187286377, 3.0799474716186523, 3.174941062927246, 3.26993465423584, 3.3649282455444336, 3.4599218368530273, 3.554915428161621]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 7.0, 2.0, 4.0, 2.0, 11.0, 13.0, 12.0, 21.0, 19.0, 29.0, 44.0, 56.0, 75.0, 112.0, 180.0, 208.0, 359.0, 578.0, 810.0, 1513.0, 2694.0, 6037.0, 15480.0, 61868.0, 3881574.0, 178863.0, 25789.0, 9007.0, 3931.0, 1948.0, 1061.0, 624.0, 401.0, 268.0, 191.0, 139.0, 89.0, 84.0, 56.0, 36.0, 25.0, 18.0, 17.0, 14.0, 9.0, 3.0, 2.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.55322265625, -0.5377349853515625, -0.522247314453125, -0.5067596435546875, -0.49127197265625, -0.4757843017578125, -0.460296630859375, -0.4448089599609375, -0.4293212890625, -0.4138336181640625, -0.398345947265625, -0.3828582763671875, -0.36737060546875, -0.3518829345703125, -0.336395263671875, -0.3209075927734375, -0.305419921875, -0.2899322509765625, -0.274444580078125, -0.2589569091796875, -0.24346923828125, -0.2279815673828125, -0.212493896484375, -0.1970062255859375, -0.1815185546875, -0.1660308837890625, -0.150543212890625, -0.1350555419921875, -0.11956787109375, -0.1040802001953125, -0.088592529296875, -0.0731048583984375, -0.0576171875, -0.0421295166015625, -0.026641845703125, -0.0111541748046875, 0.00433349609375, 0.0198211669921875, 0.035308837890625, 0.0507965087890625, 0.0662841796875, 0.0817718505859375, 0.097259521484375, 0.1127471923828125, 0.12823486328125, 0.1437225341796875, 0.159210205078125, 0.1746978759765625, 0.190185546875, 0.2056732177734375, 0.221160888671875, 0.2366485595703125, 0.25213623046875, 0.2676239013671875, 0.283111572265625, 0.2985992431640625, 0.3140869140625, 0.3295745849609375, 0.345062255859375, 0.3605499267578125, 0.37603759765625, 0.3915252685546875, 0.407012939453125, 0.4225006103515625, 0.43798828125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 7.0, 6.0, 11.0, 11.0, 10.0, 11.0, 9.0, 17.0, 28.0, 26.0, 35.0, 45.0, 51.0, 43.0, 47.0, 51.0, 44.0, 56.0, 65.0, 41.0, 36.0, 45.0, 58.0, 35.0, 36.0, 28.0, 33.0, 20.0, 21.0, 11.0, 16.0, 10.0, 10.0, 5.0, 8.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1136474609375, -0.1103668212890625, -0.107086181640625, -0.1038055419921875, -0.10052490234375, -0.0972442626953125, -0.093963623046875, -0.0906829833984375, -0.08740234375, -0.0841217041015625, -0.080841064453125, -0.0775604248046875, -0.07427978515625, -0.0709991455078125, -0.067718505859375, -0.0644378662109375, -0.0611572265625, -0.0578765869140625, -0.054595947265625, -0.0513153076171875, -0.04803466796875, -0.0447540283203125, -0.041473388671875, -0.0381927490234375, -0.034912109375, -0.0316314697265625, -0.028350830078125, -0.0250701904296875, -0.02178955078125, -0.0185089111328125, -0.015228271484375, -0.0119476318359375, -0.0086669921875, -0.0053863525390625, -0.002105712890625, 0.0011749267578125, 0.00445556640625, 0.0077362060546875, 0.011016845703125, 0.0142974853515625, 0.017578125, 0.0208587646484375, 0.024139404296875, 0.0274200439453125, 0.03070068359375, 0.0339813232421875, 0.037261962890625, 0.0405426025390625, 0.0438232421875, 0.0471038818359375, 0.050384521484375, 0.0536651611328125, 0.05694580078125, 0.0602264404296875, 0.063507080078125, 0.0667877197265625, 0.070068359375, 0.0733489990234375, 0.076629638671875, 0.0799102783203125, 0.08319091796875, 0.0864715576171875, 0.089752197265625, 0.0930328369140625, 0.0963134765625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 6.0, 15.0, 19.0, 15.0, 15.0, 33.0, 37.0, 53.0, 77.0, 92.0, 147.0, 180.0, 261.0, 407.0, 509.0, 826.0, 1415.0, 2516.0, 6460.0, 30672.0, 3887442.0, 236486.0, 16454.0, 4525.0, 2060.0, 1161.0, 739.0, 472.0, 329.0, 241.0, 175.0, 117.0, 84.0, 66.0, 38.0, 42.0, 25.0, 22.0, 13.0, 15.0, 7.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0087890625, -0.9749755859375, -0.941162109375, -0.9073486328125, -0.87353515625, -0.8397216796875, -0.805908203125, -0.7720947265625, -0.73828125, -0.7044677734375, -0.670654296875, -0.6368408203125, -0.60302734375, -0.5692138671875, -0.535400390625, -0.5015869140625, -0.4677734375, -0.4339599609375, -0.400146484375, -0.3663330078125, -0.33251953125, -0.2987060546875, -0.264892578125, -0.2310791015625, -0.197265625, -0.1634521484375, -0.129638671875, -0.0958251953125, -0.06201171875, -0.0281982421875, 0.005615234375, 0.0394287109375, 0.0732421875, 0.1070556640625, 0.140869140625, 0.1746826171875, 0.20849609375, 0.2423095703125, 0.276123046875, 0.3099365234375, 0.34375, 0.3775634765625, 0.411376953125, 0.4451904296875, 0.47900390625, 0.5128173828125, 0.546630859375, 0.5804443359375, 0.6142578125, 0.6480712890625, 0.681884765625, 0.7156982421875, 0.74951171875, 0.7833251953125, 0.817138671875, 0.8509521484375, 0.884765625, 0.9185791015625, 0.952392578125, 0.9862060546875, 1.02001953125, 1.0538330078125, 1.087646484375, 1.1214599609375, 1.1552734375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 4.0, 3.0, 1.0, 3.0, 4.0, 4.0, 6.0, 12.0, 30.0, 57.0, 161.0, 3244.0, 369.0, 104.0, 27.0, 18.0, 10.0, 13.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.263427734375, -0.25484466552734375, -0.2462615966796875, -0.23767852783203125, -0.229095458984375, -0.22051239013671875, -0.2119293212890625, -0.20334625244140625, -0.19476318359375, -0.18618011474609375, -0.1775970458984375, -0.16901397705078125, -0.160430908203125, -0.15184783935546875, -0.1432647705078125, -0.13468170166015625, -0.1260986328125, -0.11751556396484375, -0.1089324951171875, -0.10034942626953125, -0.091766357421875, -0.08318328857421875, -0.0746002197265625, -0.06601715087890625, -0.05743408203125, -0.04885101318359375, -0.0402679443359375, -0.03168487548828125, -0.023101806640625, -0.01451873779296875, -0.0059356689453125, 0.00264739990234375, 0.01123046875, 0.01981353759765625, 0.0283966064453125, 0.03697967529296875, 0.045562744140625, 0.05414581298828125, 0.0627288818359375, 0.07131195068359375, 0.07989501953125, 0.08847808837890625, 0.0970611572265625, 0.10564422607421875, 0.114227294921875, 0.12281036376953125, 0.1313934326171875, 0.13997650146484375, 0.1485595703125, 0.15714263916015625, 0.1657257080078125, 0.17430877685546875, 0.182891845703125, 0.19147491455078125, 0.2000579833984375, 0.20864105224609375, 0.21722412109375, 0.22580718994140625, 0.2343902587890625, 0.24297332763671875, 0.251556396484375, 0.26013946533203125, 0.2687225341796875, 0.27730560302734375, 0.285888671875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 5.0, 8.0, 7.0, 21.0, 20.0, 31.0, 57.0, 61.0, 84.0, 119.0, 127.0, 123.0, 96.0, 86.0, 52.0, 41.0, 24.0, 17.0, 10.0, 3.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2159082889556885, -1.1850411891937256, -1.1541740894317627, -1.1233069896697998, -1.092439889907837, -1.061572790145874, -1.0307056903839111, -0.9998385906219482, -0.9689714908599854, -0.9381043910980225, -0.9072372913360596, -0.8763701915740967, -0.8455030918121338, -0.8146359920501709, -0.783768892288208, -0.7529017925262451, -0.7220346331596375, -0.6911675333976746, -0.6603004336357117, -0.6294333338737488, -0.5985662341117859, -0.567699134349823, -0.5368319749832153, -0.5059648752212524, -0.47509780526161194, -0.44423070549964905, -0.41336360573768616, -0.3824964761734009, -0.351629376411438, -0.3207622766494751, -0.2898951768875122, -0.2590280771255493, -0.22816097736358643, -0.19729387760162354, -0.16642677783966064, -0.13555966317653656, -0.10469256341457367, -0.07382546365261078, -0.042958348989486694, -0.012091249227523804, 0.018775850534439087, 0.049642954021692276, 0.08051005750894547, 0.11137716472148895, 0.14224426448345184, 0.17311136424541473, 0.20397847890853882, 0.2348455786705017, 0.2657126784324646, 0.2965797781944275, 0.3274468779563904, 0.35831397771835327, 0.38918107748031616, 0.42004817724227905, 0.45091530680656433, 0.4817824065685272, 0.5126495361328125, 0.5435166358947754, 0.5743837356567383, 0.6052508354187012, 0.6361179351806641, 0.666985034942627, 0.6978521347045898, 0.7287192344665527, 0.7595863342285156]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 5.0, 0.0, 4.0, 3.0, 2.0, 6.0, 6.0, 10.0, 15.0, 9.0, 14.0, 15.0, 15.0, 21.0, 18.0, 23.0, 27.0, 28.0, 27.0, 34.0, 29.0, 50.0, 35.0, 34.0, 38.0, 47.0, 31.0, 36.0, 45.0, 40.0, 40.0, 35.0, 23.0, 30.0, 35.0, 30.0, 18.0, 15.0, 19.0, 13.0, 16.0, 14.0, 11.0, 16.0, 11.0, 2.0, 5.0, 7.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.47331738471984863, -0.4597143530845642, -0.4461112916469574, -0.432508260011673, -0.41890519857406616, -0.40530216693878174, -0.3916991055011749, -0.3780960738658905, -0.3644930124282837, -0.35088998079299927, -0.33728691935539246, -0.32368388772010803, -0.3100808262825012, -0.2964777946472168, -0.28287473320961, -0.26927170157432556, -0.25566864013671875, -0.24206559360027313, -0.22846254706382751, -0.2148595005273819, -0.20125645399093628, -0.18765342235565186, -0.17405036091804504, -0.16044732928276062, -0.1468442976474762, -0.13324125111103058, -0.11963820457458496, -0.10603515803813934, -0.09243211150169373, -0.0788290724158287, -0.06522602587938309, -0.05162297934293747, -0.038019925355911255, -0.024416878819465637, -0.010813834145665169, 0.0027892105281352997, 0.016392257064580917, 0.029995299875736237, 0.043598346412181854, 0.05720139294862747, 0.07080443948507309, 0.08440748602151871, 0.09801053255796432, 0.11161357164382935, 0.12521661818027496, 0.13881966471672058, 0.1524227112531662, 0.16602575778961182, 0.17962880432605743, 0.19323185086250305, 0.20683489739894867, 0.2204379439353943, 0.2340409904718399, 0.24764403700828552, 0.26124706864356995, 0.27485013008117676, 0.2884531617164612, 0.3020561933517456, 0.3156592547893524, 0.32926228642463684, 0.34286534786224365, 0.3564683794975281, 0.3700714409351349, 0.3836744725704193, 0.3972775340080261]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 4.0, 7.0, 7.0, 8.0, 13.0, 23.0, 34.0, 56.0, 99.0, 150.0, 211.0, 339.0, 467.0, 869.0, 1282.0, 2086.0, 3720.0, 6298.0, 11335.0, 21607.0, 42092.0, 84130.0, 162882.0, 250754.0, 214195.0, 119202.0, 59972.0, 30159.0, 15812.0, 8597.0, 4810.0, 2789.0, 1635.0, 1047.0, 685.0, 429.0, 239.0, 176.0, 115.0, 67.0, 56.0, 36.0, 22.0, 13.0, 10.0, 10.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.20263671875, -0.19604873657226562, -0.18946075439453125, -0.18287277221679688, -0.1762847900390625, -0.16969680786132812, -0.16310882568359375, -0.15652084350585938, -0.149932861328125, -0.14334487915039062, -0.13675689697265625, -0.13016891479492188, -0.1235809326171875, -0.11699295043945312, -0.11040496826171875, -0.10381698608398438, -0.09722900390625, -0.09064102172851562, -0.08405303955078125, -0.07746505737304688, -0.0708770751953125, -0.06428909301757812, -0.05770111083984375, -0.051113128662109375, -0.044525146484375, -0.037937164306640625, -0.03134918212890625, -0.024761199951171875, -0.0181732177734375, -0.011585235595703125, -0.00499725341796875, 0.001590728759765625, 0.0081787109375, 0.014766693115234375, 0.02135467529296875, 0.027942657470703125, 0.0345306396484375, 0.041118621826171875, 0.04770660400390625, 0.054294586181640625, 0.060882568359375, 0.06747055053710938, 0.07405853271484375, 0.08064651489257812, 0.0872344970703125, 0.09382247924804688, 0.10041046142578125, 0.10699844360351562, 0.11358642578125, 0.12017440795898438, 0.12676239013671875, 0.13335037231445312, 0.1399383544921875, 0.14652633666992188, 0.15311431884765625, 0.15970230102539062, 0.166290283203125, 0.17287826538085938, 0.17946624755859375, 0.18605422973632812, 0.1926422119140625, 0.19923019409179688, 0.20581817626953125, 0.21240615844726562, 0.218994140625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 7.0, 7.0, 4.0, 4.0, 14.0, 9.0, 14.0, 15.0, 18.0, 29.0, 41.0, 33.0, 37.0, 41.0, 57.0, 44.0, 49.0, 43.0, 56.0, 48.0, 48.0, 48.0, 45.0, 31.0, 35.0, 32.0, 40.0, 27.0, 30.0, 21.0, 18.0, 7.0, 4.0, 8.0, 5.0, 6.0, 7.0, 7.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12188720703125, -0.1180410385131836, -0.11419486999511719, -0.11034870147705078, -0.10650253295898438, -0.10265636444091797, -0.09881019592285156, -0.09496402740478516, -0.09111785888671875, -0.08727169036865234, -0.08342552185058594, -0.07957935333251953, -0.07573318481445312, -0.07188701629638672, -0.06804084777832031, -0.0641946792602539, -0.0603485107421875, -0.056502342224121094, -0.05265617370605469, -0.04881000518798828, -0.044963836669921875, -0.04111766815185547, -0.03727149963378906, -0.033425331115722656, -0.02957916259765625, -0.025732994079589844, -0.021886825561523438, -0.01804065704345703, -0.014194488525390625, -0.010348320007324219, -0.0065021514892578125, -0.0026559829711914062, 0.001190185546875, 0.005036354064941406, 0.008882522583007812, 0.012728691101074219, 0.016574859619140625, 0.02042102813720703, 0.024267196655273438, 0.028113365173339844, 0.03195953369140625, 0.035805702209472656, 0.03965187072753906, 0.04349803924560547, 0.047344207763671875, 0.05119037628173828, 0.05503654479980469, 0.058882713317871094, 0.0627288818359375, 0.0665750503540039, 0.07042121887207031, 0.07426738739013672, 0.07811355590820312, 0.08195972442626953, 0.08580589294433594, 0.08965206146240234, 0.09349822998046875, 0.09734439849853516, 0.10119056701660156, 0.10503673553466797, 0.10888290405273438, 0.11272907257080078, 0.11657524108886719, 0.1204214096069336, 0.124267578125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 8.0, 6.0, 13.0, 9.0, 18.0, 22.0, 36.0, 53.0, 72.0, 117.0, 165.0, 241.0, 329.0, 527.0, 831.0, 1693.0, 4286.0, 15527.0, 100438.0, 690515.0, 198036.0, 24938.0, 5857.0, 2125.0, 926.0, 586.0, 386.0, 237.0, 149.0, 134.0, 87.0, 57.0, 42.0, 28.0, 23.0, 18.0, 8.0, 8.0, 5.0, 3.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.546875, -0.5270919799804688, -0.5073089599609375, -0.48752593994140625, -0.467742919921875, -0.44795989990234375, -0.4281768798828125, -0.40839385986328125, -0.38861083984375, -0.36882781982421875, -0.3490447998046875, -0.32926177978515625, -0.309478759765625, -0.28969573974609375, -0.2699127197265625, -0.25012969970703125, -0.2303466796875, -0.21056365966796875, -0.1907806396484375, -0.17099761962890625, -0.151214599609375, -0.13143157958984375, -0.1116485595703125, -0.09186553955078125, -0.07208251953125, -0.05229949951171875, -0.0325164794921875, -0.01273345947265625, 0.007049560546875, 0.02683258056640625, 0.0466156005859375, 0.06639862060546875, 0.086181640625, 0.10596466064453125, 0.1257476806640625, 0.14553070068359375, 0.165313720703125, 0.18509674072265625, 0.2048797607421875, 0.22466278076171875, 0.24444580078125, 0.26422882080078125, 0.2840118408203125, 0.30379486083984375, 0.323577880859375, 0.34336090087890625, 0.3631439208984375, 0.38292694091796875, 0.4027099609375, 0.42249298095703125, 0.4422760009765625, 0.46205902099609375, 0.481842041015625, 0.5016250610351562, 0.5214080810546875, 0.5411911010742188, 0.56097412109375, 0.5807571411132812, 0.6005401611328125, 0.6203231811523438, 0.640106201171875, 0.6598892211914062, 0.6796722412109375, 0.6994552612304688, 0.71923828125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 2.0, 7.0, 7.0, 8.0, 12.0, 23.0, 26.0, 20.0, 27.0, 14.0, 28.0, 28.0, 23.0, 43.0, 42.0, 43.0, 53.0, 48.0, 55.0, 52.0, 51.0, 39.0, 43.0, 44.0, 37.0, 42.0, 29.0, 26.0, 29.0, 16.0, 14.0, 14.0, 11.0, 15.0, 7.0, 10.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.6923828125, -0.6723556518554688, -0.6523284912109375, -0.6323013305664062, -0.612274169921875, -0.5922470092773438, -0.5722198486328125, -0.5521926879882812, -0.53216552734375, -0.5121383666992188, -0.4921112060546875, -0.47208404541015625, -0.452056884765625, -0.43202972412109375, -0.4120025634765625, -0.39197540283203125, -0.3719482421875, -0.35192108154296875, -0.3318939208984375, -0.31186676025390625, -0.291839599609375, -0.27181243896484375, -0.2517852783203125, -0.23175811767578125, -0.21173095703125, -0.19170379638671875, -0.1716766357421875, -0.15164947509765625, -0.131622314453125, -0.11159515380859375, -0.0915679931640625, -0.07154083251953125, -0.051513671875, -0.03148651123046875, -0.0114593505859375, 0.00856781005859375, 0.028594970703125, 0.04862213134765625, 0.0686492919921875, 0.08867645263671875, 0.10870361328125, 0.12873077392578125, 0.1487579345703125, 0.16878509521484375, 0.188812255859375, 0.20883941650390625, 0.2288665771484375, 0.24889373779296875, 0.2689208984375, 0.28894805908203125, 0.3089752197265625, 0.32900238037109375, 0.349029541015625, 0.36905670166015625, 0.3890838623046875, 0.40911102294921875, 0.42913818359375, 0.44916534423828125, 0.4691925048828125, 0.48921966552734375, 0.509246826171875, 0.5292739868164062, 0.5493011474609375, 0.5693283081054688, 0.58935546875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 6.0, 14.0, 24.0, 66.0, 99.0, 274.0, 951.0, 5245.0, 114925.0, 883608.0, 39370.0, 2927.0, 673.0, 217.0, 89.0, 36.0, 19.0, 3.0, 4.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6708984375, -0.6519241333007812, -0.6329498291015625, -0.6139755249023438, -0.595001220703125, -0.5760269165039062, -0.5570526123046875, -0.5380783081054688, -0.51910400390625, -0.5001296997070312, -0.4811553955078125, -0.46218109130859375, -0.443206787109375, -0.42423248291015625, -0.4052581787109375, -0.38628387451171875, -0.3673095703125, -0.34833526611328125, -0.3293609619140625, -0.31038665771484375, -0.291412353515625, -0.27243804931640625, -0.2534637451171875, -0.23448944091796875, -0.21551513671875, -0.19654083251953125, -0.1775665283203125, -0.15859222412109375, -0.139617919921875, -0.12064361572265625, -0.1016693115234375, -0.08269500732421875, -0.063720703125, -0.04474639892578125, -0.0257720947265625, -0.00679779052734375, 0.012176513671875, 0.03115081787109375, 0.0501251220703125, 0.06909942626953125, 0.08807373046875, 0.10704803466796875, 0.1260223388671875, 0.14499664306640625, 0.163970947265625, 0.18294525146484375, 0.2019195556640625, 0.22089385986328125, 0.2398681640625, 0.25884246826171875, 0.2778167724609375, 0.29679107666015625, 0.315765380859375, 0.33473968505859375, 0.3537139892578125, 0.37268829345703125, 0.39166259765625, 0.41063690185546875, 0.4296112060546875, 0.44858551025390625, 0.467559814453125, 0.48653411865234375, 0.5055084228515625, 0.5244827270507812, 0.54345703125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 9.0, 3.0, 9.0, 8.0, 6.0, 11.0, 15.0, 14.0, 24.0, 29.0, 39.0, 34.0, 47.0, 60.0, 70.0, 77.0, 74.0, 85.0, 75.0, 66.0, 42.0, 38.0, 33.0, 26.0, 27.0, 15.0, 17.0, 15.0, 8.0, 6.0, 2.0, 5.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.368492126464844e-05, -8.074101060628891e-05, -7.779709994792938e-05, -7.485318928956985e-05, -7.190927863121033e-05, -6.89653679728508e-05, -6.602145731449127e-05, -6.307754665613174e-05, -6.013363599777222e-05, -5.718972533941269e-05, -5.424581468105316e-05, -5.1301904022693634e-05, -4.8357993364334106e-05, -4.541408270597458e-05, -4.247017204761505e-05, -3.9526261389255524e-05, -3.6582350730895996e-05, -3.363844007253647e-05, -3.069452941417694e-05, -2.7750618755817413e-05, -2.4806708097457886e-05, -2.1862797439098358e-05, -1.891888678073883e-05, -1.5974976122379303e-05, -1.3031065464019775e-05, -1.0087154805660248e-05, -7.14324414730072e-06, -4.199333488941193e-06, -1.255422830581665e-06, 1.6884878277778625e-06, 4.63239848613739e-06, 7.576309144496918e-06, 1.0520219802856445e-05, 1.3464130461215973e-05, 1.64080411195755e-05, 1.9351951777935028e-05, 2.2295862436294556e-05, 2.5239773094654083e-05, 2.818368375301361e-05, 3.112759441137314e-05, 3.4071505069732666e-05, 3.7015415728092194e-05, 3.995932638645172e-05, 4.290323704481125e-05, 4.5847147703170776e-05, 4.8791058361530304e-05, 5.173496901988983e-05, 5.467887967824936e-05, 5.762279033660889e-05, 6.0566700994968414e-05, 6.351061165332794e-05, 6.645452231168747e-05, 6.9398432970047e-05, 7.234234362840652e-05, 7.528625428676605e-05, 7.823016494512558e-05, 8.117407560348511e-05, 8.411798626184464e-05, 8.706189692020416e-05, 9.000580757856369e-05, 9.294971823692322e-05, 9.589362889528275e-05, 9.883753955364227e-05, 0.0001017814502120018, 0.00010472536087036133]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 8.0, 12.0, 17.0, 29.0, 54.0, 98.0, 200.0, 373.0, 937.0, 2930.0, 15088.0, 227098.0, 741336.0, 51420.0, 6142.0, 1648.0, 585.0, 260.0, 137.0, 64.0, 41.0, 25.0, 21.0, 12.0, 6.0, 7.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.458984375, -0.44518280029296875, -0.4313812255859375, -0.41757965087890625, -0.403778076171875, -0.38997650146484375, -0.3761749267578125, -0.36237335205078125, -0.34857177734375, -0.33477020263671875, -0.3209686279296875, -0.30716705322265625, -0.293365478515625, -0.27956390380859375, -0.2657623291015625, -0.25196075439453125, -0.2381591796875, -0.22435760498046875, -0.2105560302734375, -0.19675445556640625, -0.182952880859375, -0.16915130615234375, -0.1553497314453125, -0.14154815673828125, -0.12774658203125, -0.11394500732421875, -0.1001434326171875, -0.08634185791015625, -0.072540283203125, -0.05873870849609375, -0.0449371337890625, -0.03113555908203125, -0.017333984375, -0.00353240966796875, 0.0102691650390625, 0.02407073974609375, 0.037872314453125, 0.05167388916015625, 0.0654754638671875, 0.07927703857421875, 0.09307861328125, 0.10688018798828125, 0.1206817626953125, 0.13448333740234375, 0.148284912109375, 0.16208648681640625, 0.1758880615234375, 0.18968963623046875, 0.2034912109375, 0.21729278564453125, 0.2310943603515625, 0.24489593505859375, 0.258697509765625, 0.27249908447265625, 0.2863006591796875, 0.30010223388671875, 0.31390380859375, 0.32770538330078125, 0.3415069580078125, 0.35530853271484375, 0.369110107421875, 0.38291168212890625, 0.3967132568359375, 0.41051483154296875, 0.42431640625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 7.0, 8.0, 12.0, 17.0, 23.0, 14.0, 29.0, 36.0, 41.0, 52.0, 67.0, 72.0, 79.0, 82.0, 83.0, 70.0, 65.0, 54.0, 43.0, 46.0, 23.0, 18.0, 15.0, 9.0, 9.0, 6.0, 5.0, 3.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.210693359375, -0.20327377319335938, -0.19585418701171875, -0.18843460083007812, -0.1810150146484375, -0.17359542846679688, -0.16617584228515625, -0.15875625610351562, -0.151336669921875, -0.14391708374023438, -0.13649749755859375, -0.12907791137695312, -0.1216583251953125, -0.11423873901367188, -0.10681915283203125, -0.09939956665039062, -0.09197998046875, -0.08456039428710938, -0.07714080810546875, -0.06972122192382812, -0.0623016357421875, -0.054882049560546875, -0.04746246337890625, -0.040042877197265625, -0.032623291015625, -0.025203704833984375, -0.01778411865234375, -0.010364532470703125, -0.0029449462890625, 0.004474639892578125, 0.01189422607421875, 0.019313812255859375, 0.0267333984375, 0.034152984619140625, 0.04157257080078125, 0.048992156982421875, 0.0564117431640625, 0.06383132934570312, 0.07125091552734375, 0.07867050170898438, 0.086090087890625, 0.09350967407226562, 0.10092926025390625, 0.10834884643554688, 0.1157684326171875, 0.12318801879882812, 0.13060760498046875, 0.13802719116210938, 0.14544677734375, 0.15286636352539062, 0.16028594970703125, 0.16770553588867188, 0.1751251220703125, 0.18254470825195312, 0.18996429443359375, 0.19738388061523438, 0.204803466796875, 0.21222305297851562, 0.21964263916015625, 0.22706222534179688, 0.2344818115234375, 0.24190139770507812, 0.24932098388671875, 0.2567405700683594, 0.26416015625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 5.0, 7.0, 11.0, 16.0, 34.0, 60.0, 99.0, 125.0, 158.0, 150.0, 149.0, 81.0, 53.0, 33.0, 13.0, 9.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.906912803649902, -5.738889217376709, -5.570865631103516, -5.402842044830322, -5.234818458557129, -5.0667948722839355, -4.898771286010742, -4.730747222900391, -4.5627241134643555, -4.394700527191162, -4.226676940917969, -4.058653354644775, -3.890629768371582, -3.7226061820983887, -3.554582357406616, -3.386558771133423, -3.2185349464416504, -3.050511360168457, -2.8824877738952637, -2.7144641876220703, -2.546440601348877, -2.3784170150756836, -2.210393190383911, -2.0423696041107178, -1.8743460178375244, -1.706322431564331, -1.5382988452911377, -1.3702751398086548, -1.2022515535354614, -1.034227967262268, -0.8662042617797852, -0.6981806755065918, -0.5301575660705566, -0.3621339499950409, -0.19411033391952515, -0.02608668804168701, 0.14193689823150635, 0.3099604845046997, 0.4779841899871826, 0.646007776260376, 0.8140313625335693, 0.9820549488067627, 1.150078535079956, 1.318102240562439, 1.4861258268356323, 1.6541494131088257, 1.8221731185913086, 1.990196704864502, 2.1582202911376953, 2.3262438774108887, 2.494267463684082, 2.6622910499572754, 2.8303146362304688, 2.998338222503662, 3.1663620471954346, 3.334385633468628, 3.5024092197418213, 3.6704328060150146, 3.838456392288208, 4.0064802169799805, 4.174503803253174, 4.342527389526367, 4.5105509757995605, 4.678574562072754, 4.846598148345947]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 7.0, 5.0, 3.0, 8.0, 7.0, 10.0, 12.0, 11.0, 16.0, 30.0, 28.0, 32.0, 35.0, 35.0, 42.0, 46.0, 59.0, 41.0, 65.0, 48.0, 61.0, 58.0, 47.0, 47.0, 36.0, 35.0, 21.0, 26.0, 21.0, 20.0, 19.0, 13.0, 8.0, 15.0, 5.0, 6.0, 5.0, 8.0, 2.0, 4.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.246680974960327, -3.1521010398864746, -3.057521104812622, -2.9629411697387695, -2.868361234664917, -2.7737812995910645, -2.679201602935791, -2.5846214294433594, -2.490041732788086, -2.3954617977142334, -2.300881862640381, -2.2063019275665283, -2.111721992492676, -2.0171420574188232, -1.9225622415542603, -1.8279823064804077, -1.7334022521972656, -1.638822317123413, -1.5442423820495605, -1.449662446975708, -1.3550825119018555, -1.260502576828003, -1.16592276096344, -1.0713428258895874, -0.9767628908157349, -0.8821829557418823, -0.7876030206680298, -0.693023145198822, -0.5984432101249695, -0.5038632750511169, -0.4092833995819092, -0.31470346450805664, -0.2201237678527832, -0.12554384768009186, -0.030963927507400513, 0.06361597776412964, 0.15819591283798218, 0.2527758479118347, 0.3473557233810425, 0.441935658454895, 0.5365155935287476, 0.6310955286026001, 0.7256754636764526, 0.8202553391456604, 0.9148352742195129, 1.0094151496887207, 1.1039950847625732, 1.1985750198364258, 1.2931549549102783, 1.3877348899841309, 1.4823148250579834, 1.576894760131836, 1.6714746952056885, 1.766054630279541, 1.860634446144104, 1.9552143812179565, 2.0497941970825195, 2.144374132156372, 2.2389540672302246, 2.333534002304077, 2.4281139373779297, 2.5226938724517822, 2.6172738075256348, 2.711853504180908, 2.80643367767334]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 6.0, 3.0, 8.0, 19.0, 35.0, 46.0, 62.0, 79.0, 124.0, 185.0, 303.0, 485.0, 806.0, 1373.0, 2780.0, 7031.0, 32991.0, 4058465.0, 71747.0, 10043.0, 3473.0, 1650.0, 931.0, 588.0, 373.0, 240.0, 137.0, 89.0, 72.0, 44.0, 46.0, 21.0, 9.0, 4.0, 6.0, 5.0, 5.0, 4.0, 3.0, 3.0], "bins": [-0.857421875, -0.8368339538574219, -0.8162460327148438, -0.7956581115722656, -0.7750701904296875, -0.7544822692871094, -0.7338943481445312, -0.7133064270019531, -0.692718505859375, -0.6721305847167969, -0.6515426635742188, -0.6309547424316406, -0.6103668212890625, -0.5897789001464844, -0.5691909790039062, -0.5486030578613281, -0.52801513671875, -0.5074272155761719, -0.48683929443359375, -0.4662513732910156, -0.4456634521484375, -0.4250755310058594, -0.40448760986328125, -0.3838996887207031, -0.363311767578125, -0.3427238464355469, -0.32213592529296875, -0.3015480041503906, -0.2809600830078125, -0.2603721618652344, -0.23978424072265625, -0.21919631958007812, -0.1986083984375, -0.17802047729492188, -0.15743255615234375, -0.13684463500976562, -0.1162567138671875, -0.09566879272460938, -0.07508087158203125, -0.054492950439453125, -0.033905029296875, -0.013317108154296875, 0.00727081298828125, 0.027858734130859375, 0.0484466552734375, 0.06903457641601562, 0.08962249755859375, 0.11021041870117188, 0.13079833984375, 0.15138626098632812, 0.17197418212890625, 0.19256210327148438, 0.2131500244140625, 0.23373794555664062, 0.25432586669921875, 0.2749137878417969, 0.295501708984375, 0.3160896301269531, 0.33667755126953125, 0.3572654724121094, 0.3778533935546875, 0.3984413146972656, 0.41902923583984375, 0.4396171569824219, 0.460205078125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 4.0, 2.0, 2.0, 0.0, 3.0, 6.0, 13.0, 6.0, 6.0, 11.0, 17.0, 21.0, 23.0, 25.0, 30.0, 35.0, 43.0, 61.0, 53.0, 54.0, 64.0, 65.0, 61.0, 52.0, 51.0, 56.0, 45.0, 33.0, 26.0, 32.0, 15.0, 15.0, 17.0, 17.0, 9.0, 5.0, 8.0, 7.0, 1.0, 5.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.147216796875, -0.14267539978027344, -0.13813400268554688, -0.1335926055908203, -0.12905120849609375, -0.12450981140136719, -0.11996841430664062, -0.11542701721191406, -0.1108856201171875, -0.10634422302246094, -0.10180282592773438, -0.09726142883300781, -0.09272003173828125, -0.08817863464355469, -0.08363723754882812, -0.07909584045410156, -0.074554443359375, -0.07001304626464844, -0.06547164916992188, -0.06093025207519531, -0.05638885498046875, -0.05184745788574219, -0.047306060791015625, -0.04276466369628906, -0.0382232666015625, -0.03368186950683594, -0.029140472412109375, -0.024599075317382812, -0.02005767822265625, -0.015516281127929688, -0.010974884033203125, -0.0064334869384765625, -0.00189208984375, 0.0026493072509765625, 0.007190704345703125, 0.011732101440429688, 0.01627349853515625, 0.020814895629882812, 0.025356292724609375, 0.029897689819335938, 0.0344390869140625, 0.03898048400878906, 0.043521881103515625, 0.04806327819824219, 0.05260467529296875, 0.05714607238769531, 0.061687469482421875, 0.06622886657714844, 0.070770263671875, 0.07531166076660156, 0.07985305786132812, 0.08439445495605469, 0.08893585205078125, 0.09347724914550781, 0.09801864624023438, 0.10256004333496094, 0.1071014404296875, 0.11164283752441406, 0.11618423461914062, 0.12072563171386719, 0.12526702880859375, 0.1298084259033203, 0.13434982299804688, 0.13889122009277344, 0.1434326171875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 3.0, 5.0, 4.0, 7.0, 8.0, 7.0, 6.0, 14.0, 13.0, 25.0, 20.0, 31.0, 35.0, 43.0, 65.0, 98.0, 149.0, 263.0, 526.0, 1707.0, 32700.0, 4152104.0, 4682.0, 787.0, 367.0, 168.0, 108.0, 75.0, 53.0, 46.0, 25.0, 27.0, 25.0, 19.0, 7.0, 14.0, 11.0, 5.0, 8.0, 6.0, 5.0, 5.0, 2.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.740234375, -2.643157958984375, -2.54608154296875, -2.449005126953125, -2.3519287109375, -2.254852294921875, -2.15777587890625, -2.060699462890625, -1.963623046875, -1.866546630859375, -1.76947021484375, -1.672393798828125, -1.5753173828125, -1.478240966796875, -1.38116455078125, -1.284088134765625, -1.18701171875, -1.089935302734375, -0.99285888671875, -0.895782470703125, -0.7987060546875, -0.701629638671875, -0.60455322265625, -0.507476806640625, -0.410400390625, -0.313323974609375, -0.21624755859375, -0.119171142578125, -0.0220947265625, 0.074981689453125, 0.17205810546875, 0.269134521484375, 0.3662109375, 0.463287353515625, 0.56036376953125, 0.657440185546875, 0.7545166015625, 0.851593017578125, 0.94866943359375, 1.045745849609375, 1.142822265625, 1.239898681640625, 1.33697509765625, 1.434051513671875, 1.5311279296875, 1.628204345703125, 1.72528076171875, 1.822357177734375, 1.91943359375, 2.016510009765625, 2.11358642578125, 2.210662841796875, 2.3077392578125, 2.404815673828125, 2.50189208984375, 2.598968505859375, 2.696044921875, 2.793121337890625, 2.89019775390625, 2.987274169921875, 3.0843505859375, 3.181427001953125, 3.27850341796875, 3.375579833984375, 3.47265625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 14.0, 37.0, 3715.0, 269.0, 25.0, 13.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.319580078125, -0.3005714416503906, -0.28156280517578125, -0.2625541687011719, -0.2435455322265625, -0.22453689575195312, -0.20552825927734375, -0.18651962280273438, -0.167510986328125, -0.14850234985351562, -0.12949371337890625, -0.11048507690429688, -0.0914764404296875, -0.07246780395507812, -0.05345916748046875, -0.034450531005859375, -0.01544189453125, 0.003566741943359375, 0.02257537841796875, 0.041584014892578125, 0.0605926513671875, 0.07960128784179688, 0.09860992431640625, 0.11761856079101562, 0.136627197265625, 0.15563583374023438, 0.17464447021484375, 0.19365310668945312, 0.2126617431640625, 0.23167037963867188, 0.25067901611328125, 0.2696876525878906, 0.2886962890625, 0.3077049255371094, 0.32671356201171875, 0.3457221984863281, 0.3647308349609375, 0.3837394714355469, 0.40274810791015625, 0.4217567443847656, 0.440765380859375, 0.4597740173339844, 0.47878265380859375, 0.4977912902832031, 0.5167999267578125, 0.5358085632324219, 0.5548171997070312, 0.5738258361816406, 0.59283447265625, 0.6118431091308594, 0.6308517456054688, 0.6498603820800781, 0.6688690185546875, 0.6878776550292969, 0.7068862915039062, 0.7258949279785156, 0.744903564453125, 0.7639122009277344, 0.7829208374023438, 0.8019294738769531, 0.8209381103515625, 0.8399467468261719, 0.8589553833007812, 0.8779640197753906, 0.89697265625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 1.0, 1.0, 8.0, 8.0, 6.0, 6.0, 21.0, 20.0, 27.0, 38.0, 60.0, 80.0, 85.0, 114.0, 106.0, 114.0, 72.0, 50.0, 42.0, 26.0, 26.0, 28.0, 14.0, 9.0, 8.0, 5.0, 5.0, 6.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9515249729156494, -0.9232561588287354, -0.8949872851371765, -0.8667184710502625, -0.8384495973587036, -0.8101807832717896, -0.7819119691848755, -0.7536431550979614, -0.7253742814064026, -0.6971054673194885, -0.6688365936279297, -0.6405677795410156, -0.6122989654541016, -0.5840300917625427, -0.5557612776756287, -0.5274924039840698, -0.49922358989715576, -0.4709547460079193, -0.44268590211868286, -0.4144170880317688, -0.38614824414253235, -0.3578794002532959, -0.32961058616638184, -0.3013417422771454, -0.27307289838790894, -0.24480405449867249, -0.21653522551059723, -0.18826639652252197, -0.15999755263328552, -0.13172870874404907, -0.10345987975597382, -0.07519105076789856, -0.046922266483306885, -0.01865343004465103, 0.009615406394004822, 0.037884242832660675, 0.06615307927131653, 0.09442192316055298, 0.12269075214862823, 0.1509595811367035, 0.17922842502593994, 0.2074972689151764, 0.23576609790325165, 0.2640349268913269, 0.29230377078056335, 0.3205726146697998, 0.34884142875671387, 0.3771102726459503, 0.40537911653518677, 0.4336479604244232, 0.46191680431365967, 0.49018561840057373, 0.5184544324874878, 0.5467233061790466, 0.5749921202659607, 0.6032609939575195, 0.6315298080444336, 0.6597986221313477, 0.6880674958229065, 0.7163363099098206, 0.7446051836013794, 0.7728739976882935, 0.8011428117752075, 0.8294116258621216, 0.8576804995536804]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 2.0, 9.0, 8.0, 4.0, 8.0, 12.0, 11.0, 13.0, 15.0, 20.0, 13.0, 24.0, 16.0, 28.0, 25.0, 33.0, 40.0, 37.0, 40.0, 37.0, 46.0, 46.0, 50.0, 47.0, 38.0, 49.0, 43.0, 31.0, 29.0, 16.0, 30.0, 28.0, 31.0, 12.0, 27.0, 10.0, 14.0, 14.0, 11.0, 7.0, 7.0, 6.0, 4.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5644198060035706, -0.5468206405639648, -0.5292214751243591, -0.5116223096847534, -0.4940231442451477, -0.476423978805542, -0.4588248133659363, -0.44122564792633057, -0.42362648248672485, -0.40602731704711914, -0.3884281516075134, -0.3708289861679077, -0.353229820728302, -0.3356306552886963, -0.3180314898490906, -0.30043232440948486, -0.28283315896987915, -0.26523399353027344, -0.24763482809066772, -0.230035662651062, -0.2124364972114563, -0.19483733177185059, -0.17723816633224487, -0.15963900089263916, -0.14203983545303345, -0.12444067001342773, -0.10684150457382202, -0.08924233913421631, -0.0716431736946106, -0.05404400825500488, -0.03644484281539917, -0.018845677375793457, -0.0012464523315429688, 0.016352713108062744, 0.03395187854766846, 0.05155104398727417, 0.06915020942687988, 0.0867493748664856, 0.10434854030609131, 0.12194770574569702, 0.13954687118530273, 0.15714603662490845, 0.17474520206451416, 0.19234436750411987, 0.20994353294372559, 0.2275426983833313, 0.245141863822937, 0.2627410292625427, 0.28034019470214844, 0.29793936014175415, 0.31553852558135986, 0.3331376910209656, 0.3507368564605713, 0.368336021900177, 0.3859351873397827, 0.4035343527793884, 0.42113351821899414, 0.43873268365859985, 0.45633184909820557, 0.4739310145378113, 0.491530179977417, 0.5091293454170227, 0.5267285108566284, 0.5443276762962341, 0.5619268417358398]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 1.0, 1.0, 4.0, 7.0, 6.0, 27.0, 21.0, 26.0, 50.0, 50.0, 94.0, 123.0, 260.0, 371.0, 682.0, 1193.0, 2233.0, 4424.0, 9911.0, 24898.0, 74516.0, 278821.0, 451732.0, 131092.0, 40210.0, 14787.0, 6328.0, 2949.0, 1569.0, 862.0, 481.0, 297.0, 151.0, 120.0, 81.0, 55.0, 43.0, 27.0, 18.0, 13.0, 8.0, 5.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43310546875, -0.4192352294921875, -0.405364990234375, -0.3914947509765625, -0.37762451171875, -0.3637542724609375, -0.349884033203125, -0.3360137939453125, -0.3221435546875, -0.3082733154296875, -0.294403076171875, -0.2805328369140625, -0.26666259765625, -0.2527923583984375, -0.238922119140625, -0.2250518798828125, -0.211181640625, -0.1973114013671875, -0.183441162109375, -0.1695709228515625, -0.15570068359375, -0.1418304443359375, -0.127960205078125, -0.1140899658203125, -0.1002197265625, -0.0863494873046875, -0.072479248046875, -0.0586090087890625, -0.04473876953125, -0.0308685302734375, -0.016998291015625, -0.0031280517578125, 0.0107421875, 0.0246124267578125, 0.038482666015625, 0.0523529052734375, 0.06622314453125, 0.0800933837890625, 0.093963623046875, 0.1078338623046875, 0.1217041015625, 0.1355743408203125, 0.149444580078125, 0.1633148193359375, 0.17718505859375, 0.1910552978515625, 0.204925537109375, 0.2187957763671875, 0.232666015625, 0.2465362548828125, 0.260406494140625, 0.2742767333984375, 0.28814697265625, 0.3020172119140625, 0.315887451171875, 0.3297576904296875, 0.3436279296875, 0.3574981689453125, 0.371368408203125, 0.3852386474609375, 0.39910888671875, 0.4129791259765625, 0.426849365234375, 0.4407196044921875, 0.45458984375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 4.0, 4.0, 8.0, 4.0, 13.0, 11.0, 13.0, 7.0, 22.0, 26.0, 24.0, 38.0, 23.0, 47.0, 32.0, 46.0, 39.0, 46.0, 72.0, 58.0, 48.0, 56.0, 48.0, 48.0, 41.0, 32.0, 31.0, 31.0, 30.0, 17.0, 13.0, 7.0, 15.0, 11.0, 8.0, 7.0, 6.0, 4.0, 6.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1724853515625, -0.1671142578125, -0.1617431640625, -0.1563720703125, -0.1510009765625, -0.1456298828125, -0.1402587890625, -0.1348876953125, -0.1295166015625, -0.1241455078125, -0.1187744140625, -0.1134033203125, -0.1080322265625, -0.1026611328125, -0.0972900390625, -0.0919189453125, -0.0865478515625, -0.0811767578125, -0.0758056640625, -0.0704345703125, -0.0650634765625, -0.0596923828125, -0.0543212890625, -0.0489501953125, -0.0435791015625, -0.0382080078125, -0.0328369140625, -0.0274658203125, -0.0220947265625, -0.0167236328125, -0.0113525390625, -0.0059814453125, -0.0006103515625, 0.0047607421875, 0.0101318359375, 0.0155029296875, 0.0208740234375, 0.0262451171875, 0.0316162109375, 0.0369873046875, 0.0423583984375, 0.0477294921875, 0.0531005859375, 0.0584716796875, 0.0638427734375, 0.0692138671875, 0.0745849609375, 0.0799560546875, 0.0853271484375, 0.0906982421875, 0.0960693359375, 0.1014404296875, 0.1068115234375, 0.1121826171875, 0.1175537109375, 0.1229248046875, 0.1282958984375, 0.1336669921875, 0.1390380859375, 0.1444091796875, 0.1497802734375, 0.1551513671875, 0.1605224609375, 0.1658935546875, 0.1712646484375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 4.0, 3.0, 7.0, 6.0, 23.0, 28.0, 33.0, 40.0, 62.0, 113.0, 171.0, 288.0, 468.0, 880.0, 2086.0, 6990.0, 42682.0, 735849.0, 232770.0, 18701.0, 4122.0, 1422.0, 711.0, 364.0, 247.0, 152.0, 116.0, 84.0, 47.0, 33.0, 19.0, 9.0, 13.0, 6.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.033203125, -1.005126953125, -0.97705078125, -0.948974609375, -0.9208984375, -0.892822265625, -0.86474609375, -0.836669921875, -0.80859375, -0.780517578125, -0.75244140625, -0.724365234375, -0.6962890625, -0.668212890625, -0.64013671875, -0.612060546875, -0.583984375, -0.555908203125, -0.52783203125, -0.499755859375, -0.4716796875, -0.443603515625, -0.41552734375, -0.387451171875, -0.359375, -0.331298828125, -0.30322265625, -0.275146484375, -0.2470703125, -0.218994140625, -0.19091796875, -0.162841796875, -0.134765625, -0.106689453125, -0.07861328125, -0.050537109375, -0.0224609375, 0.005615234375, 0.03369140625, 0.061767578125, 0.08984375, 0.117919921875, 0.14599609375, 0.174072265625, 0.2021484375, 0.230224609375, 0.25830078125, 0.286376953125, 0.314453125, 0.342529296875, 0.37060546875, 0.398681640625, 0.4267578125, 0.454833984375, 0.48291015625, 0.510986328125, 0.5390625, 0.567138671875, 0.59521484375, 0.623291015625, 0.6513671875, 0.679443359375, 0.70751953125, 0.735595703125, 0.763671875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 10.0, 7.0, 9.0, 19.0, 27.0, 25.0, 35.0, 35.0, 37.0, 48.0, 50.0, 58.0, 59.0, 55.0, 75.0, 74.0, 62.0, 44.0, 61.0, 42.0, 37.0, 32.0, 23.0, 27.0, 19.0, 15.0, 10.0, 7.0, 1.0, 3.0, 4.0, 0.0, 1.0, 2.0], "bins": [-1.4423828125, -1.4093856811523438, -1.3763885498046875, -1.3433914184570312, -1.310394287109375, -1.2773971557617188, -1.2444000244140625, -1.2114028930664062, -1.17840576171875, -1.1454086303710938, -1.1124114990234375, -1.0794143676757812, -1.046417236328125, -1.0134201049804688, -0.9804229736328125, -0.9474258422851562, -0.9144287109375, -0.8814315795898438, -0.8484344482421875, -0.8154373168945312, -0.782440185546875, -0.7494430541992188, -0.7164459228515625, -0.6834487915039062, -0.65045166015625, -0.6174545288085938, -0.5844573974609375, -0.5514602661132812, -0.518463134765625, -0.48546600341796875, -0.4524688720703125, -0.41947174072265625, -0.386474609375, -0.35347747802734375, -0.3204803466796875, -0.28748321533203125, -0.254486083984375, -0.22148895263671875, -0.1884918212890625, -0.15549468994140625, -0.12249755859375, -0.08950042724609375, -0.0565032958984375, -0.02350616455078125, 0.009490966796875, 0.04248809814453125, 0.0754852294921875, 0.10848236083984375, 0.1414794921875, 0.17447662353515625, 0.2074737548828125, 0.24047088623046875, 0.273468017578125, 0.30646514892578125, 0.3394622802734375, 0.37245941162109375, 0.40545654296875, 0.43845367431640625, 0.4714508056640625, 0.5044479370117188, 0.537445068359375, 0.5704421997070312, 0.6034393310546875, 0.6364364624023438, 0.66943359375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 4.0, 7.0, 5.0, 5.0, 12.0, 25.0, 33.0, 54.0, 79.0, 182.0, 305.0, 739.0, 1913.0, 8797.0, 106127.0, 854399.0, 66019.0, 6945.0, 1646.0, 600.0, 281.0, 146.0, 76.0, 58.0, 33.0, 17.0, 9.0, 10.0, 9.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51318359375, -0.4982757568359375, -0.483367919921875, -0.4684600830078125, -0.45355224609375, -0.4386444091796875, -0.423736572265625, -0.4088287353515625, -0.3939208984375, -0.3790130615234375, -0.364105224609375, -0.3491973876953125, -0.33428955078125, -0.3193817138671875, -0.304473876953125, -0.2895660400390625, -0.274658203125, -0.2597503662109375, -0.244842529296875, -0.2299346923828125, -0.21502685546875, -0.2001190185546875, -0.185211181640625, -0.1703033447265625, -0.1553955078125, -0.1404876708984375, -0.125579833984375, -0.1106719970703125, -0.09576416015625, -0.0808563232421875, -0.065948486328125, -0.0510406494140625, -0.0361328125, -0.0212249755859375, -0.006317138671875, 0.0085906982421875, 0.02349853515625, 0.0384063720703125, 0.053314208984375, 0.0682220458984375, 0.0831298828125, 0.0980377197265625, 0.112945556640625, 0.1278533935546875, 0.14276123046875, 0.1576690673828125, 0.172576904296875, 0.1874847412109375, 0.202392578125, 0.2173004150390625, 0.232208251953125, 0.2471160888671875, 0.26202392578125, 0.2769317626953125, 0.291839599609375, 0.3067474365234375, 0.3216552734375, 0.3365631103515625, 0.351470947265625, 0.3663787841796875, 0.38128662109375, 0.3961944580078125, 0.411102294921875, 0.4260101318359375, 0.44091796875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 2.0, 7.0, 4.0, 15.0, 7.0, 17.0, 23.0, 29.0, 44.0, 56.0, 107.0, 141.0, 169.0, 137.0, 71.0, 41.0, 38.0, 28.0, 14.0, 15.0, 7.0, 12.0, 8.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.00020134449005126953, -0.0001969076693058014, -0.00019247084856033325, -0.0001880340278148651, -0.00018359720706939697, -0.00017916038632392883, -0.0001747235655784607, -0.00017028674483299255, -0.00016584992408752441, -0.00016141310334205627, -0.00015697628259658813, -0.00015253946185112, -0.00014810264110565186, -0.00014366582036018372, -0.00013922899961471558, -0.00013479217886924744, -0.0001303553581237793, -0.00012591853737831116, -0.00012148171663284302, -0.00011704489588737488, -0.00011260807514190674, -0.0001081712543964386, -0.00010373443365097046, -9.929761290550232e-05, -9.486079216003418e-05, -9.042397141456604e-05, -8.59871506690979e-05, -8.155032992362976e-05, -7.711350917816162e-05, -7.267668843269348e-05, -6.823986768722534e-05, -6.38030469417572e-05, -5.936622619628906e-05, -5.492940545082092e-05, -5.049258470535278e-05, -4.6055763959884644e-05, -4.1618943214416504e-05, -3.7182122468948364e-05, -3.2745301723480225e-05, -2.8308480978012085e-05, -2.3871660232543945e-05, -1.9434839487075806e-05, -1.4998018741607666e-05, -1.0561197996139526e-05, -6.124377250671387e-06, -1.687556505203247e-06, 2.7492642402648926e-06, 7.186084985733032e-06, 1.1622905731201172e-05, 1.605972647666931e-05, 2.049654722213745e-05, 2.493336796760559e-05, 2.937018871307373e-05, 3.380700945854187e-05, 3.824383020401001e-05, 4.268065094947815e-05, 4.711747169494629e-05, 5.155429244041443e-05, 5.599111318588257e-05, 6.042793393135071e-05, 6.486475467681885e-05, 6.930157542228699e-05, 7.373839616775513e-05, 7.817521691322327e-05, 8.26120376586914e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 9.0, 18.0, 17.0, 30.0, 52.0, 116.0, 189.0, 427.0, 1009.0, 3782.0, 37930.0, 900718.0, 96001.0, 5864.0, 1436.0, 489.0, 212.0, 101.0, 64.0, 29.0, 15.0, 13.0, 12.0, 6.0, 3.0, 2.0, 6.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5986328125, -0.5797042846679688, -0.5607757568359375, -0.5418472290039062, -0.522918701171875, -0.5039901733398438, -0.4850616455078125, -0.46613311767578125, -0.44720458984375, -0.42827606201171875, -0.4093475341796875, -0.39041900634765625, -0.371490478515625, -0.35256195068359375, -0.3336334228515625, -0.31470489501953125, -0.2957763671875, -0.27684783935546875, -0.2579193115234375, -0.23899078369140625, -0.220062255859375, -0.20113372802734375, -0.1822052001953125, -0.16327667236328125, -0.14434814453125, -0.12541961669921875, -0.1064910888671875, -0.08756256103515625, -0.068634033203125, -0.04970550537109375, -0.0307769775390625, -0.01184844970703125, 0.007080078125, 0.02600860595703125, 0.0449371337890625, 0.06386566162109375, 0.082794189453125, 0.10172271728515625, 0.1206512451171875, 0.13957977294921875, 0.15850830078125, 0.17743682861328125, 0.1963653564453125, 0.21529388427734375, 0.234222412109375, 0.25315093994140625, 0.2720794677734375, 0.29100799560546875, 0.3099365234375, 0.32886505126953125, 0.3477935791015625, 0.36672210693359375, 0.385650634765625, 0.40457916259765625, 0.4235076904296875, 0.44243621826171875, 0.46136474609375, 0.48029327392578125, 0.4992218017578125, 0.5181503295898438, 0.537078857421875, 0.5560073852539062, 0.5749359130859375, 0.5938644409179688, 0.61279296875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 3.0, 15.0, 22.0, 36.0, 62.0, 99.0, 152.0, 171.0, 162.0, 110.0, 73.0, 42.0, 21.0, 15.0, 10.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.278076171875, -0.2630577087402344, -0.24803924560546875, -0.23302078247070312, -0.2180023193359375, -0.20298385620117188, -0.18796539306640625, -0.17294692993164062, -0.157928466796875, -0.14291000366210938, -0.12789154052734375, -0.11287307739257812, -0.0978546142578125, -0.08283615112304688, -0.06781768798828125, -0.052799224853515625, -0.03778076171875, -0.022762298583984375, -0.00774383544921875, 0.007274627685546875, 0.0222930908203125, 0.037311553955078125, 0.05233001708984375, 0.06734848022460938, 0.082366943359375, 0.09738540649414062, 0.11240386962890625, 0.12742233276367188, 0.1424407958984375, 0.15745925903320312, 0.17247772216796875, 0.18749618530273438, 0.2025146484375, 0.21753311157226562, 0.23255157470703125, 0.24757003784179688, 0.2625885009765625, 0.2776069641113281, 0.29262542724609375, 0.3076438903808594, 0.322662353515625, 0.3376808166503906, 0.35269927978515625, 0.3677177429199219, 0.3827362060546875, 0.3977546691894531, 0.41277313232421875, 0.4277915954589844, 0.44281005859375, 0.4578285217285156, 0.47284698486328125, 0.4878654479980469, 0.5028839111328125, 0.5179023742675781, 0.5329208374023438, 0.5479393005371094, 0.562957763671875, 0.5779762268066406, 0.5929946899414062, 0.6080131530761719, 0.6230316162109375, 0.6380500793457031, 0.6530685424804688, 0.6680870056152344, 0.68310546875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 12.0, 22.0, 63.0, 127.0, 194.0, 219.0, 179.0, 103.0, 50.0, 18.0, 10.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.10800838470459, -5.833505630493164, -5.5590033531188965, -5.284501075744629, -5.009998321533203, -4.735495567321777, -4.46099328994751, -4.186491012573242, -3.9119882583618164, -3.6374857425689697, -3.362983226776123, -3.0884807109832764, -2.8139781951904297, -2.539475679397583, -2.2649731636047363, -1.9904706478118896, -1.715968132019043, -1.4414656162261963, -1.1669631004333496, -0.8924605846405029, -0.6179580688476562, -0.34345555305480957, -0.06895303726196289, 0.2055494785308838, 0.48005199432373047, 0.7545545101165771, 1.0290570259094238, 1.3035595417022705, 1.5780620574951172, 1.8525645732879639, 2.1270670890808105, 2.4015696048736572, 2.676072120666504, 2.9505746364593506, 3.2250771522521973, 3.499579668045044, 3.7740821838378906, 4.048584938049316, 4.323087215423584, 4.597589492797852, 4.872092247009277, 5.146595001220703, 5.421097278594971, 5.695599555969238, 5.970102310180664, 6.24460506439209, 6.519107341766357, 6.793609619140625, 7.068112373352051, 7.342615127563477, 7.617117404937744, 7.891619682312012, 8.166122436523438, 8.440625190734863, 8.715127944946289, 8.989629745483398, 9.264132499694824, 9.53863525390625, 9.81313705444336, 10.087639808654785, 10.362142562866211, 10.636645317077637, 10.911148071289062, 11.185649871826172, 11.460152626037598]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 3.0, 5.0, 11.0, 10.0, 8.0, 11.0, 22.0, 21.0, 30.0, 29.0, 41.0, 45.0, 61.0, 57.0, 63.0, 73.0, 70.0, 77.0, 56.0, 49.0, 45.0, 37.0, 62.0, 26.0, 14.0, 11.0, 16.0, 17.0, 11.0, 11.0, 2.0, 2.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.002743721008301, -4.852298736572266, -4.701854228973389, -4.5514092445373535, -4.400964736938477, -4.250519752502441, -4.1000752449035645, -3.9496302604675293, -3.7991855144500732, -3.648740768432617, -3.498296022415161, -3.347851276397705, -3.19740629196167, -3.046961784362793, -2.896516799926758, -2.7460720539093018, -2.5956273078918457, -2.4451825618743896, -2.2947378158569336, -2.1442930698394775, -1.993848204612732, -1.8434034585952759, -1.6929585933685303, -1.5425138473510742, -1.3920691013336182, -1.241624355316162, -1.091179609298706, -0.9407347440719604, -0.7902899980545044, -0.6398452520370483, -0.4894004464149475, -0.3389556407928467, -0.18851089477539062, -0.03806611895561218, 0.11237865686416626, 0.2628234326839447, 0.41326820850372314, 0.5637129545211792, 0.71415776014328, 0.8646025657653809, 1.015047311782837, 1.165492057800293, 1.315936803817749, 1.4663816690444946, 1.6168264150619507, 1.7672711610794067, 1.9177160263061523, 2.0681607723236084, 2.2186055183410645, 2.3690502643585205, 2.5194950103759766, 2.6699397563934326, 2.8203845024108887, 2.970829486846924, 3.12127423286438, 3.271718978881836, 3.422163724899292, 3.572608470916748, 3.723053216934204, 3.87349796295166, 4.023942947387695, 4.174387454986572, 4.324832439422607, 4.475276947021484, 4.6257219314575195]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 8.0, 3.0, 6.0, 4.0, 7.0, 4.0, 13.0, 15.0, 22.0, 26.0, 33.0, 42.0, 63.0, 109.0, 120.0, 200.0, 307.0, 452.0, 770.0, 1251.0, 2546.0, 7035.0, 33433.0, 3916258.0, 206254.0, 15849.0, 4525.0, 1986.0, 1035.0, 614.0, 439.0, 265.0, 175.0, 104.0, 98.0, 46.0, 44.0, 22.0, 27.0, 19.0, 16.0, 9.0, 9.0, 17.0, 2.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.85791015625, -0.8325271606445312, -0.8071441650390625, -0.7817611694335938, -0.756378173828125, -0.7309951782226562, -0.7056121826171875, -0.6802291870117188, -0.65484619140625, -0.6294631958007812, -0.6040802001953125, -0.5786972045898438, -0.553314208984375, -0.5279312133789062, -0.5025482177734375, -0.47716522216796875, -0.4517822265625, -0.42639923095703125, -0.4010162353515625, -0.37563323974609375, -0.350250244140625, -0.32486724853515625, -0.2994842529296875, -0.27410125732421875, -0.24871826171875, -0.22333526611328125, -0.1979522705078125, -0.17256927490234375, -0.147186279296875, -0.12180328369140625, -0.0964202880859375, -0.07103729248046875, -0.045654296875, -0.02027130126953125, 0.0051116943359375, 0.03049468994140625, 0.055877685546875, 0.08126068115234375, 0.1066436767578125, 0.13202667236328125, 0.15740966796875, 0.18279266357421875, 0.2081756591796875, 0.23355865478515625, 0.258941650390625, 0.28432464599609375, 0.3097076416015625, 0.33509063720703125, 0.3604736328125, 0.38585662841796875, 0.4112396240234375, 0.43662261962890625, 0.462005615234375, 0.48738861083984375, 0.5127716064453125, 0.5381546020507812, 0.56353759765625, 0.5889205932617188, 0.6143035888671875, 0.6396865844726562, 0.665069580078125, 0.6904525756835938, 0.7158355712890625, 0.7412185668945312, 0.7666015625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 7.0, 9.0, 7.0, 21.0, 18.0, 31.0, 33.0, 41.0, 49.0, 56.0, 87.0, 70.0, 99.0, 83.0, 74.0, 72.0, 59.0, 57.0, 23.0, 26.0, 18.0, 20.0, 10.0, 11.0, 2.0, 5.0, 4.0, 2.0, 0.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2200927734375, -0.21214866638183594, -0.20420455932617188, -0.1962604522705078, -0.18831634521484375, -0.1803722381591797, -0.17242813110351562, -0.16448402404785156, -0.1565399169921875, -0.14859580993652344, -0.14065170288085938, -0.1327075958251953, -0.12476348876953125, -0.11681938171386719, -0.10887527465820312, -0.10093116760253906, -0.092987060546875, -0.08504295349121094, -0.07709884643554688, -0.06915473937988281, -0.06121063232421875, -0.05326652526855469, -0.045322418212890625, -0.03737831115722656, -0.0294342041015625, -0.021490097045898438, -0.013545989990234375, -0.0056018829345703125, 0.00234222412109375, 0.010286331176757812, 0.018230438232421875, 0.026174545288085938, 0.03411865234375, 0.04206275939941406, 0.050006866455078125, 0.05795097351074219, 0.06589508056640625, 0.07383918762207031, 0.08178329467773438, 0.08972740173339844, 0.0976715087890625, 0.10561561584472656, 0.11355972290039062, 0.12150382995605469, 0.12944793701171875, 0.1373920440673828, 0.14533615112304688, 0.15328025817871094, 0.161224365234375, 0.16916847229003906, 0.17711257934570312, 0.1850566864013672, 0.19300079345703125, 0.2009449005126953, 0.20888900756835938, 0.21683311462402344, 0.2247772216796875, 0.23272132873535156, 0.24066543579101562, 0.2486095428466797, 0.25655364990234375, 0.2644977569580078, 0.2724418640136719, 0.28038597106933594, 0.288330078125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 6.0, 19.0, 25.0, 19.0, 24.0, 29.0, 29.0, 51.0, 79.0, 74.0, 118.0, 169.0, 227.0, 308.0, 432.0, 575.0, 897.0, 1415.0, 2704.0, 7089.0, 53194.0, 4054179.0, 58274.0, 7196.0, 2672.0, 1413.0, 923.0, 574.0, 397.0, 268.0, 215.0, 159.0, 123.0, 114.0, 77.0, 46.0, 39.0, 28.0, 25.0, 22.0, 21.0, 5.0, 6.0, 9.0, 4.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.142578125, -1.105133056640625, -1.06768798828125, -1.030242919921875, -0.9927978515625, -0.955352783203125, -0.91790771484375, -0.880462646484375, -0.843017578125, -0.805572509765625, -0.76812744140625, -0.730682373046875, -0.6932373046875, -0.655792236328125, -0.61834716796875, -0.580902099609375, -0.54345703125, -0.506011962890625, -0.46856689453125, -0.431121826171875, -0.3936767578125, -0.356231689453125, -0.31878662109375, -0.281341552734375, -0.243896484375, -0.206451416015625, -0.16900634765625, -0.131561279296875, -0.0941162109375, -0.056671142578125, -0.01922607421875, 0.018218994140625, 0.0556640625, 0.093109130859375, 0.13055419921875, 0.167999267578125, 0.2054443359375, 0.242889404296875, 0.28033447265625, 0.317779541015625, 0.355224609375, 0.392669677734375, 0.43011474609375, 0.467559814453125, 0.5050048828125, 0.542449951171875, 0.57989501953125, 0.617340087890625, 0.65478515625, 0.692230224609375, 0.72967529296875, 0.767120361328125, 0.8045654296875, 0.842010498046875, 0.87945556640625, 0.916900634765625, 0.954345703125, 0.991790771484375, 1.02923583984375, 1.066680908203125, 1.1041259765625, 1.141571044921875, 1.17901611328125, 1.216461181640625, 1.25390625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 0.0, 8.0, 4.0, 19.0, 50.0, 288.0, 3345.0, 266.0, 52.0, 24.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67138671875, -0.6486282348632812, -0.6258697509765625, -0.6031112670898438, -0.580352783203125, -0.5575942993164062, -0.5348358154296875, -0.5120773315429688, -0.48931884765625, -0.46656036376953125, -0.4438018798828125, -0.42104339599609375, -0.398284912109375, -0.37552642822265625, -0.3527679443359375, -0.33000946044921875, -0.3072509765625, -0.28449249267578125, -0.2617340087890625, -0.23897552490234375, -0.216217041015625, -0.19345855712890625, -0.1707000732421875, -0.14794158935546875, -0.12518310546875, -0.10242462158203125, -0.0796661376953125, -0.05690765380859375, -0.034149169921875, -0.01139068603515625, 0.0113677978515625, 0.03412628173828125, 0.056884765625, 0.07964324951171875, 0.1024017333984375, 0.12516021728515625, 0.147918701171875, 0.17067718505859375, 0.1934356689453125, 0.21619415283203125, 0.23895263671875, 0.26171112060546875, 0.2844696044921875, 0.30722808837890625, 0.329986572265625, 0.35274505615234375, 0.3755035400390625, 0.39826202392578125, 0.4210205078125, 0.44377899169921875, 0.4665374755859375, 0.48929595947265625, 0.512054443359375, 0.5348129272460938, 0.5575714111328125, 0.5803298950195312, 0.60308837890625, 0.6258468627929688, 0.6486053466796875, 0.6713638305664062, 0.694122314453125, 0.7168807983398438, 0.7396392822265625, 0.7623977661132812, 0.78515625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 5.0, 6.0, 9.0, 20.0, 29.0, 44.0, 67.0, 86.0, 131.0, 220.0, 170.0, 120.0, 37.0, 24.0, 14.0, 4.0, 4.0, 3.0, 5.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7611165046691895, -3.661835193634033, -3.562554121017456, -3.4632728099823, -3.3639917373657227, -3.2647104263305664, -3.16542911529541, -3.066148042678833, -2.9668667316436768, -2.8675854206085205, -2.7683043479919434, -2.669023036956787, -2.56974196434021, -2.4704606533050537, -2.3711795806884766, -2.2718982696533203, -2.172616958618164, -2.073335647583008, -1.9740545749664307, -1.8747732639312744, -1.7754920721054077, -1.676210880279541, -1.5769296884536743, -1.4776484966278076, -1.3783674240112305, -1.2790862321853638, -1.179805040359497, -1.0805237293243408, -0.9812425374984741, -0.8819613456726074, -0.7826801538467407, -0.6833989024162292, -0.5841176509857178, -0.4848364293575287, -0.3855552077293396, -0.2862740159034729, -0.1869927942752838, -0.08771157264709473, 0.011569619178771973, 0.11085087060928345, 0.21013206243515015, 0.30941328406333923, 0.4086945056915283, 0.507975697517395, 0.6072568893432617, 0.7065381407737732, 0.8058193325996399, 0.9051005840301514, 1.004381775856018, 1.1036629676818848, 1.2029441595077515, 1.3022253513336182, 1.4015066623687744, 1.5007878541946411, 1.6000690460205078, 1.699350357055664, 1.7986314296722412, 1.897912621498108, 1.9971938133239746, 2.096475124359131, 2.195756196975708, 2.2950375080108643, 2.3943185806274414, 2.4935998916625977, 2.592881202697754]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 5.0, 11.0, 9.0, 12.0, 10.0, 13.0, 15.0, 10.0, 28.0, 14.0, 20.0, 27.0, 25.0, 25.0, 41.0, 32.0, 39.0, 33.0, 29.0, 40.0, 38.0, 36.0, 43.0, 43.0, 26.0, 30.0, 35.0, 28.0, 28.0, 30.0, 38.0, 26.0, 32.0, 22.0, 10.0, 18.0, 17.0, 14.0, 13.0, 10.0, 5.0, 6.0, 5.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1675562858581543, -1.1265923976898193, -1.085628628730774, -1.044664740562439, -1.0037009716033936, -0.9627370834350586, -0.9217732548713684, -0.8808094263076782, -0.839845597743988, -0.7988817691802979, -0.7579179406166077, -0.7169541120529175, -0.6759902238845825, -0.6350264549255371, -0.5940625667572021, -0.553098738193512, -0.5121349096298218, -0.4711710810661316, -0.4302072525024414, -0.38924339413642883, -0.34827956557273865, -0.30731573700904846, -0.2663518786430359, -0.2253880500793457, -0.18442422151565552, -0.14346039295196533, -0.10249654948711395, -0.06153271347284317, -0.020568877458572388, 0.020394951105117798, 0.06135879456996918, 0.10232263803482056, 0.14328646659851074, 0.18425029516220093, 0.2252141386270523, 0.2661779820919037, 0.30714181065559387, 0.34810563921928406, 0.38906949758529663, 0.4300333261489868, 0.470997154712677, 0.5119609832763672, 0.5529248118400574, 0.5938886404037476, 0.6348525285720825, 0.6758162975311279, 0.7167801856994629, 0.7577440142631531, 0.7987078428268433, 0.8396716713905334, 0.8806354999542236, 0.9215993285179138, 0.962563157081604, 1.003527045249939, 1.0444908142089844, 1.0854547023773193, 1.1264185905456543, 1.1673824787139893, 1.2083462476730347, 1.2493101358413696, 1.290273904800415, 1.33123779296875, 1.3722015619277954, 1.4131654500961304, 1.4541292190551758]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 8.0, 7.0, 15.0, 19.0, 29.0, 40.0, 58.0, 63.0, 103.0, 121.0, 169.0, 233.0, 361.0, 532.0, 798.0, 1277.0, 1895.0, 3216.0, 5296.0, 9800.0, 19642.0, 43859.0, 117470.0, 397464.0, 286468.0, 87840.0, 34883.0, 16053.0, 8289.0, 4652.0, 2731.0, 1733.0, 1071.0, 692.0, 512.0, 355.0, 258.0, 167.0, 115.0, 83.0, 50.0, 36.0, 29.0, 19.0, 20.0, 13.0, 7.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.51416015625, -0.49802398681640625, -0.4818878173828125, -0.46575164794921875, -0.449615478515625, -0.43347930908203125, -0.4173431396484375, -0.40120697021484375, -0.38507080078125, -0.36893463134765625, -0.3527984619140625, -0.33666229248046875, -0.320526123046875, -0.30438995361328125, -0.2882537841796875, -0.27211761474609375, -0.2559814453125, -0.23984527587890625, -0.2237091064453125, -0.20757293701171875, -0.191436767578125, -0.17530059814453125, -0.1591644287109375, -0.14302825927734375, -0.12689208984375, -0.11075592041015625, -0.0946197509765625, -0.07848358154296875, -0.062347412109375, -0.04621124267578125, -0.0300750732421875, -0.01393890380859375, 0.002197265625, 0.01833343505859375, 0.0344696044921875, 0.05060577392578125, 0.066741943359375, 0.08287811279296875, 0.0990142822265625, 0.11515045166015625, 0.13128662109375, 0.14742279052734375, 0.1635589599609375, 0.17969512939453125, 0.195831298828125, 0.21196746826171875, 0.2281036376953125, 0.24423980712890625, 0.2603759765625, 0.27651214599609375, 0.2926483154296875, 0.30878448486328125, 0.324920654296875, 0.34105682373046875, 0.3571929931640625, 0.37332916259765625, 0.38946533203125, 0.40560150146484375, 0.4217376708984375, 0.43787384033203125, 0.454010009765625, 0.47014617919921875, 0.4862823486328125, 0.5024185180664062, 0.5185546875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 6.0, 5.0, 4.0, 7.0, 12.0, 14.0, 19.0, 15.0, 27.0, 35.0, 45.0, 34.0, 48.0, 53.0, 75.0, 70.0, 57.0, 61.0, 59.0, 60.0, 52.0, 40.0, 38.0, 30.0, 26.0, 21.0, 27.0, 18.0, 12.0, 4.0, 6.0, 8.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23046875, -0.22274017333984375, -0.2150115966796875, -0.20728302001953125, -0.199554443359375, -0.19182586669921875, -0.1840972900390625, -0.17636871337890625, -0.16864013671875, -0.16091156005859375, -0.1531829833984375, -0.14545440673828125, -0.137725830078125, -0.12999725341796875, -0.1222686767578125, -0.11454010009765625, -0.1068115234375, -0.09908294677734375, -0.0913543701171875, -0.08362579345703125, -0.075897216796875, -0.06816864013671875, -0.0604400634765625, -0.05271148681640625, -0.04498291015625, -0.03725433349609375, -0.0295257568359375, -0.02179718017578125, -0.014068603515625, -0.00634002685546875, 0.0013885498046875, 0.00911712646484375, 0.016845703125, 0.02457427978515625, 0.0323028564453125, 0.04003143310546875, 0.047760009765625, 0.05548858642578125, 0.0632171630859375, 0.07094573974609375, 0.07867431640625, 0.08640289306640625, 0.0941314697265625, 0.10186004638671875, 0.109588623046875, 0.11731719970703125, 0.1250457763671875, 0.13277435302734375, 0.1405029296875, 0.14823150634765625, 0.1559600830078125, 0.16368865966796875, 0.171417236328125, 0.17914581298828125, 0.1868743896484375, 0.19460296630859375, 0.20233154296875, 0.21006011962890625, 0.2177886962890625, 0.22551727294921875, 0.233245849609375, 0.24097442626953125, 0.2487030029296875, 0.25643157958984375, 0.26416015625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 6.0, 12.0, 13.0, 16.0, 14.0, 27.0, 36.0, 42.0, 68.0, 101.0, 151.0, 203.0, 336.0, 579.0, 1142.0, 2528.0, 7506.0, 38161.0, 646599.0, 315725.0, 25138.0, 5650.0, 2045.0, 938.0, 542.0, 301.0, 224.0, 137.0, 81.0, 60.0, 48.0, 40.0, 21.0, 17.0, 16.0, 9.0, 12.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.08984375, -1.0521240234375, -1.014404296875, -0.9766845703125, -0.93896484375, -0.9012451171875, -0.863525390625, -0.8258056640625, -0.7880859375, -0.7503662109375, -0.712646484375, -0.6749267578125, -0.63720703125, -0.5994873046875, -0.561767578125, -0.5240478515625, -0.486328125, -0.4486083984375, -0.410888671875, -0.3731689453125, -0.33544921875, -0.2977294921875, -0.260009765625, -0.2222900390625, -0.1845703125, -0.1468505859375, -0.109130859375, -0.0714111328125, -0.03369140625, 0.0040283203125, 0.041748046875, 0.0794677734375, 0.1171875, 0.1549072265625, 0.192626953125, 0.2303466796875, 0.26806640625, 0.3057861328125, 0.343505859375, 0.3812255859375, 0.4189453125, 0.4566650390625, 0.494384765625, 0.5321044921875, 0.56982421875, 0.6075439453125, 0.645263671875, 0.6829833984375, 0.720703125, 0.7584228515625, 0.796142578125, 0.8338623046875, 0.87158203125, 0.9093017578125, 0.947021484375, 0.9847412109375, 1.0224609375, 1.0601806640625, 1.097900390625, 1.1356201171875, 1.17333984375, 1.2110595703125, 1.248779296875, 1.2864990234375, 1.32421875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 3.0, 6.0, 8.0, 12.0, 8.0, 7.0, 24.0, 12.0, 20.0, 31.0, 25.0, 28.0, 34.0, 39.0, 41.0, 42.0, 45.0, 50.0, 66.0, 46.0, 49.0, 48.0, 33.0, 42.0, 37.0, 40.0, 27.0, 23.0, 29.0, 24.0, 23.0, 14.0, 18.0, 8.0, 8.0, 9.0, 6.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.99462890625, -0.9638900756835938, -0.9331512451171875, -0.9024124145507812, -0.871673583984375, -0.8409347534179688, -0.8101959228515625, -0.7794570922851562, -0.74871826171875, -0.7179794311523438, -0.6872406005859375, -0.6565017700195312, -0.625762939453125, -0.5950241088867188, -0.5642852783203125, -0.5335464477539062, -0.5028076171875, -0.47206878662109375, -0.4413299560546875, -0.41059112548828125, -0.379852294921875, -0.34911346435546875, -0.3183746337890625, -0.28763580322265625, -0.25689697265625, -0.22615814208984375, -0.1954193115234375, -0.16468048095703125, -0.133941650390625, -0.10320281982421875, -0.0724639892578125, -0.04172515869140625, -0.010986328125, 0.01975250244140625, 0.0504913330078125, 0.08123016357421875, 0.111968994140625, 0.14270782470703125, 0.1734466552734375, 0.20418548583984375, 0.23492431640625, 0.26566314697265625, 0.2964019775390625, 0.32714080810546875, 0.357879638671875, 0.38861846923828125, 0.4193572998046875, 0.45009613037109375, 0.4808349609375, 0.5115737915039062, 0.5423126220703125, 0.5730514526367188, 0.603790283203125, 0.6345291137695312, 0.6652679443359375, 0.6960067749023438, 0.72674560546875, 0.7574844360351562, 0.7882232666015625, 0.8189620971679688, 0.849700927734375, 0.8804397583007812, 0.9111785888671875, 0.9419174194335938, 0.97265625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 12.0, 7.0, 25.0, 44.0, 69.0, 111.0, 324.0, 1282.0, 11913.0, 1006553.0, 25653.0, 1764.0, 432.0, 159.0, 82.0, 45.0, 25.0, 20.0, 11.0, 6.0, 4.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7529296875, -1.6894378662109375, -1.625946044921875, -1.5624542236328125, -1.49896240234375, -1.4354705810546875, -1.371978759765625, -1.3084869384765625, -1.2449951171875, -1.1815032958984375, -1.118011474609375, -1.0545196533203125, -0.99102783203125, -0.9275360107421875, -0.864044189453125, -0.8005523681640625, -0.737060546875, -0.6735687255859375, -0.610076904296875, -0.5465850830078125, -0.48309326171875, -0.4196014404296875, -0.356109619140625, -0.2926177978515625, -0.2291259765625, -0.1656341552734375, -0.102142333984375, -0.0386505126953125, 0.02484130859375, 0.0883331298828125, 0.151824951171875, 0.2153167724609375, 0.27880859375, 0.3423004150390625, 0.405792236328125, 0.4692840576171875, 0.53277587890625, 0.5962677001953125, 0.659759521484375, 0.7232513427734375, 0.7867431640625, 0.8502349853515625, 0.913726806640625, 0.9772186279296875, 1.04071044921875, 1.1042022705078125, 1.167694091796875, 1.2311859130859375, 1.294677734375, 1.3581695556640625, 1.421661376953125, 1.4851531982421875, 1.54864501953125, 1.6121368408203125, 1.675628662109375, 1.7391204833984375, 1.8026123046875, 1.8661041259765625, 1.929595947265625, 1.9930877685546875, 2.05657958984375, 2.1200714111328125, 2.183563232421875, 2.2470550537109375, 2.310546875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 4.0, 5.0, 2.0, 1.0, 2.0, 3.0, 3.0, 7.0, 16.0, 11.0, 17.0, 16.0, 28.0, 28.0, 42.0, 35.0, 57.0, 110.0, 175.0, 120.0, 69.0, 47.0, 37.0, 45.0, 29.0, 16.0, 14.0, 19.0, 8.0, 9.0, 4.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 6.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014483928680419922, -0.00014076754450798035, -0.00013669580221176147, -0.0001326240599155426, -0.00012855231761932373, -0.00012448057532310486, -0.00012040883302688599, -0.00011633709073066711, -0.00011226534843444824, -0.00010819360613822937, -0.0001041218638420105, -0.00010005012154579163, -9.597837924957275e-05, -9.190663695335388e-05, -8.783489465713501e-05, -8.376315236091614e-05, -7.969141006469727e-05, -7.56196677684784e-05, -7.154792547225952e-05, -6.747618317604065e-05, -6.340444087982178e-05, -5.9332698583602905e-05, -5.526095628738403e-05, -5.118921399116516e-05, -4.711747169494629e-05, -4.304572939872742e-05, -3.8973987102508545e-05, -3.490224480628967e-05, -3.08305025100708e-05, -2.675876021385193e-05, -2.2687017917633057e-05, -1.8615275621414185e-05, -1.4543533325195312e-05, -1.047179102897644e-05, -6.400048732757568e-06, -2.3283064365386963e-06, 1.7434358596801758e-06, 5.815178155899048e-06, 9.88692045211792e-06, 1.3958662748336792e-05, 1.8030405044555664e-05, 2.2102147340774536e-05, 2.6173889636993408e-05, 3.024563193321228e-05, 3.431737422943115e-05, 3.8389116525650024e-05, 4.2460858821868896e-05, 4.653260111808777e-05, 5.060434341430664e-05, 5.467608571052551e-05, 5.8747828006744385e-05, 6.281957030296326e-05, 6.689131259918213e-05, 7.0963054895401e-05, 7.503479719161987e-05, 7.910653948783875e-05, 8.317828178405762e-05, 8.725002408027649e-05, 9.132176637649536e-05, 9.539350867271423e-05, 9.94652509689331e-05, 0.00010353699326515198, 0.00010760873556137085, 0.00011168047785758972, 0.0001157522201538086]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 7.0, 7.0, 15.0, 37.0, 63.0, 115.0, 249.0, 785.0, 4732.0, 964838.0, 74390.0, 2419.0, 493.0, 169.0, 104.0, 51.0, 35.0, 16.0, 8.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.732421875, -1.665374755859375, -1.59832763671875, -1.531280517578125, -1.4642333984375, -1.397186279296875, -1.33013916015625, -1.263092041015625, -1.196044921875, -1.128997802734375, -1.06195068359375, -0.994903564453125, -0.9278564453125, -0.860809326171875, -0.79376220703125, -0.726715087890625, -0.65966796875, -0.592620849609375, -0.52557373046875, -0.458526611328125, -0.3914794921875, -0.324432373046875, -0.25738525390625, -0.190338134765625, -0.123291015625, -0.056243896484375, 0.01080322265625, 0.077850341796875, 0.1448974609375, 0.211944580078125, 0.27899169921875, 0.346038818359375, 0.4130859375, 0.480133056640625, 0.54718017578125, 0.614227294921875, 0.6812744140625, 0.748321533203125, 0.81536865234375, 0.882415771484375, 0.949462890625, 1.016510009765625, 1.08355712890625, 1.150604248046875, 1.2176513671875, 1.284698486328125, 1.35174560546875, 1.418792724609375, 1.48583984375, 1.552886962890625, 1.61993408203125, 1.686981201171875, 1.7540283203125, 1.821075439453125, 1.88812255859375, 1.955169677734375, 2.022216796875, 2.089263916015625, 2.15631103515625, 2.223358154296875, 2.2904052734375, 2.357452392578125, 2.42449951171875, 2.491546630859375, 2.55859375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 7.0, 12.0, 19.0, 38.0, 80.0, 242.0, 352.0, 143.0, 48.0, 22.0, 13.0, 8.0, 8.0, 4.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9921875, -1.94720458984375, -1.9022216796875, -1.85723876953125, -1.812255859375, -1.76727294921875, -1.7222900390625, -1.67730712890625, -1.63232421875, -1.58734130859375, -1.5423583984375, -1.49737548828125, -1.452392578125, -1.40740966796875, -1.3624267578125, -1.31744384765625, -1.2724609375, -1.22747802734375, -1.1824951171875, -1.13751220703125, -1.092529296875, -1.04754638671875, -1.0025634765625, -0.95758056640625, -0.91259765625, -0.86761474609375, -0.8226318359375, -0.77764892578125, -0.732666015625, -0.68768310546875, -0.6427001953125, -0.59771728515625, -0.552734375, -0.50775146484375, -0.4627685546875, -0.41778564453125, -0.372802734375, -0.32781982421875, -0.2828369140625, -0.23785400390625, -0.19287109375, -0.14788818359375, -0.1029052734375, -0.05792236328125, -0.012939453125, 0.03204345703125, 0.0770263671875, 0.12200927734375, 0.1669921875, 0.21197509765625, 0.2569580078125, 0.30194091796875, 0.346923828125, 0.39190673828125, 0.4368896484375, 0.48187255859375, 0.52685546875, 0.57183837890625, 0.6168212890625, 0.66180419921875, 0.706787109375, 0.75177001953125, 0.7967529296875, 0.84173583984375, 0.88671875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 4.0, 3.0, 3.0, 16.0, 16.0, 42.0, 121.0, 217.0, 258.0, 185.0, 76.0, 37.0, 8.0, 7.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.154760360717773, -11.741466522216797, -11.32817268371582, -10.914877891540527, -10.50158405303955, -10.088290214538574, -9.674995422363281, -9.261701583862305, -8.848407745361328, -8.435113906860352, -8.021820068359375, -7.608525276184082, -7.1952314376831055, -6.781937599182129, -6.368643283843994, -5.955348968505859, -5.542055130004883, -5.128761291503906, -4.7154669761657715, -4.302172660827637, -3.88887882232666, -3.4755847454071045, -3.062290668487549, -2.648996591567993, -2.2357025146484375, -1.8224084377288818, -1.4091143608093262, -0.9958202838897705, -0.5825262069702148, -0.16923213005065918, 0.24406194686889648, 0.6573560237884521, 1.0706491470336914, 1.483943223953247, 1.8972373008728027, 2.3105313777923584, 2.723825454711914, 3.1371195316314697, 3.5504136085510254, 3.963707685470581, 4.377001762390137, 4.790295600891113, 5.203589916229248, 5.616884231567383, 6.030178070068359, 6.443471908569336, 6.856766223907471, 7.2700605392456055, 7.683354377746582, 8.096648216247559, 8.509943008422852, 8.923236846923828, 9.336530685424805, 9.749824523925781, 10.163118362426758, 10.57641315460205, 10.989706993103027, 11.403000831604004, 11.816295623779297, 12.229589462280273, 12.64288330078125, 13.056177139282227, 13.469470977783203, 13.882765769958496, 14.296059608459473]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 10.0, 7.0, 12.0, 11.0, 14.0, 13.0, 26.0, 25.0, 35.0, 38.0, 35.0, 51.0, 48.0, 51.0, 61.0, 54.0, 61.0, 47.0, 53.0, 41.0, 43.0, 39.0, 37.0, 33.0, 25.0, 21.0, 13.0, 23.0, 16.0, 23.0, 6.0, 4.0, 7.0, 5.0, 3.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-6.578887939453125, -6.398497104644775, -6.218106746673584, -6.037715911865234, -5.857325077056885, -5.676934242248535, -5.496543884277344, -5.316153049468994, -5.1357622146606445, -4.955371379852295, -4.7749810218811035, -4.594590187072754, -4.414199352264404, -4.233808517456055, -4.053418159484863, -3.8730273246765137, -3.6926369667053223, -3.5122463703155518, -3.331855535507202, -3.1514649391174316, -2.971074104309082, -2.7906835079193115, -2.610292911529541, -2.4299020767211914, -2.249511480331421, -2.0691208839416504, -1.8887300491333008, -1.7083394527435303, -1.5279487371444702, -1.3475580215454102, -1.1671674251556396, -0.9867767095565796, -0.8063864707946777, -0.6259957551956177, -0.4456050992012024, -0.2652144432067871, -0.08482372760772705, 0.09556698799133301, 0.2759575843811035, 0.4563482999801636, 0.6367390155792236, 0.8171297311782837, 0.997520387172699, 1.1779110431671143, 1.3583017587661743, 1.5386924743652344, 1.7190830707550049, 1.899473786354065, 2.079864501953125, 2.2602550983428955, 2.440645933151245, 2.6210365295410156, 2.8014273643493652, 2.9818179607391357, 3.1622085571289062, 3.342599391937256, 3.5229899883270264, 3.703380584716797, 3.8837714195251465, 4.064162254333496, 4.2445526123046875, 4.424943447113037, 4.605334281921387, 4.785724639892578, 4.966115474700928]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 6.0, 5.0, 8.0, 13.0, 29.0, 21.0, 41.0, 72.0, 113.0, 176.0, 301.0, 501.0, 897.0, 1857.0, 3618.0, 8599.0, 26178.0, 138686.0, 1605173.0, 2195134.0, 163445.0, 30358.0, 9996.0, 4237.0, 2047.0, 1114.0, 636.0, 395.0, 225.0, 168.0, 81.0, 67.0, 31.0, 15.0, 13.0, 10.0, 5.0, 3.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.45458984375, -0.43894195556640625, -0.4232940673828125, -0.40764617919921875, -0.391998291015625, -0.37635040283203125, -0.3607025146484375, -0.34505462646484375, -0.32940673828125, -0.31375885009765625, -0.2981109619140625, -0.28246307373046875, -0.266815185546875, -0.25116729736328125, -0.2355194091796875, -0.21987152099609375, -0.2042236328125, -0.18857574462890625, -0.1729278564453125, -0.15727996826171875, -0.141632080078125, -0.12598419189453125, -0.1103363037109375, -0.09468841552734375, -0.07904052734375, -0.06339263916015625, -0.0477447509765625, -0.03209686279296875, -0.016448974609375, -0.00080108642578125, 0.0148468017578125, 0.03049468994140625, 0.046142578125, 0.06179046630859375, 0.0774383544921875, 0.09308624267578125, 0.108734130859375, 0.12438201904296875, 0.1400299072265625, 0.15567779541015625, 0.17132568359375, 0.18697357177734375, 0.2026214599609375, 0.21826934814453125, 0.233917236328125, 0.24956512451171875, 0.2652130126953125, 0.28086090087890625, 0.2965087890625, 0.31215667724609375, 0.3278045654296875, 0.34345245361328125, 0.359100341796875, 0.37474822998046875, 0.3903961181640625, 0.40604400634765625, 0.42169189453125, 0.43733978271484375, 0.4529876708984375, 0.46863555908203125, 0.484283447265625, 0.49993133544921875, 0.5155792236328125, 0.5312271118164062, 0.546875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 6.0, 5.0, 10.0, 6.0, 10.0, 13.0, 20.0, 22.0, 25.0, 38.0, 39.0, 50.0, 37.0, 56.0, 54.0, 60.0, 66.0, 65.0, 60.0, 42.0, 48.0, 45.0, 46.0, 35.0, 35.0, 15.0, 15.0, 13.0, 13.0, 11.0, 13.0, 6.0, 5.0, 8.0, 6.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.254150390625, -0.24667930603027344, -0.23920822143554688, -0.2317371368408203, -0.22426605224609375, -0.2167949676513672, -0.20932388305664062, -0.20185279846191406, -0.1943817138671875, -0.18691062927246094, -0.17943954467773438, -0.1719684600830078, -0.16449737548828125, -0.1570262908935547, -0.14955520629882812, -0.14208412170410156, -0.134613037109375, -0.12714195251464844, -0.11967086791992188, -0.11219978332519531, -0.10472869873046875, -0.09725761413574219, -0.08978652954101562, -0.08231544494628906, -0.0748443603515625, -0.06737327575683594, -0.059902191162109375, -0.05243110656738281, -0.04496002197265625, -0.03748893737792969, -0.030017852783203125, -0.022546768188476562, -0.01507568359375, -0.0076045989990234375, -0.000133514404296875, 0.0073375701904296875, 0.01480865478515625, 0.022279739379882812, 0.029750823974609375, 0.03722190856933594, 0.0446929931640625, 0.05216407775878906, 0.059635162353515625, 0.06710624694824219, 0.07457733154296875, 0.08204841613769531, 0.08951950073242188, 0.09699058532714844, 0.104461669921875, 0.11193275451660156, 0.11940383911132812, 0.1268749237060547, 0.13434600830078125, 0.1418170928955078, 0.14928817749023438, 0.15675926208496094, 0.1642303466796875, 0.17170143127441406, 0.17917251586914062, 0.1866436004638672, 0.19411468505859375, 0.2015857696533203, 0.20905685424804688, 0.21652793884277344, 0.2239990234375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 9.0, 9.0, 16.0, 16.0, 35.0, 54.0, 99.0, 186.0, 363.0, 977.0, 2794.0, 11037.0, 71830.0, 3341382.0, 719565.0, 35862.0, 6789.0, 1848.0, 717.0, 289.0, 165.0, 84.0, 61.0, 34.0, 16.0, 19.0, 8.0, 9.0, 5.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1455078125, -1.1135406494140625, -1.081573486328125, -1.0496063232421875, -1.01763916015625, -0.9856719970703125, -0.953704833984375, -0.9217376708984375, -0.8897705078125, -0.8578033447265625, -0.825836181640625, -0.7938690185546875, -0.76190185546875, -0.7299346923828125, -0.697967529296875, -0.6660003662109375, -0.634033203125, -0.6020660400390625, -0.570098876953125, -0.5381317138671875, -0.50616455078125, -0.4741973876953125, -0.442230224609375, -0.4102630615234375, -0.3782958984375, -0.3463287353515625, -0.314361572265625, -0.2823944091796875, -0.25042724609375, -0.2184600830078125, -0.186492919921875, -0.1545257568359375, -0.12255859375, -0.0905914306640625, -0.058624267578125, -0.0266571044921875, 0.00531005859375, 0.0372772216796875, 0.069244384765625, 0.1012115478515625, 0.1331787109375, 0.1651458740234375, 0.197113037109375, 0.2290802001953125, 0.26104736328125, 0.2930145263671875, 0.324981689453125, 0.3569488525390625, 0.388916015625, 0.4208831787109375, 0.452850341796875, 0.4848175048828125, 0.51678466796875, 0.5487518310546875, 0.580718994140625, 0.6126861572265625, 0.6446533203125, 0.6766204833984375, 0.708587646484375, 0.7405548095703125, 0.77252197265625, 0.8044891357421875, 0.836456298828125, 0.8684234619140625, 0.900390625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 7.0, 6.0, 4.0, 10.0, 11.0, 18.0, 24.0, 40.0, 46.0, 131.0, 328.0, 794.0, 1386.0, 702.0, 235.0, 116.0, 86.0, 49.0, 29.0, 13.0, 14.0, 8.0, 11.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75, -0.715057373046875, -0.68011474609375, -0.645172119140625, -0.6102294921875, -0.575286865234375, -0.54034423828125, -0.505401611328125, -0.470458984375, -0.435516357421875, -0.40057373046875, -0.365631103515625, -0.3306884765625, -0.295745849609375, -0.26080322265625, -0.225860595703125, -0.19091796875, -0.155975341796875, -0.12103271484375, -0.086090087890625, -0.0511474609375, -0.016204833984375, 0.01873779296875, 0.053680419921875, 0.088623046875, 0.123565673828125, 0.15850830078125, 0.193450927734375, 0.2283935546875, 0.263336181640625, 0.29827880859375, 0.333221435546875, 0.3681640625, 0.403106689453125, 0.43804931640625, 0.472991943359375, 0.5079345703125, 0.542877197265625, 0.57781982421875, 0.612762451171875, 0.647705078125, 0.682647705078125, 0.71759033203125, 0.752532958984375, 0.7874755859375, 0.822418212890625, 0.85736083984375, 0.892303466796875, 0.92724609375, 0.962188720703125, 0.99713134765625, 1.032073974609375, 1.0670166015625, 1.101959228515625, 1.13690185546875, 1.171844482421875, 1.206787109375, 1.241729736328125, 1.27667236328125, 1.311614990234375, 1.3465576171875, 1.381500244140625, 1.41644287109375, 1.451385498046875, 1.486328125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 5.0, 9.0, 18.0, 40.0, 108.0, 255.0, 299.0, 152.0, 66.0, 26.0, 7.0, 7.0, 0.0, 7.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.832291603088379, -11.486713409423828, -11.141134262084961, -10.79555606842041, -10.44997787475586, -10.104398727416992, -9.758820533752441, -9.41324234008789, -9.067663192749023, -8.722084999084473, -8.376505851745605, -8.030927658081055, -7.685349464416504, -7.339770793914795, -6.994192123413086, -6.648613929748535, -6.303035736083984, -5.957457065582275, -5.611878871917725, -5.266300201416016, -4.920722007751465, -4.575143337249756, -4.229564666748047, -3.883986234664917, -3.538407802581787, -3.1928293704986572, -2.8472509384155273, -2.5016722679138184, -2.1560938358306885, -1.8105154037475586, -1.4649367332458496, -1.1193583011627197, -0.7737789154052734, -0.4282004237174988, -0.08262193202972412, 0.2629566192626953, 0.6085350513458252, 0.9541134834289551, 1.299692153930664, 1.645270586013794, 1.9908490180969238, 2.3364274501800537, 2.6820058822631836, 3.0275845527648926, 3.3731629848480225, 3.7187414169311523, 4.064320087432861, 4.40989875793457, 4.755476951599121, 5.10105562210083, 5.446633815765381, 5.79221248626709, 6.137790679931641, 6.48336935043335, 6.828948020935059, 7.174526214599609, 7.520104885101318, 7.865683555603027, 8.211261749267578, 8.556840896606445, 8.902419090270996, 9.247997283935547, 9.593576431274414, 9.939154624938965, 10.284732818603516]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 2.0, 3.0, 6.0, 6.0, 10.0, 3.0, 11.0, 5.0, 24.0, 13.0, 16.0, 21.0, 27.0, 27.0, 34.0, 26.0, 43.0, 38.0, 53.0, 51.0, 37.0, 56.0, 55.0, 51.0, 35.0, 46.0, 42.0, 33.0, 31.0, 26.0, 30.0, 20.0, 22.0, 20.0, 21.0, 12.0, 12.0, 6.0, 4.0, 8.0, 8.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-3.4748730659484863, -3.372300863265991, -3.269728422164917, -3.167156219482422, -3.0645837783813477, -2.9620115756988525, -2.8594393730163574, -2.756866931915283, -2.654294729232788, -2.551722526550293, -2.4491500854492188, -2.3465778827667236, -2.2440054416656494, -2.1414332389831543, -2.03886079788208, -1.936288595199585, -1.8337162733078003, -1.7311439514160156, -1.628571629524231, -1.5259993076324463, -1.4234271049499512, -1.3208547830581665, -1.2182824611663818, -1.1157102584838867, -1.0131378173828125, -0.9105654954910278, -0.8079932332038879, -0.7054209113121033, -0.6028486490249634, -0.5002763271331787, -0.39770400524139404, -0.29513174295425415, -0.19255948066711426, -0.08998718112707138, 0.012585118412971497, 0.11515742540359497, 0.21772971749305725, 0.32030200958251953, 0.4228743314743042, 0.5254465937614441, 0.6280189156532288, 0.7305912375450134, 0.8331634998321533, 0.935735821723938, 1.0383081436157227, 1.1408803462982178, 1.243452787399292, 1.346024990081787, 1.4485973119735718, 1.5511696338653564, 1.6537419557571411, 1.7563142776489258, 1.858886480331421, 1.9614588022232056, 2.0640311241149902, 2.1666033267974854, 2.2691757678985596, 2.3717479705810547, 2.474320411682129, 2.576892614364624, 2.6794650554656982, 2.7820372581481934, 2.8846096992492676, 2.9871819019317627, 3.089754104614258]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 3.0, 6.0, 4.0, 14.0, 15.0, 25.0, 31.0, 55.0, 67.0, 122.0, 191.0, 280.0, 538.0, 844.0, 1587.0, 3034.0, 6474.0, 14727.0, 40554.0, 170407.0, 630744.0, 122043.0, 32728.0, 12450.0, 5424.0, 2694.0, 1455.0, 774.0, 485.0, 259.0, 187.0, 94.0, 76.0, 52.0, 34.0, 19.0, 16.0, 10.0, 11.0, 5.0, 7.0, 4.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.8896484375, -0.8652114868164062, -0.8407745361328125, -0.8163375854492188, -0.791900634765625, -0.7674636840820312, -0.7430267333984375, -0.7185897827148438, -0.69415283203125, -0.6697158813476562, -0.6452789306640625, -0.6208419799804688, -0.596405029296875, -0.5719680786132812, -0.5475311279296875, -0.5230941772460938, -0.4986572265625, -0.47422027587890625, -0.4497833251953125, -0.42534637451171875, -0.400909423828125, -0.37647247314453125, -0.3520355224609375, -0.32759857177734375, -0.30316162109375, -0.27872467041015625, -0.2542877197265625, -0.22985076904296875, -0.205413818359375, -0.18097686767578125, -0.1565399169921875, -0.13210296630859375, -0.107666015625, -0.08322906494140625, -0.0587921142578125, -0.03435516357421875, -0.009918212890625, 0.01451873779296875, 0.0389556884765625, 0.06339263916015625, 0.08782958984375, 0.11226654052734375, 0.1367034912109375, 0.16114044189453125, 0.185577392578125, 0.21001434326171875, 0.2344512939453125, 0.25888824462890625, 0.2833251953125, 0.30776214599609375, 0.3321990966796875, 0.35663604736328125, 0.381072998046875, 0.40550994873046875, 0.4299468994140625, 0.45438385009765625, 0.47882080078125, 0.5032577514648438, 0.5276947021484375, 0.5521316528320312, 0.576568603515625, 0.6010055541992188, 0.6254425048828125, 0.6498794555664062, 0.67431640625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 6.0, 6.0, 3.0, 5.0, 6.0, 13.0, 10.0, 19.0, 27.0, 35.0, 36.0, 38.0, 57.0, 55.0, 55.0, 62.0, 62.0, 71.0, 60.0, 60.0, 44.0, 48.0, 49.0, 33.0, 29.0, 28.0, 18.0, 7.0, 22.0, 12.0, 6.0, 4.0, 4.0, 2.0, 5.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2958984375, -0.2869453430175781, -0.27799224853515625, -0.2690391540527344, -0.2600860595703125, -0.2511329650878906, -0.24217987060546875, -0.23322677612304688, -0.224273681640625, -0.21532058715820312, -0.20636749267578125, -0.19741439819335938, -0.1884613037109375, -0.17950820922851562, -0.17055511474609375, -0.16160202026367188, -0.15264892578125, -0.14369583129882812, -0.13474273681640625, -0.12578964233398438, -0.1168365478515625, -0.10788345336914062, -0.09893035888671875, -0.08997726440429688, -0.081024169921875, -0.07207107543945312, -0.06311798095703125, -0.054164886474609375, -0.0452117919921875, -0.036258697509765625, -0.02730560302734375, -0.018352508544921875, -0.0093994140625, -0.000446319580078125, 0.00850677490234375, 0.017459869384765625, 0.0264129638671875, 0.035366058349609375, 0.04431915283203125, 0.053272247314453125, 0.062225341796875, 0.07117843627929688, 0.08013153076171875, 0.08908462524414062, 0.0980377197265625, 0.10699081420898438, 0.11594390869140625, 0.12489700317382812, 0.13385009765625, 0.14280319213867188, 0.15175628662109375, 0.16070938110351562, 0.1696624755859375, 0.17861557006835938, 0.18756866455078125, 0.19652175903320312, 0.205474853515625, 0.21442794799804688, 0.22338104248046875, 0.23233413696289062, 0.2412872314453125, 0.2502403259277344, 0.25919342041015625, 0.2681465148925781, 0.277099609375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 2.0, 5.0, 7.0, 7.0, 12.0, 13.0, 15.0, 28.0, 42.0, 45.0, 56.0, 90.0, 99.0, 169.0, 203.0, 349.0, 563.0, 1088.0, 2341.0, 6201.0, 26814.0, 552600.0, 421809.0, 24989.0, 5927.0, 2262.0, 1092.0, 568.0, 354.0, 231.0, 158.0, 108.0, 73.0, 54.0, 45.0, 27.0, 28.0, 14.0, 9.0, 13.0, 11.0, 6.0, 2.0, 4.0, 2.0, 4.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0], "bins": [-1.533203125, -1.4880828857421875, -1.442962646484375, -1.3978424072265625, -1.35272216796875, -1.3076019287109375, -1.262481689453125, -1.2173614501953125, -1.1722412109375, -1.1271209716796875, -1.082000732421875, -1.0368804931640625, -0.99176025390625, -0.9466400146484375, -0.901519775390625, -0.8563995361328125, -0.811279296875, -0.7661590576171875, -0.721038818359375, -0.6759185791015625, -0.63079833984375, -0.5856781005859375, -0.540557861328125, -0.4954376220703125, -0.4503173828125, -0.4051971435546875, -0.360076904296875, -0.3149566650390625, -0.26983642578125, -0.2247161865234375, -0.179595947265625, -0.1344757080078125, -0.08935546875, -0.0442352294921875, 0.000885009765625, 0.0460052490234375, 0.09112548828125, 0.1362457275390625, 0.181365966796875, 0.2264862060546875, 0.2716064453125, 0.3167266845703125, 0.361846923828125, 0.4069671630859375, 0.45208740234375, 0.4972076416015625, 0.542327880859375, 0.5874481201171875, 0.632568359375, 0.6776885986328125, 0.722808837890625, 0.7679290771484375, 0.81304931640625, 0.8581695556640625, 0.903289794921875, 0.9484100341796875, 0.9935302734375, 1.0386505126953125, 1.083770751953125, 1.1288909912109375, 1.17401123046875, 1.2191314697265625, 1.264251708984375, 1.3093719482421875, 1.3544921875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 5.0, 4.0, 10.0, 13.0, 15.0, 28.0, 13.0, 20.0, 21.0, 30.0, 30.0, 43.0, 43.0, 57.0, 55.0, 56.0, 61.0, 63.0, 42.0, 49.0, 42.0, 38.0, 40.0, 38.0, 18.0, 38.0, 20.0, 19.0, 18.0, 7.0, 12.0, 12.0, 5.0, 6.0, 6.0, 4.0, 2.0, 5.0, 5.0, 4.0, 1.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3056640625, -1.264984130859375, -1.22430419921875, -1.183624267578125, -1.1429443359375, -1.102264404296875, -1.06158447265625, -1.020904541015625, -0.980224609375, -0.939544677734375, -0.89886474609375, -0.858184814453125, -0.8175048828125, -0.776824951171875, -0.73614501953125, -0.695465087890625, -0.65478515625, -0.614105224609375, -0.57342529296875, -0.532745361328125, -0.4920654296875, -0.451385498046875, -0.41070556640625, -0.370025634765625, -0.329345703125, -0.288665771484375, -0.24798583984375, -0.207305908203125, -0.1666259765625, -0.125946044921875, -0.08526611328125, -0.044586181640625, -0.00390625, 0.036773681640625, 0.07745361328125, 0.118133544921875, 0.1588134765625, 0.199493408203125, 0.24017333984375, 0.280853271484375, 0.321533203125, 0.362213134765625, 0.40289306640625, 0.443572998046875, 0.4842529296875, 0.524932861328125, 0.56561279296875, 0.606292724609375, 0.64697265625, 0.687652587890625, 0.72833251953125, 0.769012451171875, 0.8096923828125, 0.850372314453125, 0.89105224609375, 0.931732177734375, 0.972412109375, 1.013092041015625, 1.05377197265625, 1.094451904296875, 1.1351318359375, 1.175811767578125, 1.21649169921875, 1.257171630859375, 1.2978515625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 2.0, 4.0, 8.0, 6.0, 10.0, 24.0, 30.0, 71.0, 79.0, 154.0, 319.0, 793.0, 1934.0, 7685.0, 65057.0, 913975.0, 48839.0, 6390.0, 1826.0, 666.0, 289.0, 142.0, 82.0, 53.0, 38.0, 25.0, 16.0, 9.0, 6.0, 7.0, 6.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7216796875, -0.697174072265625, -0.67266845703125, -0.648162841796875, -0.6236572265625, -0.599151611328125, -0.57464599609375, -0.550140380859375, -0.525634765625, -0.501129150390625, -0.47662353515625, -0.452117919921875, -0.4276123046875, -0.403106689453125, -0.37860107421875, -0.354095458984375, -0.32958984375, -0.305084228515625, -0.28057861328125, -0.256072998046875, -0.2315673828125, -0.207061767578125, -0.18255615234375, -0.158050537109375, -0.133544921875, -0.109039306640625, -0.08453369140625, -0.060028076171875, -0.0355224609375, -0.011016845703125, 0.01348876953125, 0.037994384765625, 0.0625, 0.087005615234375, 0.11151123046875, 0.136016845703125, 0.1605224609375, 0.185028076171875, 0.20953369140625, 0.234039306640625, 0.258544921875, 0.283050537109375, 0.30755615234375, 0.332061767578125, 0.3565673828125, 0.381072998046875, 0.40557861328125, 0.430084228515625, 0.45458984375, 0.479095458984375, 0.50360107421875, 0.528106689453125, 0.5526123046875, 0.577117919921875, 0.60162353515625, 0.626129150390625, 0.650634765625, 0.675140380859375, 0.69964599609375, 0.724151611328125, 0.7486572265625, 0.773162841796875, 0.79766845703125, 0.822174072265625, 0.8466796875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 10.0, 11.0, 16.0, 26.0, 44.0, 45.0, 79.0, 205.0, 230.0, 147.0, 62.0, 33.0, 33.0, 17.0, 8.0, 8.0, 7.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016260147094726562, -0.00015639327466487885, -0.00015018507838249207, -0.00014397688210010529, -0.0001377686858177185, -0.00013156048953533173, -0.00012535229325294495, -0.00011914409697055817, -0.00011293590068817139, -0.00010672770440578461, -0.00010051950812339783, -9.431131184101105e-05, -8.810311555862427e-05, -8.189491927623749e-05, -7.568672299385071e-05, -6.947852671146393e-05, -6.327033042907715e-05, -5.706213414669037e-05, -5.085393786430359e-05, -4.464574158191681e-05, -3.843754529953003e-05, -3.222934901714325e-05, -2.602115273475647e-05, -1.981295645236969e-05, -1.360476016998291e-05, -7.39656388759613e-06, -1.1883676052093506e-06, 5.019828677177429e-06, 1.1228024959564209e-05, 1.743622124195099e-05, 2.364441752433777e-05, 2.985261380672455e-05, 3.606081008911133e-05, 4.226900637149811e-05, 4.847720265388489e-05, 5.468539893627167e-05, 6.089359521865845e-05, 6.710179150104523e-05, 7.330998778343201e-05, 7.951818406581879e-05, 8.572638034820557e-05, 9.193457663059235e-05, 9.814277291297913e-05, 0.0001043509691953659, 0.00011055916547775269, 0.00011676736176013947, 0.00012297555804252625, 0.00012918375432491302, 0.0001353919506072998, 0.00014160014688968658, 0.00014780834317207336, 0.00015401653945446014, 0.00016022473573684692, 0.0001664329320192337, 0.00017264112830162048, 0.00017884932458400726, 0.00018505752086639404, 0.00019126571714878082, 0.0001974739134311676, 0.00020368210971355438, 0.00020989030599594116, 0.00021609850227832794, 0.00022230669856071472, 0.0002285148948431015, 0.00023472309112548828]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 6.0, 12.0, 10.0, 12.0, 17.0, 25.0, 31.0, 47.0, 77.0, 146.0, 179.0, 304.0, 606.0, 1280.0, 3521.0, 15001.0, 216758.0, 767865.0, 33317.0, 5692.0, 1772.0, 784.0, 394.0, 229.0, 149.0, 93.0, 55.0, 43.0, 32.0, 15.0, 18.0, 13.0, 11.0, 10.0, 2.0, 5.0, 9.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.5859375, -0.5682830810546875, -0.550628662109375, -0.5329742431640625, -0.51531982421875, -0.4976654052734375, -0.480010986328125, -0.4623565673828125, -0.4447021484375, -0.4270477294921875, -0.409393310546875, -0.3917388916015625, -0.37408447265625, -0.3564300537109375, -0.338775634765625, -0.3211212158203125, -0.303466796875, -0.2858123779296875, -0.268157958984375, -0.2505035400390625, -0.23284912109375, -0.2151947021484375, -0.197540283203125, -0.1798858642578125, -0.1622314453125, -0.1445770263671875, -0.126922607421875, -0.1092681884765625, -0.09161376953125, -0.0739593505859375, -0.056304931640625, -0.0386505126953125, -0.02099609375, -0.0033416748046875, 0.014312744140625, 0.0319671630859375, 0.04962158203125, 0.0672760009765625, 0.084930419921875, 0.1025848388671875, 0.1202392578125, 0.1378936767578125, 0.155548095703125, 0.1732025146484375, 0.19085693359375, 0.2085113525390625, 0.226165771484375, 0.2438201904296875, 0.261474609375, 0.2791290283203125, 0.296783447265625, 0.3144378662109375, 0.33209228515625, 0.3497467041015625, 0.367401123046875, 0.3850555419921875, 0.4027099609375, 0.4203643798828125, 0.438018798828125, 0.4556732177734375, 0.47332763671875, 0.4909820556640625, 0.508636474609375, 0.5262908935546875, 0.5439453125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 10.0, 4.0, 6.0, 4.0, 15.0, 16.0, 29.0, 30.0, 34.0, 54.0, 60.0, 88.0, 92.0, 93.0, 97.0, 71.0, 64.0, 61.0, 49.0, 22.0, 27.0, 15.0, 10.0, 10.0, 8.0, 4.0, 5.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.44873046875, -0.43642425537109375, -0.4241180419921875, -0.41181182861328125, -0.399505615234375, -0.38719940185546875, -0.3748931884765625, -0.36258697509765625, -0.35028076171875, -0.33797454833984375, -0.3256683349609375, -0.31336212158203125, -0.301055908203125, -0.28874969482421875, -0.2764434814453125, -0.26413726806640625, -0.2518310546875, -0.23952484130859375, -0.2272186279296875, -0.21491241455078125, -0.202606201171875, -0.19029998779296875, -0.1779937744140625, -0.16568756103515625, -0.15338134765625, -0.14107513427734375, -0.1287689208984375, -0.11646270751953125, -0.104156494140625, -0.09185028076171875, -0.0795440673828125, -0.06723785400390625, -0.054931640625, -0.04262542724609375, -0.0303192138671875, -0.01801300048828125, -0.005706787109375, 0.00659942626953125, 0.0189056396484375, 0.03121185302734375, 0.04351806640625, 0.05582427978515625, 0.0681304931640625, 0.08043670654296875, 0.092742919921875, 0.10504913330078125, 0.1173553466796875, 0.12966156005859375, 0.1419677734375, 0.15427398681640625, 0.1665802001953125, 0.17888641357421875, 0.191192626953125, 0.20349884033203125, 0.2158050537109375, 0.22811126708984375, 0.24041748046875, 0.25272369384765625, 0.2650299072265625, 0.27733612060546875, 0.289642333984375, 0.30194854736328125, 0.3142547607421875, 0.32656097412109375, 0.3388671875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 5.0, 3.0, 7.0, 17.0, 45.0, 107.0, 208.0, 332.0, 185.0, 58.0, 19.0, 10.0, 9.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.230348587036133, -9.773762702941895, -9.317176818847656, -8.860590934753418, -8.40400505065918, -7.947419166564941, -7.490833282470703, -7.034247398376465, -6.577661514282227, -6.121075630187988, -5.66448974609375, -5.207903861999512, -4.751317977905273, -4.294732093811035, -3.838146448135376, -3.3815605640411377, -2.9249749183654785, -2.4683890342712402, -2.011803150177002, -1.5552173852920532, -1.098631501197815, -0.6420457363128662, -0.18545985221862793, 0.27112603187561035, 0.7277119159698486, 1.184297800064087, 1.6408836841583252, 2.0974693298339844, 2.5540552139282227, 3.010641098022461, 3.467226982116699, 3.9238128662109375, 4.380398750305176, 4.836984634399414, 5.293570518493652, 5.750156402587891, 6.206742286682129, 6.663328170776367, 7.1199140548706055, 7.576499938964844, 8.033085823059082, 8.48967170715332, 8.946257591247559, 9.402843475341797, 9.859429359436035, 10.316015243530273, 10.772601127624512, 11.22918701171875, 11.685771942138672, 12.14235782623291, 12.598943710327148, 13.055529594421387, 13.512115478515625, 13.968701362609863, 14.425287246704102, 14.88187313079834, 15.338459014892578, 15.795044898986816, 16.251630783081055, 16.708215713500977, 17.16480255126953, 17.621387481689453, 18.077974319458008, 18.53455924987793, 18.991146087646484]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 11.0, 6.0, 12.0, 11.0, 26.0, 23.0, 41.0, 51.0, 44.0, 54.0, 62.0, 71.0, 72.0, 78.0, 74.0, 71.0, 52.0, 58.0, 45.0, 41.0, 26.0, 21.0, 17.0, 16.0, 5.0, 9.0, 7.0, 9.0, 2.0, 0.0, 1.0], "bins": [-9.658439636230469, -9.449823379516602, -9.241207122802734, -9.032590866088867, -8.823974609375, -8.615358352661133, -8.406742095947266, -8.198126792907715, -7.989510536193848, -7.7808942794799805, -7.572278022766113, -7.363661766052246, -7.155045986175537, -6.94642972946167, -6.737813472747803, -6.5291972160339355, -6.320580959320068, -6.111964702606201, -5.903348445892334, -5.694732666015625, -5.486116409301758, -5.277500152587891, -5.068883895874023, -4.860267639160156, -4.651651382446289, -4.443035125732422, -4.234418869018555, -4.0258026123046875, -3.8171868324279785, -3.6085705757141113, -3.399954319000244, -3.191338062286377, -2.982722759246826, -2.774106502532959, -2.565490484237671, -2.3568742275238037, -2.1482582092285156, -1.9396419525146484, -1.7310256958007812, -1.5224095582962036, -1.313793420791626, -1.1051772832870483, -0.8965610861778259, -0.6879448890686035, -0.4793287515640259, -0.27071261405944824, -0.062096357345581055, 0.14651978015899658, 0.3551359176635742, 0.5637520551681519, 0.7723682522773743, 0.9809844493865967, 1.1896005868911743, 1.398216724395752, 1.6068329811096191, 1.8154491186141968, 2.0240652561187744, 2.2326815128326416, 2.4412975311279297, 2.649913787841797, 2.858530044555664, 3.067146062850952, 3.2757623195648193, 3.4843783378601074, 3.6929945945739746]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 0.0, 7.0, 6.0, 11.0, 15.0, 15.0, 33.0, 35.0, 42.0, 83.0, 122.0, 208.0, 405.0, 816.0, 1878.0, 5948.0, 30288.0, 689824.0, 3363468.0, 83848.0, 11789.0, 3156.0, 1147.0, 517.0, 239.0, 164.0, 71.0, 50.0, 31.0, 21.0, 16.0, 10.0, 4.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.705078125, -0.680938720703125, -0.65679931640625, -0.632659912109375, -0.6085205078125, -0.584381103515625, -0.56024169921875, -0.536102294921875, -0.511962890625, -0.487823486328125, -0.46368408203125, -0.439544677734375, -0.4154052734375, -0.391265869140625, -0.36712646484375, -0.342987060546875, -0.31884765625, -0.294708251953125, -0.27056884765625, -0.246429443359375, -0.2222900390625, -0.198150634765625, -0.17401123046875, -0.149871826171875, -0.125732421875, -0.101593017578125, -0.07745361328125, -0.053314208984375, -0.0291748046875, -0.005035400390625, 0.01910400390625, 0.043243408203125, 0.0673828125, 0.091522216796875, 0.11566162109375, 0.139801025390625, 0.1639404296875, 0.188079833984375, 0.21221923828125, 0.236358642578125, 0.260498046875, 0.284637451171875, 0.30877685546875, 0.332916259765625, 0.3570556640625, 0.381195068359375, 0.40533447265625, 0.429473876953125, 0.45361328125, 0.477752685546875, 0.50189208984375, 0.526031494140625, 0.5501708984375, 0.574310302734375, 0.59844970703125, 0.622589111328125, 0.646728515625, 0.670867919921875, 0.69500732421875, 0.719146728515625, 0.7432861328125, 0.767425537109375, 0.79156494140625, 0.815704345703125, 0.83984375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 8.0, 15.0, 20.0, 25.0, 31.0, 52.0, 79.0, 86.0, 92.0, 93.0, 99.0, 78.0, 75.0, 58.0, 55.0, 37.0, 32.0, 20.0, 19.0, 11.0, 9.0, 3.0, 6.0, 4.0, 0.0, 0.0, 2.0], "bins": [-0.63525390625, -0.6217784881591797, -0.6083030700683594, -0.5948276519775391, -0.5813522338867188, -0.5678768157958984, -0.5544013977050781, -0.5409259796142578, -0.5274505615234375, -0.5139751434326172, -0.5004997253417969, -0.48702430725097656, -0.47354888916015625, -0.46007347106933594, -0.4465980529785156, -0.4331226348876953, -0.419647216796875, -0.4061717987060547, -0.3926963806152344, -0.37922096252441406, -0.36574554443359375, -0.35227012634277344, -0.3387947082519531, -0.3253192901611328, -0.3118438720703125, -0.2983684539794922, -0.2848930358886719, -0.27141761779785156, -0.25794219970703125, -0.24446678161621094, -0.23099136352539062, -0.2175159454345703, -0.20404052734375, -0.1905651092529297, -0.17708969116210938, -0.16361427307128906, -0.15013885498046875, -0.13666343688964844, -0.12318801879882812, -0.10971260070800781, -0.0962371826171875, -0.08276176452636719, -0.06928634643554688, -0.05581092834472656, -0.04233551025390625, -0.028860092163085938, -0.015384674072265625, -0.0019092559814453125, 0.011566162109375, 0.025041580200195312, 0.038516998291015625, 0.05199241638183594, 0.06546783447265625, 0.07894325256347656, 0.09241867065429688, 0.10589408874511719, 0.1193695068359375, 0.1328449249267578, 0.14632034301757812, 0.15979576110839844, 0.17327117919921875, 0.18674659729003906, 0.20022201538085938, 0.2136974334716797, 0.2271728515625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 12.0, 18.0, 29.0, 35.0, 73.0, 127.0, 204.0, 427.0, 996.0, 3052.0, 13238.0, 96289.0, 3499490.0, 537995.0, 32501.0, 6702.0, 1869.0, 673.0, 285.0, 138.0, 67.0, 37.0, 10.0, 14.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92919921875, -0.8989791870117188, -0.8687591552734375, -0.8385391235351562, -0.808319091796875, -0.7780990600585938, -0.7478790283203125, -0.7176589965820312, -0.68743896484375, -0.6572189331054688, -0.6269989013671875, -0.5967788696289062, -0.566558837890625, -0.5363388061523438, -0.5061187744140625, -0.47589874267578125, -0.4456787109375, -0.41545867919921875, -0.3852386474609375, -0.35501861572265625, -0.324798583984375, -0.29457855224609375, -0.2643585205078125, -0.23413848876953125, -0.20391845703125, -0.17369842529296875, -0.1434783935546875, -0.11325836181640625, -0.083038330078125, -0.05281829833984375, -0.0225982666015625, 0.00762176513671875, 0.037841796875, 0.06806182861328125, 0.0982818603515625, 0.12850189208984375, 0.158721923828125, 0.18894195556640625, 0.2191619873046875, 0.24938201904296875, 0.27960205078125, 0.30982208251953125, 0.3400421142578125, 0.37026214599609375, 0.400482177734375, 0.43070220947265625, 0.4609222412109375, 0.49114227294921875, 0.5213623046875, 0.5515823364257812, 0.5818023681640625, 0.6120223999023438, 0.642242431640625, 0.6724624633789062, 0.7026824951171875, 0.7329025268554688, 0.76312255859375, 0.7933425903320312, 0.8235626220703125, 0.8537826538085938, 0.884002685546875, 0.9142227172851562, 0.9444427490234375, 0.9746627807617188, 1.0048828125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 5.0, 6.0, 8.0, 18.0, 19.0, 35.0, 43.0, 111.0, 208.0, 517.0, 1101.0, 1063.0, 467.0, 209.0, 97.0, 57.0, 39.0, 13.0, 14.0, 18.0, 8.0, 6.0, 5.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1611328125, -1.1305465698242188, -1.0999603271484375, -1.0693740844726562, -1.038787841796875, -1.0082015991210938, -0.9776153564453125, -0.9470291137695312, -0.91644287109375, -0.8858566284179688, -0.8552703857421875, -0.8246841430664062, -0.794097900390625, -0.7635116577148438, -0.7329254150390625, -0.7023391723632812, -0.6717529296875, -0.6411666870117188, -0.6105804443359375, -0.5799942016601562, -0.549407958984375, -0.5188217163085938, -0.4882354736328125, -0.45764923095703125, -0.42706298828125, -0.39647674560546875, -0.3658905029296875, -0.33530426025390625, -0.304718017578125, -0.27413177490234375, -0.2435455322265625, -0.21295928955078125, -0.182373046875, -0.15178680419921875, -0.1212005615234375, -0.09061431884765625, -0.060028076171875, -0.02944183349609375, 0.0011444091796875, 0.03173065185546875, 0.06231689453125, 0.09290313720703125, 0.1234893798828125, 0.15407562255859375, 0.184661865234375, 0.21524810791015625, 0.2458343505859375, 0.27642059326171875, 0.3070068359375, 0.33759307861328125, 0.3681793212890625, 0.39876556396484375, 0.429351806640625, 0.45993804931640625, 0.4905242919921875, 0.5211105346679688, 0.55169677734375, 0.5822830200195312, 0.6128692626953125, 0.6434555053710938, 0.674041748046875, 0.7046279907226562, 0.7352142333984375, 0.7658004760742188, 0.79638671875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 6.0, 14.0, 15.0, 45.0, 117.0, 210.0, 260.0, 165.0, 79.0, 36.0, 16.0, 7.0, 6.0, 5.0, 6.0, 5.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.605859279632568, -4.37527322769165, -4.144687175750732, -3.9141008853912354, -3.6835148334503174, -3.4529287815093994, -3.2223424911499023, -2.9917564392089844, -2.7611703872680664, -2.5305843353271484, -2.2999982833862305, -2.0694119930267334, -1.8388259410858154, -1.6082398891448975, -1.37765371799469, -1.1470675468444824, -0.9164814949035645, -0.6858953833580017, -0.45530927181243896, -0.22472316026687622, 0.0058629512786865234, 0.2364490032196045, 0.467035174369812, 0.6976213455200195, 0.9282073974609375, 1.1587934494018555, 1.389379620552063, 1.6199657917022705, 1.8505518436431885, 2.0811378955841064, 2.3117241859436035, 2.5423102378845215, 2.7728958129882812, 3.003481864929199, 3.234067916870117, 3.4646542072296143, 3.6952402591705322, 3.92582631111145, 4.156412601470947, 4.386998653411865, 4.617584705352783, 4.848170757293701, 5.078756809234619, 5.309342861175537, 5.539929389953613, 5.770515441894531, 6.001101493835449, 6.231687545776367, 6.462273597717285, 6.692859649658203, 6.923445701599121, 7.154031753540039, 7.384617805480957, 7.615203857421875, 7.845790386199951, 8.076375961303711, 8.306962966918945, 8.537549018859863, 8.768135070800781, 8.9987211227417, 9.229307174682617, 9.459893226623535, 9.690479278564453, 9.921066284179688, 10.151651382446289]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 7.0, 8.0, 11.0, 5.0, 9.0, 9.0, 17.0, 28.0, 33.0, 39.0, 51.0, 47.0, 49.0, 58.0, 47.0, 52.0, 73.0, 59.0, 61.0, 50.0, 49.0, 48.0, 47.0, 23.0, 23.0, 19.0, 23.0, 12.0, 7.0, 8.0, 5.0, 6.0, 4.0, 3.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.158969402313232, -4.044740676879883, -3.930511474609375, -3.8162827491760254, -3.7020537853240967, -3.587824821472168, -3.4735958576202393, -3.3593668937683105, -3.245138168334961, -3.1309092044830322, -3.0166802406311035, -2.902451515197754, -2.788222551345825, -2.6739935874938965, -2.5597646236419678, -2.445535659790039, -2.3313069343566895, -2.2170779705047607, -2.102849006652832, -1.9886201620101929, -1.8743913173675537, -1.760162353515625, -1.6459333896636963, -1.5317045450210571, -1.4174754619598389, -1.3032464981079102, -1.189017653465271, -1.0747886896133423, -0.9605598449707031, -0.8463308811187744, -0.7321019768714905, -0.6178730726242065, -0.5036442279815674, -0.38941532373428345, -0.2751864194869995, -0.1609574854373932, -0.04672858119010925, 0.06750035285949707, 0.181729257106781, 0.29595816135406494, 0.4101870656013489, 0.5244159698486328, 0.6386448740959167, 0.7528737783432007, 0.8671027421951294, 0.9813316464424133, 1.0955605506896973, 1.209789514541626, 1.3240183591842651, 1.4382473230361938, 1.552476167678833, 1.6667051315307617, 1.7809339761734009, 1.8951629400253296, 2.0093917846679688, 2.1236207485198975, 2.237849712371826, 2.352078676223755, 2.4663076400756836, 2.580536365509033, 2.694765329360962, 2.8089942932128906, 2.9232232570648193, 3.037452220916748, 3.1516809463500977]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 12.0, 9.0, 15.0, 25.0, 39.0, 66.0, 98.0, 154.0, 249.0, 488.0, 1023.0, 2280.0, 6035.0, 19341.0, 85988.0, 656213.0, 223819.0, 36281.0, 9973.0, 3507.0, 1392.0, 657.0, 349.0, 193.0, 119.0, 75.0, 49.0, 33.0, 24.0, 13.0, 10.0, 7.0, 4.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6025390625, -0.5781707763671875, -0.553802490234375, -0.5294342041015625, -0.50506591796875, -0.4806976318359375, -0.456329345703125, -0.4319610595703125, -0.4075927734375, -0.3832244873046875, -0.358856201171875, -0.3344879150390625, -0.31011962890625, -0.2857513427734375, -0.261383056640625, -0.2370147705078125, -0.212646484375, -0.1882781982421875, -0.163909912109375, -0.1395416259765625, -0.11517333984375, -0.0908050537109375, -0.066436767578125, -0.0420684814453125, -0.0177001953125, 0.0066680908203125, 0.031036376953125, 0.0554046630859375, 0.07977294921875, 0.1041412353515625, 0.128509521484375, 0.1528778076171875, 0.17724609375, 0.2016143798828125, 0.225982666015625, 0.2503509521484375, 0.27471923828125, 0.2990875244140625, 0.323455810546875, 0.3478240966796875, 0.3721923828125, 0.3965606689453125, 0.420928955078125, 0.4452972412109375, 0.46966552734375, 0.4940338134765625, 0.518402099609375, 0.5427703857421875, 0.567138671875, 0.5915069580078125, 0.615875244140625, 0.6402435302734375, 0.66461181640625, 0.6889801025390625, 0.713348388671875, 0.7377166748046875, 0.7620849609375, 0.7864532470703125, 0.810821533203125, 0.8351898193359375, 0.85955810546875, 0.8839263916015625, 0.908294677734375, 0.9326629638671875, 0.95703125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 4.0, 5.0, 4.0, 11.0, 9.0, 7.0, 14.0, 20.0, 30.0, 29.0, 41.0, 39.0, 54.0, 47.0, 71.0, 55.0, 64.0, 69.0, 72.0, 55.0, 40.0, 52.0, 28.0, 32.0, 35.0, 38.0, 17.0, 14.0, 16.0, 12.0, 7.0, 8.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.40087890625, -0.3913612365722656, -0.38184356689453125, -0.3723258972167969, -0.3628082275390625, -0.3532905578613281, -0.34377288818359375, -0.3342552185058594, -0.324737548828125, -0.3152198791503906, -0.30570220947265625, -0.2961845397949219, -0.2866668701171875, -0.2771492004394531, -0.26763153076171875, -0.2581138610839844, -0.24859619140625, -0.23907852172851562, -0.22956085205078125, -0.22004318237304688, -0.2105255126953125, -0.20100784301757812, -0.19149017333984375, -0.18197250366210938, -0.172454833984375, -0.16293716430664062, -0.15341949462890625, -0.14390182495117188, -0.1343841552734375, -0.12486648559570312, -0.11534881591796875, -0.10583114624023438, -0.0963134765625, -0.08679580688476562, -0.07727813720703125, -0.06776046752929688, -0.0582427978515625, -0.048725128173828125, -0.03920745849609375, -0.029689788818359375, -0.020172119140625, -0.010654449462890625, -0.00113677978515625, 0.008380889892578125, 0.0178985595703125, 0.027416229248046875, 0.03693389892578125, 0.046451568603515625, 0.05596923828125, 0.06548690795898438, 0.07500457763671875, 0.08452224731445312, 0.0940399169921875, 0.10355758666992188, 0.11307525634765625, 0.12259292602539062, 0.132110595703125, 0.14162826538085938, 0.15114593505859375, 0.16066360473632812, 0.1701812744140625, 0.17969894409179688, 0.18921661376953125, 0.19873428344726562, 0.208251953125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 7.0, 4.0, 7.0, 15.0, 18.0, 13.0, 14.0, 30.0, 31.0, 43.0, 67.0, 99.0, 134.0, 206.0, 311.0, 473.0, 791.0, 1633.0, 3761.0, 11035.0, 44415.0, 460732.0, 461216.0, 44597.0, 11233.0, 3775.0, 1745.0, 786.0, 443.0, 266.0, 182.0, 119.0, 89.0, 60.0, 54.0, 31.0, 29.0, 28.0, 23.0, 10.0, 12.0, 2.0, 5.0, 5.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.8056640625, -0.780487060546875, -0.75531005859375, -0.730133056640625, -0.7049560546875, -0.679779052734375, -0.65460205078125, -0.629425048828125, -0.604248046875, -0.579071044921875, -0.55389404296875, -0.528717041015625, -0.5035400390625, -0.478363037109375, -0.45318603515625, -0.428009033203125, -0.40283203125, -0.377655029296875, -0.35247802734375, -0.327301025390625, -0.3021240234375, -0.276947021484375, -0.25177001953125, -0.226593017578125, -0.201416015625, -0.176239013671875, -0.15106201171875, -0.125885009765625, -0.1007080078125, -0.075531005859375, -0.05035400390625, -0.025177001953125, 0.0, 0.025177001953125, 0.05035400390625, 0.075531005859375, 0.1007080078125, 0.125885009765625, 0.15106201171875, 0.176239013671875, 0.201416015625, 0.226593017578125, 0.25177001953125, 0.276947021484375, 0.3021240234375, 0.327301025390625, 0.35247802734375, 0.377655029296875, 0.40283203125, 0.428009033203125, 0.45318603515625, 0.478363037109375, 0.5035400390625, 0.528717041015625, 0.55389404296875, 0.579071044921875, 0.604248046875, 0.629425048828125, 0.65460205078125, 0.679779052734375, 0.7049560546875, 0.730133056640625, 0.75531005859375, 0.780487060546875, 0.8056640625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 9.0, 3.0, 3.0, 6.0, 8.0, 10.0, 6.0, 10.0, 16.0, 17.0, 18.0, 23.0, 31.0, 40.0, 26.0, 38.0, 44.0, 45.0, 42.0, 53.0, 44.0, 65.0, 58.0, 53.0, 43.0, 28.0, 36.0, 38.0, 27.0, 23.0, 23.0, 26.0, 14.0, 23.0, 8.0, 8.0, 9.0, 6.0, 4.0, 5.0, 2.0, 5.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.97412109375, -0.9413681030273438, -0.9086151123046875, -0.8758621215820312, -0.843109130859375, -0.8103561401367188, -0.7776031494140625, -0.7448501586914062, -0.71209716796875, -0.6793441772460938, -0.6465911865234375, -0.6138381958007812, -0.581085205078125, -0.5483322143554688, -0.5155792236328125, -0.48282623291015625, -0.4500732421875, -0.41732025146484375, -0.3845672607421875, -0.35181427001953125, -0.319061279296875, -0.28630828857421875, -0.2535552978515625, -0.22080230712890625, -0.18804931640625, -0.15529632568359375, -0.1225433349609375, -0.08979034423828125, -0.057037353515625, -0.02428436279296875, 0.0084686279296875, 0.04122161865234375, 0.073974609375, 0.10672760009765625, 0.1394805908203125, 0.17223358154296875, 0.204986572265625, 0.23773956298828125, 0.2704925537109375, 0.30324554443359375, 0.33599853515625, 0.36875152587890625, 0.4015045166015625, 0.43425750732421875, 0.467010498046875, 0.49976348876953125, 0.5325164794921875, 0.5652694702148438, 0.5980224609375, 0.6307754516601562, 0.6635284423828125, 0.6962814331054688, 0.729034423828125, 0.7617874145507812, 0.7945404052734375, 0.8272933959960938, 0.86004638671875, 0.8927993774414062, 0.9255523681640625, 0.9583053588867188, 0.991058349609375, 1.0238113403320312, 1.0565643310546875, 1.0893173217773438, 1.1220703125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 3.0, 9.0, 28.0, 39.0, 84.0, 244.0, 934.0, 6552.0, 215680.0, 809406.0, 13501.0, 1513.0, 345.0, 105.0, 43.0, 20.0, 10.0, 13.0, 8.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85205078125, -0.8228073120117188, -0.7935638427734375, -0.7643203735351562, -0.735076904296875, -0.7058334350585938, -0.6765899658203125, -0.6473464965820312, -0.61810302734375, -0.5888595581054688, -0.5596160888671875, -0.5303726196289062, -0.501129150390625, -0.47188568115234375, -0.4426422119140625, -0.41339874267578125, -0.3841552734375, -0.35491180419921875, -0.3256683349609375, -0.29642486572265625, -0.267181396484375, -0.23793792724609375, -0.2086944580078125, -0.17945098876953125, -0.15020751953125, -0.12096405029296875, -0.0917205810546875, -0.06247711181640625, -0.033233642578125, -0.00399017333984375, 0.0252532958984375, 0.05449676513671875, 0.083740234375, 0.11298370361328125, 0.1422271728515625, 0.17147064208984375, 0.200714111328125, 0.22995758056640625, 0.2592010498046875, 0.28844451904296875, 0.31768798828125, 0.34693145751953125, 0.3761749267578125, 0.40541839599609375, 0.434661865234375, 0.46390533447265625, 0.4931488037109375, 0.5223922729492188, 0.5516357421875, 0.5808792114257812, 0.6101226806640625, 0.6393661499023438, 0.668609619140625, 0.6978530883789062, 0.7270965576171875, 0.7563400268554688, 0.78558349609375, 0.8148269653320312, 0.8440704345703125, 0.8733139038085938, 0.902557373046875, 0.9318008422851562, 0.9610443115234375, 0.9902877807617188, 1.01953125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 5.0, 3.0, 5.0, 8.0, 3.0, 7.0, 8.0, 9.0, 9.0, 8.0, 10.0, 23.0, 23.0, 27.0, 57.0, 81.0, 107.0, 126.0, 132.0, 110.0, 62.0, 36.0, 25.0, 26.0, 23.0, 9.0, 10.0, 8.0, 11.0, 6.0, 9.0, 3.0, 1.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00010007619857788086, -9.708385914564133e-05, -9.40915197134018e-05, -9.109918028116226e-05, -8.810684084892273e-05, -8.51145014166832e-05, -8.212216198444366e-05, -7.912982255220413e-05, -7.61374831199646e-05, -7.314514368772507e-05, -7.015280425548553e-05, -6.7160464823246e-05, -6.416812539100647e-05, -6.117578595876694e-05, -5.8183446526527405e-05, -5.519110709428787e-05, -5.219876766204834e-05, -4.920642822980881e-05, -4.6214088797569275e-05, -4.322174936532974e-05, -4.022940993309021e-05, -3.723707050085068e-05, -3.4244731068611145e-05, -3.125239163637161e-05, -2.826005220413208e-05, -2.5267712771892548e-05, -2.2275373339653015e-05, -1.9283033907413483e-05, -1.629069447517395e-05, -1.3298355042934418e-05, -1.0306015610694885e-05, -7.313676178455353e-06, -4.32133674621582e-06, -1.3289973139762878e-06, 1.6633421182632446e-06, 4.655681550502777e-06, 7.64802098274231e-06, 1.0640360414981842e-05, 1.3632699847221375e-05, 1.6625039279460907e-05, 1.961737871170044e-05, 2.2609718143939972e-05, 2.5602057576179504e-05, 2.8594397008419037e-05, 3.158673644065857e-05, 3.45790758728981e-05, 3.7571415305137634e-05, 4.056375473737717e-05, 4.35560941696167e-05, 4.654843360185623e-05, 4.9540773034095764e-05, 5.25331124663353e-05, 5.552545189857483e-05, 5.851779133081436e-05, 6.15101307630539e-05, 6.450247019529343e-05, 6.749480962753296e-05, 7.048714905977249e-05, 7.347948849201202e-05, 7.647182792425156e-05, 7.946416735649109e-05, 8.245650678873062e-05, 8.544884622097015e-05, 8.844118565320969e-05, 9.143352508544922e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 6.0, 3.0, 9.0, 9.0, 19.0, 25.0, 52.0, 80.0, 145.0, 342.0, 794.0, 2072.0, 8184.0, 65989.0, 851354.0, 104778.0, 10666.0, 2395.0, 844.0, 355.0, 194.0, 119.0, 43.0, 31.0, 16.0, 12.0, 8.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6318359375, -0.6135635375976562, -0.5952911376953125, -0.5770187377929688, -0.558746337890625, -0.5404739379882812, -0.5222015380859375, -0.5039291381835938, -0.48565673828125, -0.46738433837890625, -0.4491119384765625, -0.43083953857421875, -0.412567138671875, -0.39429473876953125, -0.3760223388671875, -0.35774993896484375, -0.3394775390625, -0.32120513916015625, -0.3029327392578125, -0.28466033935546875, -0.266387939453125, -0.24811553955078125, -0.2298431396484375, -0.21157073974609375, -0.19329833984375, -0.17502593994140625, -0.1567535400390625, -0.13848114013671875, -0.120208740234375, -0.10193634033203125, -0.0836639404296875, -0.06539154052734375, -0.047119140625, -0.02884674072265625, -0.0105743408203125, 0.00769805908203125, 0.025970458984375, 0.04424285888671875, 0.0625152587890625, 0.08078765869140625, 0.09906005859375, 0.11733245849609375, 0.1356048583984375, 0.15387725830078125, 0.172149658203125, 0.19042205810546875, 0.2086944580078125, 0.22696685791015625, 0.2452392578125, 0.26351165771484375, 0.2817840576171875, 0.30005645751953125, 0.318328857421875, 0.33660125732421875, 0.3548736572265625, 0.37314605712890625, 0.39141845703125, 0.40969085693359375, 0.4279632568359375, 0.44623565673828125, 0.464508056640625, 0.48278045654296875, 0.5010528564453125, 0.5193252563476562, 0.53759765625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 3.0, 6.0, 7.0, 4.0, 4.0, 16.0, 16.0, 20.0, 15.0, 28.0, 34.0, 38.0, 52.0, 73.0, 88.0, 81.0, 77.0, 65.0, 80.0, 72.0, 43.0, 43.0, 21.0, 26.0, 20.0, 12.0, 13.0, 8.0, 10.0, 4.0, 10.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.218505859375, -0.20912933349609375, -0.1997528076171875, -0.19037628173828125, -0.180999755859375, -0.17162322998046875, -0.1622467041015625, -0.15287017822265625, -0.14349365234375, -0.13411712646484375, -0.1247406005859375, -0.11536407470703125, -0.105987548828125, -0.09661102294921875, -0.0872344970703125, -0.07785797119140625, -0.0684814453125, -0.05910491943359375, -0.0497283935546875, -0.04035186767578125, -0.030975341796875, -0.02159881591796875, -0.0122222900390625, -0.00284576416015625, 0.00653076171875, 0.01590728759765625, 0.0252838134765625, 0.03466033935546875, 0.044036865234375, 0.05341339111328125, 0.0627899169921875, 0.07216644287109375, 0.08154296875, 0.09091949462890625, 0.1002960205078125, 0.10967254638671875, 0.119049072265625, 0.12842559814453125, 0.1378021240234375, 0.14717864990234375, 0.15655517578125, 0.16593170166015625, 0.1753082275390625, 0.18468475341796875, 0.194061279296875, 0.20343780517578125, 0.2128143310546875, 0.22219085693359375, 0.2315673828125, 0.24094390869140625, 0.2503204345703125, 0.25969696044921875, 0.269073486328125, 0.27845001220703125, 0.2878265380859375, 0.29720306396484375, 0.30657958984375, 0.31595611572265625, 0.3253326416015625, 0.33470916748046875, 0.344085693359375, 0.35346221923828125, 0.3628387451171875, 0.37221527099609375, 0.381591796875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 5.0, 6.0, 20.0, 44.0, 84.0, 159.0, 268.0, 191.0, 100.0, 66.0, 24.0, 6.0, 8.0, 5.0, 8.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.225849151611328, -5.983249187469482, -5.740649700164795, -5.498049736022949, -5.2554497718811035, -5.012850284576416, -4.77025032043457, -4.527650833129883, -4.285050868988037, -4.042450904846191, -3.799851179122925, -3.557251453399658, -3.3146517276763916, -3.072052001953125, -2.8294520378112793, -2.5868523120880127, -2.344252347946167, -2.1016526222229004, -1.8590527772903442, -1.616452932357788, -1.3738532066345215, -1.1312533617019653, -0.8886535167694092, -0.6460537910461426, -0.4034539461135864, -0.16085414588451385, 0.08174565434455872, 0.3243454694747925, 0.5669452548027039, 0.8095450401306152, 1.0521448850631714, 1.294744610786438, 1.5373444557189941, 1.7799443006515503, 2.0225441455841064, 2.265143871307373, 2.5077435970306396, 2.7503433227539062, 2.992943286895752, 3.2355430126190186, 3.478142738342285, 3.7207424640655518, 3.9633424282073975, 4.205942153930664, 4.44854211807251, 4.691141605377197, 4.933741569519043, 5.1763410568237305, 5.418941497802734, 5.66154146194458, 5.904140949249268, 6.146740913391113, 6.389340877532959, 6.6319403648376465, 6.874540328979492, 7.11713981628418, 7.359739780426025, 7.602339744567871, 7.844939231872559, 8.087539672851562, 8.33013916015625, 8.572738647460938, 8.815338134765625, 9.057938575744629, 9.300538063049316]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 6.0, 8.0, 8.0, 6.0, 10.0, 10.0, 12.0, 18.0, 31.0, 28.0, 26.0, 37.0, 46.0, 54.0, 48.0, 46.0, 64.0, 69.0, 63.0, 73.0, 43.0, 53.0, 43.0, 24.0, 41.0, 30.0, 24.0, 19.0, 15.0, 11.0, 13.0, 3.0, 3.0, 7.0, 6.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8675172328948975, -3.7111971378326416, -3.5548770427703857, -3.398556709289551, -3.242236614227295, -3.085916519165039, -2.929596424102783, -2.7732763290405273, -2.6169562339782715, -2.4606361389160156, -2.3043160438537598, -2.147995948791504, -1.991675615310669, -1.835355520248413, -1.6790354251861572, -1.5227152109146118, -1.3663949966430664, -1.2100749015808105, -1.0537546873092651, -0.8974345922470093, -0.7411144375801086, -0.584794282913208, -0.42847418785095215, -0.27215397357940674, -0.11583387851715088, 0.04048626124858856, 0.196806401014328, 0.35312652587890625, 0.5094466805458069, 0.6657668352127075, 0.8220869302749634, 0.9784071445465088, 1.1347270011901855, 1.2910470962524414, 1.4473673105239868, 1.6036874055862427, 1.760007619857788, 1.916327714920044, 2.0726478099823, 2.2289681434631348, 2.3852882385253906, 2.5416083335876465, 2.6979284286499023, 2.854248523712158, 3.010568857192993, 3.166888952255249, 3.323209047317505, 3.47952938079834, 3.6358492374420166, 3.7921693325042725, 3.9484894275665283, 4.104809761047363, 4.261129856109619, 4.417449951171875, 4.573770046234131, 4.730090141296387, 4.886410236358643, 5.042730331420898, 5.199050426483154, 5.35537052154541, 5.511690616607666, 5.668010711669922, 5.824331283569336, 5.980651378631592, 6.136971473693848]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 3.0, 7.0, 7.0, 10.0, 13.0, 8.0, 18.0, 18.0, 30.0, 50.0, 71.0, 89.0, 154.0, 264.0, 516.0, 1033.0, 2329.0, 6182.0, 19518.0, 86226.0, 606947.0, 2741544.0, 606614.0, 89691.0, 21165.0, 6951.0, 2629.0, 1075.0, 488.0, 283.0, 152.0, 72.0, 40.0, 40.0, 15.0, 13.0, 11.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.52197265625, -0.5084152221679688, -0.4948577880859375, -0.48130035400390625, -0.467742919921875, -0.45418548583984375, -0.4406280517578125, -0.42707061767578125, -0.41351318359375, -0.39995574951171875, -0.3863983154296875, -0.37284088134765625, -0.359283447265625, -0.34572601318359375, -0.3321685791015625, -0.31861114501953125, -0.3050537109375, -0.29149627685546875, -0.2779388427734375, -0.26438140869140625, -0.250823974609375, -0.23726654052734375, -0.2237091064453125, -0.21015167236328125, -0.19659423828125, -0.18303680419921875, -0.1694793701171875, -0.15592193603515625, -0.142364501953125, -0.12880706787109375, -0.1152496337890625, -0.10169219970703125, -0.088134765625, -0.07457733154296875, -0.0610198974609375, -0.04746246337890625, -0.033905029296875, -0.02034759521484375, -0.0067901611328125, 0.00676727294921875, 0.02032470703125, 0.03388214111328125, 0.0474395751953125, 0.06099700927734375, 0.074554443359375, 0.08811187744140625, 0.1016693115234375, 0.11522674560546875, 0.1287841796875, 0.14234161376953125, 0.1558990478515625, 0.16945648193359375, 0.183013916015625, 0.19657135009765625, 0.2101287841796875, 0.22368621826171875, 0.23724365234375, 0.25080108642578125, 0.2643585205078125, 0.27791595458984375, 0.291473388671875, 0.30503082275390625, 0.3185882568359375, 0.33214569091796875, 0.345703125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 5.0, 3.0, 8.0, 16.0, 13.0, 22.0, 18.0, 30.0, 36.0, 51.0, 44.0, 62.0, 53.0, 65.0, 70.0, 82.0, 45.0, 55.0, 59.0, 53.0, 38.0, 34.0, 36.0, 22.0, 23.0, 13.0, 12.0, 13.0, 11.0, 7.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.338623046875, -0.3295001983642578, -0.3203773498535156, -0.31125450134277344, -0.30213165283203125, -0.29300880432128906, -0.2838859558105469, -0.2747631072998047, -0.2656402587890625, -0.2565174102783203, -0.24739456176757812, -0.23827171325683594, -0.22914886474609375, -0.22002601623535156, -0.21090316772460938, -0.2017803192138672, -0.192657470703125, -0.1835346221923828, -0.17441177368164062, -0.16528892517089844, -0.15616607666015625, -0.14704322814941406, -0.13792037963867188, -0.1287975311279297, -0.1196746826171875, -0.11055183410644531, -0.10142898559570312, -0.09230613708496094, -0.08318328857421875, -0.07406044006347656, -0.06493759155273438, -0.05581474304199219, -0.04669189453125, -0.03756904602050781, -0.028446197509765625, -0.019323348999023438, -0.01020050048828125, -0.0010776519775390625, 0.008045196533203125, 0.017168045043945312, 0.0262908935546875, 0.03541374206542969, 0.044536590576171875, 0.05365943908691406, 0.06278228759765625, 0.07190513610839844, 0.08102798461914062, 0.09015083312988281, 0.099273681640625, 0.10839653015136719, 0.11751937866210938, 0.12664222717285156, 0.13576507568359375, 0.14488792419433594, 0.15401077270507812, 0.1631336212158203, 0.1722564697265625, 0.1813793182373047, 0.19050216674804688, 0.19962501525878906, 0.20874786376953125, 0.21787071228027344, 0.22699356079101562, 0.2361164093017578, 0.2452392578125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 7.0, 4.0, 9.0, 10.0, 18.0, 22.0, 41.0, 57.0, 91.0, 162.0, 298.0, 555.0, 1198.0, 2847.0, 8083.0, 30450.0, 153749.0, 2128399.0, 1700861.0, 129022.0, 26229.0, 7571.0, 2495.0, 1050.0, 457.0, 243.0, 135.0, 76.0, 54.0, 36.0, 19.0, 16.0, 3.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.638671875, -0.619293212890625, -0.59991455078125, -0.580535888671875, -0.5611572265625, -0.541778564453125, -0.52239990234375, -0.503021240234375, -0.483642578125, -0.464263916015625, -0.44488525390625, -0.425506591796875, -0.4061279296875, -0.386749267578125, -0.36737060546875, -0.347991943359375, -0.32861328125, -0.309234619140625, -0.28985595703125, -0.270477294921875, -0.2510986328125, -0.231719970703125, -0.21234130859375, -0.192962646484375, -0.173583984375, -0.154205322265625, -0.13482666015625, -0.115447998046875, -0.0960693359375, -0.076690673828125, -0.05731201171875, -0.037933349609375, -0.0185546875, 0.000823974609375, 0.02020263671875, 0.039581298828125, 0.0589599609375, 0.078338623046875, 0.09771728515625, 0.117095947265625, 0.136474609375, 0.155853271484375, 0.17523193359375, 0.194610595703125, 0.2139892578125, 0.233367919921875, 0.25274658203125, 0.272125244140625, 0.29150390625, 0.310882568359375, 0.33026123046875, 0.349639892578125, 0.3690185546875, 0.388397216796875, 0.40777587890625, 0.427154541015625, 0.446533203125, 0.465911865234375, 0.48529052734375, 0.504669189453125, 0.5240478515625, 0.543426513671875, 0.56280517578125, 0.582183837890625, 0.6015625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 6.0, 17.0, 17.0, 21.0, 19.0, 37.0, 49.0, 74.0, 85.0, 138.0, 238.0, 353.0, 595.0, 728.0, 609.0, 369.0, 218.0, 138.0, 105.0, 71.0, 43.0, 44.0, 23.0, 15.0, 10.0, 15.0, 9.0, 3.0, 4.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.814453125, -0.7908248901367188, -0.7671966552734375, -0.7435684204101562, -0.719940185546875, -0.6963119506835938, -0.6726837158203125, -0.6490554809570312, -0.62542724609375, -0.6017990112304688, -0.5781707763671875, -0.5545425415039062, -0.530914306640625, -0.5072860717773438, -0.4836578369140625, -0.46002960205078125, -0.4364013671875, -0.41277313232421875, -0.3891448974609375, -0.36551666259765625, -0.341888427734375, -0.31826019287109375, -0.2946319580078125, -0.27100372314453125, -0.24737548828125, -0.22374725341796875, -0.2001190185546875, -0.17649078369140625, -0.152862548828125, -0.12923431396484375, -0.1056060791015625, -0.08197784423828125, -0.058349609375, -0.03472137451171875, -0.0110931396484375, 0.01253509521484375, 0.036163330078125, 0.05979156494140625, 0.0834197998046875, 0.10704803466796875, 0.13067626953125, 0.15430450439453125, 0.1779327392578125, 0.20156097412109375, 0.225189208984375, 0.24881744384765625, 0.2724456787109375, 0.29607391357421875, 0.3197021484375, 0.34333038330078125, 0.3669586181640625, 0.39058685302734375, 0.414215087890625, 0.43784332275390625, 0.4614715576171875, 0.48509979248046875, 0.50872802734375, 0.5323562622070312, 0.5559844970703125, 0.5796127319335938, 0.603240966796875, 0.6268692016601562, 0.6504974365234375, 0.6741256713867188, 0.69775390625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 7.0, 13.0, 46.0, 186.0, 389.0, 238.0, 79.0, 19.0, 12.0, 1.0, 1.0, 5.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.852357864379883, -15.406903266906738, -14.961448669433594, -14.515995025634766, -14.070540428161621, -13.625085830688477, -13.179632186889648, -12.734177589416504, -12.28872299194336, -11.843268394470215, -11.39781379699707, -10.952360153198242, -10.506905555725098, -10.061450958251953, -9.615997314453125, -9.17054271697998, -8.725088119506836, -8.279633522033691, -7.834179401397705, -7.388725280761719, -6.943270683288574, -6.49781608581543, -6.052361965179443, -5.606907844543457, -5.1614532470703125, -4.715998649597168, -4.270544528961182, -3.825090169906616, -3.379635810852051, -2.9341814517974854, -2.48872709274292, -2.0432727336883545, -1.597818374633789, -1.1523640155792236, -0.7069096565246582, -0.2614552974700928, 0.18399906158447266, 0.6294534206390381, 1.0749077796936035, 1.520362138748169, 1.9658164978027344, 2.4112708568573, 2.8567252159118652, 3.3021795749664307, 3.747633934020996, 4.193088531494141, 4.638542652130127, 5.083996772766113, 5.529451370239258, 5.974905967712402, 6.420360088348389, 6.865814208984375, 7.3112688064575195, 7.756723403930664, 8.202177047729492, 8.647631645202637, 9.093086242675781, 9.538540840148926, 9.98399543762207, 10.429449081420898, 10.874903678894043, 11.320358276367188, 11.765811920166016, 12.21126651763916, 12.656721115112305]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 6.0, 10.0, 11.0, 12.0, 15.0, 19.0, 22.0, 29.0, 26.0, 42.0, 34.0, 41.0, 39.0, 51.0, 48.0, 67.0, 64.0, 53.0, 57.0, 42.0, 44.0, 39.0, 42.0, 32.0, 36.0, 25.0, 14.0, 22.0, 14.0, 12.0, 9.0, 4.0, 7.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1665587425231934, -3.0406112670898438, -2.914663791656494, -2.7887163162231445, -2.662768840789795, -2.5368213653564453, -2.410874128341675, -2.284926652908325, -2.1589791774749756, -2.033031702041626, -1.9070842266082764, -1.7811368703842163, -1.6551893949508667, -1.529241919517517, -1.403294563293457, -1.2773470878601074, -1.1513996124267578, -1.0254521369934082, -0.8995047211647034, -0.7735573053359985, -0.6476098299026489, -0.5216623544692993, -0.3957149386405945, -0.26976752281188965, -0.14382004737854004, -0.017872601747512817, 0.1080748438835144, 0.23402228951454163, 0.35996973514556885, 0.48591721057891846, 0.6118646264076233, 0.7378120422363281, 0.8637590408325195, 0.9897065162658691, 1.1156539916992188, 1.2416013479232788, 1.3675488233566284, 1.493496298789978, 1.619443655014038, 1.7453911304473877, 1.8713386058807373, 1.997286081314087, 2.1232335567474365, 2.249181032180786, 2.3751282691955566, 2.5010757446289062, 2.627023220062256, 2.7529706954956055, 2.878918170928955, 3.0048656463623047, 3.1308131217956543, 3.256760597229004, 3.3827080726623535, 3.508655548095703, 3.6346027851104736, 3.7605502605438232, 3.886497735977173, 4.012444972991943, 4.138392448425293, 4.264339923858643, 4.390287399291992, 4.516234874725342, 4.642182350158691, 4.768129825592041, 4.894077301025391]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 8.0, 14.0, 14.0, 15.0, 34.0, 44.0, 73.0, 144.0, 230.0, 479.0, 1134.0, 2433.0, 6248.0, 17879.0, 61159.0, 266931.0, 519283.0, 122868.0, 32188.0, 10338.0, 3842.0, 1614.0, 726.0, 375.0, 195.0, 113.0, 60.0, 43.0, 22.0, 15.0, 8.0, 5.0, 9.0, 4.0, 3.0, 3.0, 0.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.765625, -0.7432708740234375, -0.720916748046875, -0.6985626220703125, -0.67620849609375, -0.6538543701171875, -0.631500244140625, -0.6091461181640625, -0.5867919921875, -0.5644378662109375, -0.542083740234375, -0.5197296142578125, -0.49737548828125, -0.4750213623046875, -0.452667236328125, -0.4303131103515625, -0.407958984375, -0.3856048583984375, -0.363250732421875, -0.3408966064453125, -0.31854248046875, -0.2961883544921875, -0.273834228515625, -0.2514801025390625, -0.2291259765625, -0.2067718505859375, -0.184417724609375, -0.1620635986328125, -0.13970947265625, -0.1173553466796875, -0.095001220703125, -0.0726470947265625, -0.05029296875, -0.0279388427734375, -0.005584716796875, 0.0167694091796875, 0.03912353515625, 0.0614776611328125, 0.083831787109375, 0.1061859130859375, 0.1285400390625, 0.1508941650390625, 0.173248291015625, 0.1956024169921875, 0.21795654296875, 0.2403106689453125, 0.262664794921875, 0.2850189208984375, 0.307373046875, 0.3297271728515625, 0.352081298828125, 0.3744354248046875, 0.39678955078125, 0.4191436767578125, 0.441497802734375, 0.4638519287109375, 0.4862060546875, 0.5085601806640625, 0.530914306640625, 0.5532684326171875, 0.57562255859375, 0.5979766845703125, 0.620330810546875, 0.6426849365234375, 0.6650390625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 2.0, 1.0, 4.0, 6.0, 7.0, 5.0, 8.0, 11.0, 13.0, 17.0, 24.0, 28.0, 37.0, 31.0, 38.0, 43.0, 47.0, 38.0, 45.0, 45.0, 42.0, 55.0, 40.0, 52.0, 48.0, 45.0, 38.0, 33.0, 31.0, 32.0, 26.0, 20.0, 23.0, 13.0, 17.0, 3.0, 10.0, 8.0, 3.0, 2.0, 7.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.208984375, -0.20178604125976562, -0.19458770751953125, -0.18738937377929688, -0.1801910400390625, -0.17299270629882812, -0.16579437255859375, -0.15859603881835938, -0.151397705078125, -0.14419937133789062, -0.13700103759765625, -0.12980270385742188, -0.1226043701171875, -0.11540603637695312, -0.10820770263671875, -0.10100936889648438, -0.09381103515625, -0.08661270141601562, -0.07941436767578125, -0.07221603393554688, -0.0650177001953125, -0.057819366455078125, -0.05062103271484375, -0.043422698974609375, -0.036224365234375, -0.029026031494140625, -0.02182769775390625, -0.014629364013671875, -0.0074310302734375, -0.000232696533203125, 0.00696563720703125, 0.014163970947265625, 0.0213623046875, 0.028560638427734375, 0.03575897216796875, 0.042957305908203125, 0.0501556396484375, 0.057353973388671875, 0.06455230712890625, 0.07175064086914062, 0.078948974609375, 0.08614730834960938, 0.09334564208984375, 0.10054397583007812, 0.1077423095703125, 0.11494064331054688, 0.12213897705078125, 0.12933731079101562, 0.13653564453125, 0.14373397827148438, 0.15093231201171875, 0.15813064575195312, 0.1653289794921875, 0.17252731323242188, 0.17972564697265625, 0.18692398071289062, 0.194122314453125, 0.20132064819335938, 0.20851898193359375, 0.21571731567382812, 0.2229156494140625, 0.23011398315429688, 0.23731231689453125, 0.24451065063476562, 0.251708984375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 13.0, 4.0, 15.0, 22.0, 28.0, 39.0, 42.0, 103.0, 132.0, 241.0, 363.0, 658.0, 1239.0, 2956.0, 9271.0, 62702.0, 840335.0, 110448.0, 12859.0, 3629.0, 1498.0, 764.0, 469.0, 258.0, 165.0, 96.0, 70.0, 47.0, 19.0, 21.0, 15.0, 10.0, 5.0, 5.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.416015625, -1.3712158203125, -1.326416015625, -1.2816162109375, -1.23681640625, -1.1920166015625, -1.147216796875, -1.1024169921875, -1.0576171875, -1.0128173828125, -0.968017578125, -0.9232177734375, -0.87841796875, -0.8336181640625, -0.788818359375, -0.7440185546875, -0.69921875, -0.6544189453125, -0.609619140625, -0.5648193359375, -0.52001953125, -0.4752197265625, -0.430419921875, -0.3856201171875, -0.3408203125, -0.2960205078125, -0.251220703125, -0.2064208984375, -0.16162109375, -0.1168212890625, -0.072021484375, -0.0272216796875, 0.017578125, 0.0623779296875, 0.107177734375, 0.1519775390625, 0.19677734375, 0.2415771484375, 0.286376953125, 0.3311767578125, 0.3759765625, 0.4207763671875, 0.465576171875, 0.5103759765625, 0.55517578125, 0.5999755859375, 0.644775390625, 0.6895751953125, 0.734375, 0.7791748046875, 0.823974609375, 0.8687744140625, 0.91357421875, 0.9583740234375, 1.003173828125, 1.0479736328125, 1.0927734375, 1.1375732421875, 1.182373046875, 1.2271728515625, 1.27197265625, 1.3167724609375, 1.361572265625, 1.4063720703125, 1.451171875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 5.0, 5.0, 5.0, 3.0, 6.0, 6.0, 8.0, 10.0, 15.0, 15.0, 12.0, 27.0, 27.0, 23.0, 19.0, 37.0, 33.0, 56.0, 35.0, 40.0, 54.0, 46.0, 54.0, 46.0, 53.0, 48.0, 37.0, 42.0, 33.0, 22.0, 28.0, 30.0, 18.0, 21.0, 21.0, 19.0, 11.0, 8.0, 9.0, 6.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.0732421875, -1.0408859252929688, -1.0085296630859375, -0.9761734008789062, -0.943817138671875, -0.9114608764648438, -0.8791046142578125, -0.8467483520507812, -0.81439208984375, -0.7820358276367188, -0.7496795654296875, -0.7173233032226562, -0.684967041015625, -0.6526107788085938, -0.6202545166015625, -0.5878982543945312, -0.5555419921875, -0.5231857299804688, -0.4908294677734375, -0.45847320556640625, -0.426116943359375, -0.39376068115234375, -0.3614044189453125, -0.32904815673828125, -0.29669189453125, -0.26433563232421875, -0.2319793701171875, -0.19962310791015625, -0.167266845703125, -0.13491058349609375, -0.1025543212890625, -0.07019805908203125, -0.037841796875, -0.00548553466796875, 0.0268707275390625, 0.05922698974609375, 0.091583251953125, 0.12393951416015625, 0.1562957763671875, 0.18865203857421875, 0.22100830078125, 0.25336456298828125, 0.2857208251953125, 0.31807708740234375, 0.350433349609375, 0.38278961181640625, 0.4151458740234375, 0.44750213623046875, 0.4798583984375, 0.5122146606445312, 0.5445709228515625, 0.5769271850585938, 0.609283447265625, 0.6416397094726562, 0.6739959716796875, 0.7063522338867188, 0.73870849609375, 0.7710647583007812, 0.8034210205078125, 0.8357772827148438, 0.868133544921875, 0.9004898071289062, 0.9328460693359375, 0.9652023315429688, 0.99755859375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 3.0, 12.0, 11.0, 19.0, 24.0, 46.0, 78.0, 152.0, 269.0, 604.0, 1524.0, 4888.0, 27215.0, 316705.0, 649864.0, 37563.0, 6354.0, 1800.0, 733.0, 317.0, 162.0, 102.0, 43.0, 23.0, 10.0, 12.0, 5.0, 6.0, 6.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55224609375, -0.5365028381347656, -0.5207595825195312, -0.5050163269042969, -0.4892730712890625, -0.4735298156738281, -0.45778656005859375, -0.4420433044433594, -0.426300048828125, -0.4105567932128906, -0.39481353759765625, -0.3790702819824219, -0.3633270263671875, -0.3475837707519531, -0.33184051513671875, -0.3160972595214844, -0.30035400390625, -0.2846107482910156, -0.26886749267578125, -0.2531242370605469, -0.2373809814453125, -0.22163772583007812, -0.20589447021484375, -0.19015121459960938, -0.174407958984375, -0.15866470336914062, -0.14292144775390625, -0.12717819213867188, -0.1114349365234375, -0.09569168090820312, -0.07994842529296875, -0.06420516967773438, -0.0484619140625, -0.032718658447265625, -0.01697540283203125, -0.001232147216796875, 0.0145111083984375, 0.030254364013671875, 0.04599761962890625, 0.061740875244140625, 0.077484130859375, 0.09322738647460938, 0.10897064208984375, 0.12471389770507812, 0.1404571533203125, 0.15620040893554688, 0.17194366455078125, 0.18768692016601562, 0.20343017578125, 0.21917343139648438, 0.23491668701171875, 0.2506599426269531, 0.2664031982421875, 0.2821464538574219, 0.29788970947265625, 0.3136329650878906, 0.329376220703125, 0.3451194763183594, 0.36086273193359375, 0.3766059875488281, 0.3923492431640625, 0.4080924987792969, 0.42383575439453125, 0.4395790100097656, 0.455322265625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 12.0, 4.0, 5.0, 9.0, 12.0, 11.0, 15.0, 23.0, 33.0, 49.0, 48.0, 86.0, 130.0, 110.0, 116.0, 77.0, 51.0, 29.0, 44.0, 26.0, 35.0, 16.0, 13.0, 12.0, 3.0, 6.0, 9.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001316070556640625, -0.0001277988776564598, -0.00012399069964885712, -0.00012018252164125443, -0.00011637434363365173, -0.00011256616562604904, -0.00010875798761844635, -0.00010494980961084366, -0.00010114163160324097, -9.733345359563828e-05, -9.352527558803558e-05, -8.971709758043289e-05, -8.59089195728302e-05, -8.210074156522751e-05, -7.829256355762482e-05, -7.448438555002213e-05, -7.067620754241943e-05, -6.686802953481674e-05, -6.305985152721405e-05, -5.925167351961136e-05, -5.544349551200867e-05, -5.1635317504405975e-05, -4.7827139496803284e-05, -4.401896148920059e-05, -4.02107834815979e-05, -3.640260547399521e-05, -3.259442746639252e-05, -2.8786249458789825e-05, -2.4978071451187134e-05, -2.1169893443584442e-05, -1.736171543598175e-05, -1.3553537428379059e-05, -9.745359420776367e-06, -5.9371814131736755e-06, -2.129003405570984e-06, 1.6791746020317078e-06, 5.487352609634399e-06, 9.295530617237091e-06, 1.3103708624839783e-05, 1.6911886632442474e-05, 2.0720064640045166e-05, 2.4528242647647858e-05, 2.833642065525055e-05, 3.214459866285324e-05, 3.595277667045593e-05, 3.9760954678058624e-05, 4.3569132685661316e-05, 4.737731069326401e-05, 5.11854887008667e-05, 5.499366670846939e-05, 5.880184471607208e-05, 6.261002272367477e-05, 6.641820073127747e-05, 7.022637873888016e-05, 7.403455674648285e-05, 7.784273475408554e-05, 8.165091276168823e-05, 8.545909076929092e-05, 8.926726877689362e-05, 9.307544678449631e-05, 9.6883624792099e-05, 0.00010069180279970169, 0.00010449998080730438, 0.00010830815881490707, 0.00011211633682250977]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 10.0, 11.0, 28.0, 19.0, 29.0, 60.0, 115.0, 152.0, 257.0, 440.0, 812.0, 1631.0, 3635.0, 13013.0, 89252.0, 780648.0, 132981.0, 16963.0, 4560.0, 1861.0, 848.0, 492.0, 268.0, 178.0, 95.0, 60.0, 46.0, 24.0, 15.0, 16.0, 8.0, 6.0, 9.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.490478515625, -0.4774284362792969, -0.46437835693359375, -0.4513282775878906, -0.4382781982421875, -0.4252281188964844, -0.41217803955078125, -0.3991279602050781, -0.386077880859375, -0.3730278015136719, -0.35997772216796875, -0.3469276428222656, -0.3338775634765625, -0.3208274841308594, -0.30777740478515625, -0.2947273254394531, -0.28167724609375, -0.2686271667480469, -0.25557708740234375, -0.24252700805664062, -0.2294769287109375, -0.21642684936523438, -0.20337677001953125, -0.19032669067382812, -0.177276611328125, -0.16422653198242188, -0.15117645263671875, -0.13812637329101562, -0.1250762939453125, -0.11202621459960938, -0.09897613525390625, -0.08592605590820312, -0.0728759765625, -0.059825897216796875, -0.04677581787109375, -0.033725738525390625, -0.0206756591796875, -0.007625579833984375, 0.00542449951171875, 0.018474578857421875, 0.031524658203125, 0.044574737548828125, 0.05762481689453125, 0.07067489624023438, 0.0837249755859375, 0.09677505493164062, 0.10982513427734375, 0.12287521362304688, 0.13592529296875, 0.14897537231445312, 0.16202545166015625, 0.17507553100585938, 0.1881256103515625, 0.20117568969726562, 0.21422576904296875, 0.22727584838867188, 0.240325927734375, 0.2533760070800781, 0.26642608642578125, 0.2794761657714844, 0.2925262451171875, 0.3055763244628906, 0.31862640380859375, 0.3316764831542969, 0.3447265625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 4.0, 5.0, 4.0, 7.0, 6.0, 12.0, 10.0, 17.0, 19.0, 22.0, 25.0, 33.0, 35.0, 46.0, 53.0, 65.0, 88.0, 80.0, 79.0, 54.0, 67.0, 56.0, 26.0, 43.0, 29.0, 21.0, 16.0, 14.0, 9.0, 15.0, 10.0, 7.0, 5.0, 3.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.284912109375, -0.27494049072265625, -0.2649688720703125, -0.25499725341796875, -0.245025634765625, -0.23505401611328125, -0.2250823974609375, -0.21511077880859375, -0.20513916015625, -0.19516754150390625, -0.1851959228515625, -0.17522430419921875, -0.165252685546875, -0.15528106689453125, -0.1453094482421875, -0.13533782958984375, -0.1253662109375, -0.11539459228515625, -0.1054229736328125, -0.09545135498046875, -0.085479736328125, -0.07550811767578125, -0.0655364990234375, -0.05556488037109375, -0.04559326171875, -0.03562164306640625, -0.0256500244140625, -0.01567840576171875, -0.005706787109375, 0.00426483154296875, 0.0142364501953125, 0.02420806884765625, 0.0341796875, 0.04415130615234375, 0.0541229248046875, 0.06409454345703125, 0.074066162109375, 0.08403778076171875, 0.0940093994140625, 0.10398101806640625, 0.11395263671875, 0.12392425537109375, 0.1338958740234375, 0.14386749267578125, 0.153839111328125, 0.16381072998046875, 0.1737823486328125, 0.18375396728515625, 0.1937255859375, 0.20369720458984375, 0.2136688232421875, 0.22364044189453125, 0.233612060546875, 0.24358367919921875, 0.2535552978515625, 0.26352691650390625, 0.27349853515625, 0.28347015380859375, 0.2934417724609375, 0.30341339111328125, 0.313385009765625, 0.32335662841796875, 0.3333282470703125, 0.34329986572265625, 0.353271484375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 8.0, 14.0, 23.0, 42.0, 86.0, 132.0, 248.0, 209.0, 99.0, 59.0, 32.0, 10.0, 15.0, 1.0, 4.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.947265625, -8.690665245056152, -8.434064865112305, -8.177465438842773, -7.920865058898926, -7.664264678955078, -7.4076642990112305, -7.151063919067383, -6.894464015960693, -6.637863636016846, -6.381263732910156, -6.124663352966309, -5.868062973022461, -5.6114630699157715, -5.354862689971924, -5.098262786865234, -4.841662406921387, -4.585062026977539, -4.32846212387085, -4.071861743927002, -3.8152616024017334, -3.558661460876465, -3.302061080932617, -3.0454609394073486, -2.78886079788208, -2.5322606563568115, -2.275660514831543, -2.0190601348876953, -1.7624599933624268, -1.5058598518371582, -1.2492595911026, -0.992659330368042, -0.7360601425170898, -0.4794599413871765, -0.22285974025726318, 0.033740460872650146, 0.2903406620025635, 0.546940803527832, 0.8035410642623901, 1.0601413249969482, 1.3167414665222168, 1.5733416080474854, 1.8299418687820435, 2.0865421295166016, 2.34314227104187, 2.5997424125671387, 2.8563427925109863, 3.112942934036255, 3.3695430755615234, 3.626143217086792, 3.8827433586120605, 4.139343738555908, 4.395943641662598, 4.652544021606445, 4.909144401550293, 5.165744781494141, 5.42234468460083, 5.678945064544678, 5.935544967651367, 6.192145347595215, 6.4487457275390625, 6.705345630645752, 6.9619460105896, 7.218545913696289, 7.475146293640137]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 9.0, 8.0, 12.0, 10.0, 19.0, 13.0, 20.0, 21.0, 21.0, 22.0, 26.0, 23.0, 24.0, 39.0, 42.0, 43.0, 43.0, 60.0, 44.0, 65.0, 55.0, 54.0, 42.0, 36.0, 27.0, 22.0, 27.0, 19.0, 23.0, 26.0, 17.0, 20.0, 13.0, 12.0, 13.0, 10.0, 7.0, 5.0, 2.0, 4.0, 0.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.5936570167541504, -3.4724414348602295, -3.3512256145477295, -3.2300100326538086, -3.1087944507598877, -2.9875786304473877, -2.866363048553467, -2.745147228240967, -2.623931646347046, -2.502716064453125, -2.381500244140625, -2.260284662246704, -2.139069080352783, -2.017853260040283, -1.8966376781463623, -1.7754219770431519, -1.654206395149231, -1.5329906940460205, -1.4117751121520996, -1.2905594110488892, -1.1693437099456787, -1.0481281280517578, -0.9269124269485474, -0.8056967258453369, -0.6844810843467712, -0.5632654428482056, -0.4420497417449951, -0.32083410024642944, -0.19961842894554138, -0.07840275764465332, 0.042812883853912354, 0.1640285849571228, 0.2852442264556885, 0.40645989775657654, 0.5276755690574646, 0.6488912105560303, 0.7701069116592407, 0.8913225531578064, 1.012538194656372, 1.1337538957595825, 1.254969596862793, 1.3761852979660034, 1.4974008798599243, 1.6186165809631348, 1.7398322820663452, 1.8610479831695557, 1.9822635650634766, 2.1034793853759766, 2.2246947288513184, 2.3459103107452393, 2.4671261310577393, 2.58834171295166, 2.709557294845581, 2.830773115158081, 2.951988697052002, 3.073204517364502, 3.194420099258423, 3.3156356811523438, 3.4368515014648438, 3.5580670833587646, 3.6792826652526855, 3.8004984855651855, 3.9217140674591064, 4.042929649353027, 4.164145469665527]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 5.0, 2.0, 3.0, 3.0, 8.0, 8.0, 12.0, 18.0, 36.0, 70.0, 151.0, 276.0, 598.0, 1584.0, 4416.0, 15006.0, 67717.0, 638766.0, 3042091.0, 359053.0, 47543.0, 11395.0, 3385.0, 1180.0, 475.0, 263.0, 104.0, 48.0, 19.0, 21.0, 10.0, 6.0, 3.0, 1.0, 5.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.420166015625, -0.4048271179199219, -0.38948822021484375, -0.3741493225097656, -0.3588104248046875, -0.3434715270996094, -0.32813262939453125, -0.3127937316894531, -0.297454833984375, -0.2821159362792969, -0.26677703857421875, -0.2514381408691406, -0.2360992431640625, -0.22076034545898438, -0.20542144775390625, -0.19008255004882812, -0.17474365234375, -0.15940475463867188, -0.14406585693359375, -0.12872695922851562, -0.1133880615234375, -0.09804916381835938, -0.08271026611328125, -0.06737136840820312, -0.052032470703125, -0.036693572998046875, -0.02135467529296875, -0.006015777587890625, 0.0093231201171875, 0.024662017822265625, 0.04000091552734375, 0.055339813232421875, 0.0706787109375, 0.08601760864257812, 0.10135650634765625, 0.11669540405273438, 0.1320343017578125, 0.14737319946289062, 0.16271209716796875, 0.17805099487304688, 0.193389892578125, 0.20872879028320312, 0.22406768798828125, 0.23940658569335938, 0.2547454833984375, 0.2700843811035156, 0.28542327880859375, 0.3007621765136719, 0.31610107421875, 0.3314399719238281, 0.34677886962890625, 0.3621177673339844, 0.3774566650390625, 0.3927955627441406, 0.40813446044921875, 0.4234733581542969, 0.438812255859375, 0.4541511535644531, 0.46949005126953125, 0.4848289489746094, 0.5001678466796875, 0.5155067443847656, 0.5308456420898438, 0.5461845397949219, 0.5615234375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 11.0, 7.0, 6.0, 15.0, 12.0, 21.0, 24.0, 25.0, 23.0, 38.0, 35.0, 43.0, 47.0, 38.0, 49.0, 61.0, 44.0, 61.0, 70.0, 40.0, 38.0, 55.0, 37.0, 37.0, 23.0, 33.0, 18.0, 27.0, 6.0, 15.0, 9.0, 6.0, 9.0, 4.0, 1.0, 5.0, 0.0, 3.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.250732421875, -0.24303436279296875, -0.2353363037109375, -0.22763824462890625, -0.219940185546875, -0.21224212646484375, -0.2045440673828125, -0.19684600830078125, -0.18914794921875, -0.18144989013671875, -0.1737518310546875, -0.16605377197265625, -0.158355712890625, -0.15065765380859375, -0.1429595947265625, -0.13526153564453125, -0.1275634765625, -0.11986541748046875, -0.1121673583984375, -0.10446929931640625, -0.096771240234375, -0.08907318115234375, -0.0813751220703125, -0.07367706298828125, -0.06597900390625, -0.05828094482421875, -0.0505828857421875, -0.04288482666015625, -0.035186767578125, -0.02748870849609375, -0.0197906494140625, -0.01209259033203125, -0.00439453125, 0.00330352783203125, 0.0110015869140625, 0.01869964599609375, 0.026397705078125, 0.03409576416015625, 0.0417938232421875, 0.04949188232421875, 0.05718994140625, 0.06488800048828125, 0.0725860595703125, 0.08028411865234375, 0.087982177734375, 0.09568023681640625, 0.1033782958984375, 0.11107635498046875, 0.1187744140625, 0.12647247314453125, 0.1341705322265625, 0.14186859130859375, 0.149566650390625, 0.15726470947265625, 0.1649627685546875, 0.17266082763671875, 0.18035888671875, 0.18805694580078125, 0.1957550048828125, 0.20345306396484375, 0.211151123046875, 0.21884918212890625, 0.2265472412109375, 0.23424530029296875, 0.241943359375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 0.0, 3.0, 6.0, 4.0, 8.0, 7.0, 26.0, 51.0, 114.0, 351.0, 1125.0, 5396.0, 48563.0, 2653435.0, 1445537.0, 33909.0, 4153.0, 1005.0, 324.0, 122.0, 63.0, 42.0, 21.0, 11.0, 5.0, 5.0, 2.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6240234375, -0.5892333984375, -0.554443359375, -0.5196533203125, -0.48486328125, -0.4500732421875, -0.415283203125, -0.3804931640625, -0.345703125, -0.3109130859375, -0.276123046875, -0.2413330078125, -0.20654296875, -0.1717529296875, -0.136962890625, -0.1021728515625, -0.0673828125, -0.0325927734375, 0.002197265625, 0.0369873046875, 0.07177734375, 0.1065673828125, 0.141357421875, 0.1761474609375, 0.2109375, 0.2457275390625, 0.280517578125, 0.3153076171875, 0.35009765625, 0.3848876953125, 0.419677734375, 0.4544677734375, 0.4892578125, 0.5240478515625, 0.558837890625, 0.5936279296875, 0.62841796875, 0.6632080078125, 0.697998046875, 0.7327880859375, 0.767578125, 0.8023681640625, 0.837158203125, 0.8719482421875, 0.90673828125, 0.9415283203125, 0.976318359375, 1.0111083984375, 1.0458984375, 1.0806884765625, 1.115478515625, 1.1502685546875, 1.18505859375, 1.2198486328125, 1.254638671875, 1.2894287109375, 1.32421875, 1.3590087890625, 1.393798828125, 1.4285888671875, 1.46337890625, 1.4981689453125, 1.532958984375, 1.5677490234375, 1.6025390625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 8.0, 11.0, 15.0, 17.0, 13.0, 30.0, 19.0, 52.0, 68.0, 112.0, 179.0, 298.0, 496.0, 744.0, 714.0, 523.0, 256.0, 181.0, 110.0, 52.0, 47.0, 39.0, 23.0, 24.0, 13.0, 8.0, 6.0, 5.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.87255859375, -0.8495864868164062, -0.8266143798828125, -0.8036422729492188, -0.780670166015625, -0.7576980590820312, -0.7347259521484375, -0.7117538452148438, -0.68878173828125, -0.6658096313476562, -0.6428375244140625, -0.6198654174804688, -0.596893310546875, -0.5739212036132812, -0.5509490966796875, -0.5279769897460938, -0.5050048828125, -0.48203277587890625, -0.4590606689453125, -0.43608856201171875, -0.413116455078125, -0.39014434814453125, -0.3671722412109375, -0.34420013427734375, -0.32122802734375, -0.29825592041015625, -0.2752838134765625, -0.25231170654296875, -0.229339599609375, -0.20636749267578125, -0.1833953857421875, -0.16042327880859375, -0.137451171875, -0.11447906494140625, -0.0915069580078125, -0.06853485107421875, -0.045562744140625, -0.02259063720703125, 0.0003814697265625, 0.02335357666015625, 0.04632568359375, 0.06929779052734375, 0.0922698974609375, 0.11524200439453125, 0.138214111328125, 0.16118621826171875, 0.1841583251953125, 0.20713043212890625, 0.2301025390625, 0.25307464599609375, 0.2760467529296875, 0.29901885986328125, 0.321990966796875, 0.34496307373046875, 0.3679351806640625, 0.39090728759765625, 0.41387939453125, 0.43685150146484375, 0.4598236083984375, 0.48279571533203125, 0.505767822265625, 0.5287399291992188, 0.5517120361328125, 0.5746841430664062, 0.59765625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 11.0, 29.0, 66.0, 145.0, 224.0, 233.0, 161.0, 59.0, 32.0, 11.0, 5.0, 3.0, 5.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.38394546508789, -10.117875099182129, -9.85180377960205, -9.585733413696289, -9.319662094116211, -9.05359172821045, -8.787521362304688, -8.52145004272461, -8.255379676818848, -7.989308834075928, -7.723237991333008, -7.457167625427246, -7.191096782684326, -6.925025939941406, -6.6589555740356445, -6.392884731292725, -6.126813888549805, -5.860743045806885, -5.594672203063965, -5.328601837158203, -5.062530994415283, -4.796460151672363, -4.530389785766602, -4.264318943023682, -3.9982481002807617, -3.732177257537842, -3.466106653213501, -3.20003604888916, -2.9339652061462402, -2.6678943634033203, -2.4018237590789795, -2.1357531547546387, -1.869682788848877, -1.6036120653152466, -1.3375413417816162, -1.0714706182479858, -0.8053998947143555, -0.5393291711807251, -0.2732584476470947, -0.0071877241134643555, 0.258882999420166, 0.5249537229537964, 0.7910244464874268, 1.0570951700210571, 1.3231658935546875, 1.5892366170883179, 1.8553073406219482, 2.121377944946289, 2.387448787689209, 2.653519630432129, 2.9195902347564697, 3.1856608390808105, 3.4517316818237305, 3.7178025245666504, 3.983873128890991, 4.249943733215332, 4.516014575958252, 4.782085418701172, 5.048155784606934, 5.3142266273498535, 5.580297470092773, 5.846368312835693, 6.112439155578613, 6.378509521484375, 6.644580364227295]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 7.0, 8.0, 13.0, 16.0, 18.0, 22.0, 23.0, 27.0, 49.0, 45.0, 58.0, 41.0, 51.0, 42.0, 48.0, 64.0, 52.0, 61.0, 53.0, 52.0, 43.0, 28.0, 27.0, 28.0, 37.0, 18.0, 24.0, 13.0, 7.0, 10.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0366950035095215, -3.9216067790985107, -3.8065185546875, -3.6914303302764893, -3.5763421058654785, -3.4612536430358887, -3.346165657043457, -3.231077194213867, -3.1159889698028564, -3.0009007453918457, -2.885812520980835, -2.770724296569824, -2.6556360721588135, -2.5405478477478027, -2.425459384918213, -2.310371160507202, -2.1952829360961914, -2.0801947116851807, -1.96510648727417, -1.8500182628631592, -1.7349299192428589, -1.6198416948318481, -1.5047534704208374, -1.389665126800537, -1.2745771408081055, -1.1594889163970947, -1.044400691986084, -0.9293124079704285, -0.814224123954773, -0.6991358995437622, -0.5840476751327515, -0.46895939111709595, -0.35387110710144043, -0.2387828528881073, -0.12369461357593536, -0.008606374263763428, 0.1064818799495697, 0.22157013416290283, 0.3366583585739136, 0.4517466425895691, 0.5668348670005798, 0.6819230914115906, 0.7970113754272461, 0.9120995998382568, 1.0271878242492676, 1.1422760486602783, 1.257364273071289, 1.3724526166915894, 1.4875408411026, 1.6026290655136108, 1.7177172899246216, 1.8328056335449219, 1.9478938579559326, 2.0629820823669434, 2.178070306777954, 2.293158531188965, 2.4082467555999756, 2.5233349800109863, 2.638423204421997, 2.753511428833008, 2.8685996532440186, 2.9836878776550293, 3.098776340484619, 3.21386456489563, 3.3289527893066406]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 4.0, 9.0, 12.0, 17.0, 30.0, 50.0, 98.0, 146.0, 334.0, 627.0, 1430.0, 3360.0, 8573.0, 25077.0, 106572.0, 619050.0, 222239.0, 40155.0, 12304.0, 4682.0, 1974.0, 888.0, 430.0, 225.0, 120.0, 55.0, 44.0, 20.0, 9.0, 7.0, 5.0, 5.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79248046875, -0.7682342529296875, -0.743988037109375, -0.7197418212890625, -0.69549560546875, -0.6712493896484375, -0.647003173828125, -0.6227569580078125, -0.5985107421875, -0.5742645263671875, -0.550018310546875, -0.5257720947265625, -0.50152587890625, -0.4772796630859375, -0.453033447265625, -0.4287872314453125, -0.404541015625, -0.3802947998046875, -0.356048583984375, -0.3318023681640625, -0.30755615234375, -0.2833099365234375, -0.259063720703125, -0.2348175048828125, -0.2105712890625, -0.1863250732421875, -0.162078857421875, -0.1378326416015625, -0.11358642578125, -0.0893402099609375, -0.065093994140625, -0.0408477783203125, -0.0166015625, 0.0076446533203125, 0.031890869140625, 0.0561370849609375, 0.08038330078125, 0.1046295166015625, 0.128875732421875, 0.1531219482421875, 0.1773681640625, 0.2016143798828125, 0.225860595703125, 0.2501068115234375, 0.27435302734375, 0.2985992431640625, 0.322845458984375, 0.3470916748046875, 0.371337890625, 0.3955841064453125, 0.419830322265625, 0.4440765380859375, 0.46832275390625, 0.4925689697265625, 0.516815185546875, 0.5410614013671875, 0.5653076171875, 0.5895538330078125, 0.613800048828125, 0.6380462646484375, 0.66229248046875, 0.6865386962890625, 0.710784912109375, 0.7350311279296875, 0.75927734375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 8.0, 2.0, 11.0, 6.0, 9.0, 11.0, 13.0, 21.0, 14.0, 19.0, 27.0, 22.0, 30.0, 35.0, 34.0, 41.0, 36.0, 56.0, 48.0, 40.0, 43.0, 52.0, 55.0, 42.0, 34.0, 38.0, 47.0, 27.0, 30.0, 28.0, 21.0, 23.0, 20.0, 18.0, 4.0, 7.0, 6.0, 5.0, 6.0, 2.0, 2.0, 7.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2366943359375, -0.22927093505859375, -0.2218475341796875, -0.21442413330078125, -0.207000732421875, -0.19957733154296875, -0.1921539306640625, -0.18473052978515625, -0.17730712890625, -0.16988372802734375, -0.1624603271484375, -0.15503692626953125, -0.147613525390625, -0.14019012451171875, -0.1327667236328125, -0.12534332275390625, -0.117919921875, -0.11049652099609375, -0.1030731201171875, -0.09564971923828125, -0.088226318359375, -0.08080291748046875, -0.0733795166015625, -0.06595611572265625, -0.05853271484375, -0.05110931396484375, -0.0436859130859375, -0.03626251220703125, -0.028839111328125, -0.02141571044921875, -0.0139923095703125, -0.00656890869140625, 0.0008544921875, 0.00827789306640625, 0.0157012939453125, 0.02312469482421875, 0.030548095703125, 0.03797149658203125, 0.0453948974609375, 0.05281829833984375, 0.06024169921875, 0.06766510009765625, 0.0750885009765625, 0.08251190185546875, 0.089935302734375, 0.09735870361328125, 0.1047821044921875, 0.11220550537109375, 0.11962890625, 0.12705230712890625, 0.1344757080078125, 0.14189910888671875, 0.149322509765625, 0.15674591064453125, 0.1641693115234375, 0.17159271240234375, 0.17901611328125, 0.18643951416015625, 0.1938629150390625, 0.20128631591796875, 0.208709716796875, 0.21613311767578125, 0.2235565185546875, 0.23097991943359375, 0.2384033203125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 8.0, 11.0, 11.0, 17.0, 29.0, 45.0, 54.0, 72.0, 105.0, 158.0, 224.0, 378.0, 685.0, 1436.0, 4108.0, 17759.0, 197854.0, 774033.0, 40153.0, 6997.0, 2116.0, 953.0, 492.0, 266.0, 181.0, 119.0, 82.0, 60.0, 43.0, 33.0, 20.0, 11.0, 8.0, 5.0, 6.0, 6.0, 5.0, 6.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1328125, -1.0926513671875, -1.052490234375, -1.0123291015625, -0.97216796875, -0.9320068359375, -0.891845703125, -0.8516845703125, -0.8115234375, -0.7713623046875, -0.731201171875, -0.6910400390625, -0.65087890625, -0.6107177734375, -0.570556640625, -0.5303955078125, -0.490234375, -0.4500732421875, -0.409912109375, -0.3697509765625, -0.32958984375, -0.2894287109375, -0.249267578125, -0.2091064453125, -0.1689453125, -0.1287841796875, -0.088623046875, -0.0484619140625, -0.00830078125, 0.0318603515625, 0.072021484375, 0.1121826171875, 0.15234375, 0.1925048828125, 0.232666015625, 0.2728271484375, 0.31298828125, 0.3531494140625, 0.393310546875, 0.4334716796875, 0.4736328125, 0.5137939453125, 0.553955078125, 0.5941162109375, 0.63427734375, 0.6744384765625, 0.714599609375, 0.7547607421875, 0.794921875, 0.8350830078125, 0.875244140625, 0.9154052734375, 0.95556640625, 0.9957275390625, 1.035888671875, 1.0760498046875, 1.1162109375, 1.1563720703125, 1.196533203125, 1.2366943359375, 1.27685546875, 1.3170166015625, 1.357177734375, 1.3973388671875, 1.4375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 6.0, 5.0, 9.0, 10.0, 12.0, 13.0, 18.0, 14.0, 18.0, 18.0, 27.0, 28.0, 34.0, 51.0, 42.0, 57.0, 49.0, 51.0, 49.0, 49.0, 45.0, 35.0, 47.0, 37.0, 46.0, 37.0, 33.0, 33.0, 23.0, 14.0, 15.0, 17.0, 12.0, 12.0, 7.0, 5.0, 5.0, 7.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0791015625, -1.0443267822265625, -1.009552001953125, -0.9747772216796875, -0.94000244140625, -0.9052276611328125, -0.870452880859375, -0.8356781005859375, -0.8009033203125, -0.7661285400390625, -0.731353759765625, -0.6965789794921875, -0.66180419921875, -0.6270294189453125, -0.592254638671875, -0.5574798583984375, -0.522705078125, -0.4879302978515625, -0.453155517578125, -0.4183807373046875, -0.38360595703125, -0.3488311767578125, -0.314056396484375, -0.2792816162109375, -0.2445068359375, -0.2097320556640625, -0.174957275390625, -0.1401824951171875, -0.10540771484375, -0.0706329345703125, -0.035858154296875, -0.0010833740234375, 0.03369140625, 0.0684661865234375, 0.103240966796875, 0.1380157470703125, 0.17279052734375, 0.2075653076171875, 0.242340087890625, 0.2771148681640625, 0.3118896484375, 0.3466644287109375, 0.381439208984375, 0.4162139892578125, 0.45098876953125, 0.4857635498046875, 0.520538330078125, 0.5553131103515625, 0.590087890625, 0.6248626708984375, 0.659637451171875, 0.6944122314453125, 0.72918701171875, 0.7639617919921875, 0.798736572265625, 0.8335113525390625, 0.8682861328125, 0.9030609130859375, 0.937835693359375, 0.9726104736328125, 1.00738525390625, 1.0421600341796875, 1.076934814453125, 1.1117095947265625, 1.146484375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 8.0, 6.0, 8.0, 12.0, 23.0, 28.0, 49.0, 77.0, 116.0, 150.0, 253.0, 478.0, 966.0, 1990.0, 5527.0, 19179.0, 91863.0, 705869.0, 176527.0, 31712.0, 8307.0, 2844.0, 1185.0, 546.0, 303.0, 179.0, 119.0, 77.0, 60.0, 24.0, 21.0, 17.0, 8.0, 9.0, 5.0, 3.0, 2.0, 4.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2900390625, -0.27873992919921875, -0.2674407958984375, -0.25614166259765625, -0.244842529296875, -0.23354339599609375, -0.2222442626953125, -0.21094512939453125, -0.19964599609375, -0.18834686279296875, -0.1770477294921875, -0.16574859619140625, -0.154449462890625, -0.14315032958984375, -0.1318511962890625, -0.12055206298828125, -0.1092529296875, -0.09795379638671875, -0.0866546630859375, -0.07535552978515625, -0.064056396484375, -0.05275726318359375, -0.0414581298828125, -0.03015899658203125, -0.01885986328125, -0.00756072998046875, 0.0037384033203125, 0.01503753662109375, 0.026336669921875, 0.03763580322265625, 0.0489349365234375, 0.06023406982421875, 0.071533203125, 0.08283233642578125, 0.0941314697265625, 0.10543060302734375, 0.116729736328125, 0.12802886962890625, 0.1393280029296875, 0.15062713623046875, 0.16192626953125, 0.17322540283203125, 0.1845245361328125, 0.19582366943359375, 0.207122802734375, 0.21842193603515625, 0.2297210693359375, 0.24102020263671875, 0.2523193359375, 0.26361846923828125, 0.2749176025390625, 0.28621673583984375, 0.297515869140625, 0.30881500244140625, 0.3201141357421875, 0.33141326904296875, 0.34271240234375, 0.35401153564453125, 0.3653106689453125, 0.37660980224609375, 0.387908935546875, 0.39920806884765625, 0.4105072021484375, 0.42180633544921875, 0.43310546875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 5.0, 5.0, 10.0, 3.0, 6.0, 17.0, 15.0, 10.0, 19.0, 31.0, 37.0, 46.0, 82.0, 107.0, 149.0, 114.0, 79.0, 75.0, 51.0, 35.0, 18.0, 15.0, 14.0, 13.0, 8.0, 8.0, 9.0, 2.0, 7.0, 3.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011265277862548828, -0.00010897591710090637, -0.00010529905557632446, -0.00010162219405174255, -9.794533252716064e-05, -9.426847100257874e-05, -9.059160947799683e-05, -8.691474795341492e-05, -8.323788642883301e-05, -7.95610249042511e-05, -7.588416337966919e-05, -7.220730185508728e-05, -6.853044033050537e-05, -6.485357880592346e-05, -6.117671728134155e-05, -5.7499855756759644e-05, -5.3822994232177734e-05, -5.0146132707595825e-05, -4.6469271183013916e-05, -4.279240965843201e-05, -3.91155481338501e-05, -3.543868660926819e-05, -3.176182508468628e-05, -2.808496356010437e-05, -2.440810203552246e-05, -2.0731240510940552e-05, -1.7054378986358643e-05, -1.3377517461776733e-05, -9.700655937194824e-06, -6.023794412612915e-06, -2.346932888031006e-06, 1.3299286365509033e-06, 5.0067901611328125e-06, 8.683651685714722e-06, 1.2360513210296631e-05, 1.603737473487854e-05, 1.971423625946045e-05, 2.339109778404236e-05, 2.7067959308624268e-05, 3.074482083320618e-05, 3.4421682357788086e-05, 3.8098543882369995e-05, 4.1775405406951904e-05, 4.5452266931533813e-05, 4.912912845611572e-05, 5.280598998069763e-05, 5.648285150527954e-05, 6.015971302986145e-05, 6.383657455444336e-05, 6.751343607902527e-05, 7.119029760360718e-05, 7.486715912818909e-05, 7.8544020652771e-05, 8.22208821773529e-05, 8.589774370193481e-05, 8.957460522651672e-05, 9.325146675109863e-05, 9.692832827568054e-05, 0.00010060518980026245, 0.00010428205132484436, 0.00010795891284942627, 0.00011163577437400818, 0.00011531263589859009, 0.000118989497423172, 0.0001226663589477539]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 6.0, 4.0, 8.0, 4.0, 11.0, 19.0, 23.0, 48.0, 71.0, 124.0, 246.0, 458.0, 999.0, 2373.0, 8925.0, 63511.0, 813859.0, 137622.0, 14531.0, 3180.0, 1262.0, 568.0, 309.0, 160.0, 87.0, 52.0, 27.0, 24.0, 14.0, 9.0, 8.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46484375, -0.449676513671875, -0.43450927734375, -0.419342041015625, -0.4041748046875, -0.389007568359375, -0.37384033203125, -0.358673095703125, -0.343505859375, -0.328338623046875, -0.31317138671875, -0.298004150390625, -0.2828369140625, -0.267669677734375, -0.25250244140625, -0.237335205078125, -0.22216796875, -0.207000732421875, -0.19183349609375, -0.176666259765625, -0.1614990234375, -0.146331787109375, -0.13116455078125, -0.115997314453125, -0.100830078125, -0.085662841796875, -0.07049560546875, -0.055328369140625, -0.0401611328125, -0.024993896484375, -0.00982666015625, 0.005340576171875, 0.0205078125, 0.035675048828125, 0.05084228515625, 0.066009521484375, 0.0811767578125, 0.096343994140625, 0.11151123046875, 0.126678466796875, 0.141845703125, 0.157012939453125, 0.17218017578125, 0.187347412109375, 0.2025146484375, 0.217681884765625, 0.23284912109375, 0.248016357421875, 0.26318359375, 0.278350830078125, 0.29351806640625, 0.308685302734375, 0.3238525390625, 0.339019775390625, 0.35418701171875, 0.369354248046875, 0.384521484375, 0.399688720703125, 0.41485595703125, 0.430023193359375, 0.4451904296875, 0.460357666015625, 0.47552490234375, 0.490692138671875, 0.505859375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 9.0, 3.0, 5.0, 6.0, 5.0, 9.0, 9.0, 12.0, 21.0, 28.0, 30.0, 29.0, 37.0, 63.0, 65.0, 69.0, 84.0, 89.0, 90.0, 76.0, 51.0, 41.0, 32.0, 25.0, 24.0, 9.0, 13.0, 9.0, 11.0, 10.0, 8.0, 7.0, 6.0, 4.0, 6.0, 4.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3193359375, -0.3100013732910156, -0.30066680908203125, -0.2913322448730469, -0.2819976806640625, -0.2726631164550781, -0.26332855224609375, -0.2539939880371094, -0.244659423828125, -0.23532485961914062, -0.22599029541015625, -0.21665573120117188, -0.2073211669921875, -0.19798660278320312, -0.18865203857421875, -0.17931747436523438, -0.16998291015625, -0.16064834594726562, -0.15131378173828125, -0.14197921752929688, -0.1326446533203125, -0.12331008911132812, -0.11397552490234375, -0.10464096069335938, -0.095306396484375, -0.08597183227539062, -0.07663726806640625, -0.06730270385742188, -0.0579681396484375, -0.048633575439453125, -0.03929901123046875, -0.029964447021484375, -0.0206298828125, -0.011295318603515625, -0.00196075439453125, 0.007373809814453125, 0.0167083740234375, 0.026042938232421875, 0.03537750244140625, 0.044712066650390625, 0.054046630859375, 0.06338119506835938, 0.07271575927734375, 0.08205032348632812, 0.0913848876953125, 0.10071945190429688, 0.11005401611328125, 0.11938858032226562, 0.12872314453125, 0.13805770874023438, 0.14739227294921875, 0.15672683715820312, 0.1660614013671875, 0.17539596557617188, 0.18473052978515625, 0.19406509399414062, 0.203399658203125, 0.21273422241210938, 0.22206878662109375, 0.23140335083007812, 0.2407379150390625, 0.2500724792480469, 0.25940704345703125, 0.2687416076660156, 0.278076171875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 10.0, 16.0, 50.0, 158.0, 322.0, 247.0, 121.0, 38.0, 12.0, 11.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.049071311950684, -11.713863372802734, -11.378656387329102, -11.043448448181152, -10.708240509033203, -10.37303352355957, -10.037825584411621, -9.702617645263672, -9.367410659790039, -9.03220272064209, -8.696995735168457, -8.361787796020508, -8.026580810546875, -7.691372871398926, -7.356164932250977, -7.0209574699401855, -6.6857500076293945, -6.3505425453186035, -6.0153350830078125, -5.680127143859863, -5.344919681549072, -5.009712219238281, -4.674504280090332, -4.339296817779541, -4.00408935546875, -3.668881893157959, -3.333674192428589, -2.9984664916992188, -2.6632590293884277, -2.3280515670776367, -1.9928438663482666, -1.6576361656188965, -1.322427749633789, -0.9872201681137085, -0.6520125865936279, -0.31680500507354736, 0.018402576446533203, 0.35361015796661377, 0.6888177394866943, 1.0240254402160645, 1.3592329025268555, 1.694440484046936, 2.0296480655670166, 2.3648557662963867, 2.7000632286071777, 3.0352706909179688, 3.370478391647339, 3.705686092376709, 4.0408935546875, 4.376101016998291, 4.711308479309082, 5.046516418457031, 5.381723880767822, 5.716931343078613, 6.0521392822265625, 6.3873467445373535, 6.7225542068481445, 7.0577616691589355, 7.392969131469727, 7.728177070617676, 8.063385009765625, 8.398591995239258, 8.733799934387207, 9.069007873535156, 9.404214859008789]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 1.0, 3.0, 10.0, 4.0, 16.0, 9.0, 13.0, 17.0, 20.0, 23.0, 28.0, 29.0, 31.0, 28.0, 29.0, 54.0, 61.0, 82.0, 70.0, 75.0, 53.0, 52.0, 51.0, 32.0, 31.0, 31.0, 16.0, 13.0, 27.0, 13.0, 18.0, 11.0, 13.0, 7.0, 7.0, 4.0, 8.0, 5.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.941935062408447, -4.788825988769531, -4.635716915130615, -4.482607364654541, -4.329498291015625, -4.176389217376709, -4.023280143737793, -3.870171070098877, -3.717061758041382, -3.563952684402466, -3.4108433723449707, -3.2577342987060547, -3.1046252250671387, -2.9515159130096436, -2.7984068393707275, -2.6452975273132324, -2.4921884536743164, -2.3390793800354004, -2.1859700679779053, -2.0328609943389893, -1.8797518014907837, -1.7266426086425781, -1.573533535003662, -1.4204243421554565, -1.267315149307251, -1.1142059564590454, -0.9610968232154846, -0.8079876899719238, -0.6548784971237183, -0.5017693042755127, -0.3486601710319519, -0.1955510377883911, -0.04244184494018555, 0.11066731810569763, 0.2637764811515808, 0.416885644197464, 0.5699948072433472, 0.7231040000915527, 0.8762131333351135, 1.0293222665786743, 1.1824314594268799, 1.3355406522750854, 1.488649845123291, 1.641758918762207, 1.7948681116104126, 1.9479773044586182, 2.101086378097534, 2.2541956901550293, 2.4073047637939453, 2.5604138374328613, 2.7135231494903564, 2.8666322231292725, 3.0197415351867676, 3.1728506088256836, 3.3259596824645996, 3.4790687561035156, 3.6321780681610107, 3.7852871417999268, 3.938396453857422, 4.091505527496338, 4.244614601135254, 4.397724151611328, 4.550833225250244, 4.70394229888916, 4.857051372528076]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 8.0, 1.0, 2.0, 11.0, 10.0, 17.0, 16.0, 21.0, 35.0, 47.0, 95.0, 186.0, 376.0, 954.0, 2668.0, 8978.0, 44240.0, 579537.0, 3303145.0, 219755.0, 25205.0, 5815.0, 1839.0, 712.0, 258.0, 127.0, 85.0, 44.0, 21.0, 18.0, 21.0, 13.0, 10.0, 6.0, 6.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5654296875, -0.5479507446289062, -0.5304718017578125, -0.5129928588867188, -0.495513916015625, -0.47803497314453125, -0.4605560302734375, -0.44307708740234375, -0.42559814453125, -0.40811920166015625, -0.3906402587890625, -0.37316131591796875, -0.355682373046875, -0.33820343017578125, -0.3207244873046875, -0.30324554443359375, -0.2857666015625, -0.26828765869140625, -0.2508087158203125, -0.23332977294921875, -0.215850830078125, -0.19837188720703125, -0.1808929443359375, -0.16341400146484375, -0.14593505859375, -0.12845611572265625, -0.1109771728515625, -0.09349822998046875, -0.076019287109375, -0.05854034423828125, -0.0410614013671875, -0.02358245849609375, -0.006103515625, 0.01137542724609375, 0.0288543701171875, 0.04633331298828125, 0.063812255859375, 0.08129119873046875, 0.0987701416015625, 0.11624908447265625, 0.13372802734375, 0.15120697021484375, 0.1686859130859375, 0.18616485595703125, 0.203643798828125, 0.22112274169921875, 0.2386016845703125, 0.25608062744140625, 0.2735595703125, 0.29103851318359375, 0.3085174560546875, 0.32599639892578125, 0.343475341796875, 0.36095428466796875, 0.3784332275390625, 0.39591217041015625, 0.41339111328125, 0.43087005615234375, 0.4483489990234375, 0.46582794189453125, 0.483306884765625, 0.5007858276367188, 0.5182647705078125, 0.5357437133789062, 0.55322265625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 10.0, 13.0, 15.0, 16.0, 15.0, 18.0, 11.0, 26.0, 28.0, 33.0, 30.0, 42.0, 30.0, 53.0, 40.0, 43.0, 61.0, 56.0, 47.0, 39.0, 41.0, 40.0, 41.0, 41.0, 18.0, 33.0, 24.0, 25.0, 12.0, 16.0, 21.0, 21.0, 3.0, 7.0, 7.0, 2.0, 9.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.255859375, -0.2485485076904297, -0.24123764038085938, -0.23392677307128906, -0.22661590576171875, -0.21930503845214844, -0.21199417114257812, -0.2046833038330078, -0.1973724365234375, -0.1900615692138672, -0.18275070190429688, -0.17543983459472656, -0.16812896728515625, -0.16081809997558594, -0.15350723266601562, -0.1461963653564453, -0.138885498046875, -0.1315746307373047, -0.12426376342773438, -0.11695289611816406, -0.10964202880859375, -0.10233116149902344, -0.09502029418945312, -0.08770942687988281, -0.0803985595703125, -0.07308769226074219, -0.06577682495117188, -0.05846595764160156, -0.05115509033203125, -0.04384422302246094, -0.036533355712890625, -0.029222488403320312, -0.02191162109375, -0.014600753784179688, -0.007289886474609375, 2.09808349609375e-05, 0.00733184814453125, 0.014642715454101562, 0.021953582763671875, 0.029264450073242188, 0.0365753173828125, 0.04388618469238281, 0.051197052001953125, 0.05850791931152344, 0.06581878662109375, 0.07312965393066406, 0.08044052124023438, 0.08775138854980469, 0.095062255859375, 0.10237312316894531, 0.10968399047851562, 0.11699485778808594, 0.12430572509765625, 0.13161659240722656, 0.13892745971679688, 0.1462383270263672, 0.1535491943359375, 0.1608600616455078, 0.16817092895507812, 0.17548179626464844, 0.18279266357421875, 0.19010353088378906, 0.19741439819335938, 0.2047252655029297, 0.2120361328125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 14.0, 10.0, 33.0, 93.0, 362.0, 2548.0, 131693.0, 4041946.0, 15756.0, 1365.0, 304.0, 93.0, 31.0, 11.0, 14.0, 6.0, 5.0, 1.0, 3.0, 2.0, 1.0, 2.0], "bins": [-3.48046875, -3.4098358154296875, -3.339202880859375, -3.2685699462890625, -3.19793701171875, -3.1273040771484375, -3.056671142578125, -2.9860382080078125, -2.9154052734375, -2.8447723388671875, -2.774139404296875, -2.7035064697265625, -2.63287353515625, -2.5622406005859375, -2.491607666015625, -2.4209747314453125, -2.350341796875, -2.2797088623046875, -2.209075927734375, -2.1384429931640625, -2.06781005859375, -1.9971771240234375, -1.926544189453125, -1.8559112548828125, -1.7852783203125, -1.7146453857421875, -1.644012451171875, -1.5733795166015625, -1.50274658203125, -1.4321136474609375, -1.361480712890625, -1.2908477783203125, -1.22021484375, -1.1495819091796875, -1.078948974609375, -1.0083160400390625, -0.93768310546875, -0.8670501708984375, -0.796417236328125, -0.7257843017578125, -0.6551513671875, -0.5845184326171875, -0.513885498046875, -0.4432525634765625, -0.37261962890625, -0.3019866943359375, -0.231353759765625, -0.1607208251953125, -0.090087890625, -0.0194549560546875, 0.051177978515625, 0.1218109130859375, 0.19244384765625, 0.2630767822265625, 0.333709716796875, 0.4043426513671875, 0.4749755859375, 0.5456085205078125, 0.616241455078125, 0.6868743896484375, 0.75750732421875, 0.8281402587890625, 0.898773193359375, 0.9694061279296875, 1.0400390625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 12.0, 5.0, 12.0, 21.0, 26.0, 42.0, 65.0, 128.0, 251.0, 515.0, 1002.0, 969.0, 508.0, 214.0, 108.0, 68.0, 42.0, 17.0, 22.0, 17.0, 8.0, 8.0, 2.0, 5.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50439453125, -0.47629547119140625, -0.4481964111328125, -0.42009735107421875, -0.391998291015625, -0.36389923095703125, -0.3358001708984375, -0.30770111083984375, -0.27960205078125, -0.25150299072265625, -0.2234039306640625, -0.19530487060546875, -0.167205810546875, -0.13910675048828125, -0.1110076904296875, -0.08290863037109375, -0.0548095703125, -0.02671051025390625, 0.0013885498046875, 0.02948760986328125, 0.057586669921875, 0.08568572998046875, 0.1137847900390625, 0.14188385009765625, 0.16998291015625, 0.19808197021484375, 0.2261810302734375, 0.25428009033203125, 0.282379150390625, 0.31047821044921875, 0.3385772705078125, 0.36667633056640625, 0.394775390625, 0.42287445068359375, 0.4509735107421875, 0.47907257080078125, 0.507171630859375, 0.5352706909179688, 0.5633697509765625, 0.5914688110351562, 0.61956787109375, 0.6476669311523438, 0.6757659912109375, 0.7038650512695312, 0.731964111328125, 0.7600631713867188, 0.7881622314453125, 0.8162612915039062, 0.8443603515625, 0.8724594116210938, 0.9005584716796875, 0.9286575317382812, 0.956756591796875, 0.9848556518554688, 1.0129547119140625, 1.0410537719726562, 1.06915283203125, 1.0972518920898438, 1.1253509521484375, 1.1534500122070312, 1.181549072265625, 1.2096481323242188, 1.2377471923828125, 1.2658462524414062, 1.2939453125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 4.0, 4.0, 7.0, 26.0, 62.0, 160.0, 297.0, 223.0, 139.0, 37.0, 15.0, 8.0, 6.0, 5.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.029900550842285, -8.745197296142578, -8.460494995117188, -8.17579174041748, -7.891088485717773, -7.606385231018066, -7.321682453155518, -7.036979675292969, -6.752276420593262, -6.467573165893555, -6.182870388031006, -5.898167610168457, -5.61346435546875, -5.328761100769043, -5.044058322906494, -4.759355545043945, -4.474652290344238, -4.189949035644531, -3.9052462577819824, -3.6205432415008545, -3.3358402252197266, -3.0511372089385986, -2.7664341926574707, -2.4817311763763428, -2.197028160095215, -1.912325143814087, -1.627622127532959, -1.342919111251831, -1.0582160949707031, -0.7735130786895752, -0.48881006240844727, -0.20410704612731934, 0.08059501647949219, 0.3652980327606201, 0.650001049041748, 0.934704065322876, 1.219407081604004, 1.5041100978851318, 1.7888131141662598, 2.0735161304473877, 2.3582191467285156, 2.6429221630096436, 2.9276251792907715, 3.2123281955718994, 3.4970312118530273, 3.7817342281341553, 4.066437244415283, 4.351140022277832, 4.635843276977539, 4.920546531677246, 5.205249309539795, 5.489952087402344, 5.774655342102051, 6.059358596801758, 6.344061374664307, 6.6287641525268555, 6.9134674072265625, 7.1981706619262695, 7.482873439788818, 7.767576217651367, 8.052279472351074, 8.336982727050781, 8.621685028076172, 8.906388282775879, 9.191091537475586]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 9.0, 6.0, 8.0, 10.0, 10.0, 16.0, 34.0, 26.0, 39.0, 41.0, 38.0, 45.0, 49.0, 52.0, 48.0, 56.0, 71.0, 53.0, 45.0, 57.0, 52.0, 36.0, 42.0, 28.0, 24.0, 14.0, 20.0, 11.0, 11.0, 11.0, 13.0, 11.0, 5.0, 3.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.5518808364868164, -3.4524831771850586, -3.3530852794647217, -3.253687620162964, -3.154289722442627, -3.054892063140869, -2.9554944038391113, -2.8560967445373535, -2.7566988468170166, -2.657301187515259, -2.557903289794922, -2.458505630493164, -2.3591079711914062, -2.2597100734710693, -2.1603124141693115, -2.0609145164489746, -1.9615168571472168, -1.8621190786361694, -1.762721300125122, -1.6633236408233643, -1.563925862312317, -1.4645280838012695, -1.3651304244995117, -1.2657326459884644, -1.166334867477417, -1.0669370889663696, -0.967539370059967, -0.8681416511535645, -0.7687438726425171, -0.6693460941314697, -0.5699483752250671, -0.47055065631866455, -0.3711528778076172, -0.2717551290988922, -0.17235738039016724, -0.07295963168144226, 0.026438117027282715, 0.1258358657360077, 0.22523361444473267, 0.32463133335113525, 0.4240291118621826, 0.52342689037323, 0.6228246092796326, 0.7222223281860352, 0.8216201066970825, 0.9210178852081299, 1.0204155445098877, 1.119813323020935, 1.2192111015319824, 1.3186088800430298, 1.4180066585540771, 1.517404317855835, 1.6168020963668823, 1.7161998748779297, 1.8155975341796875, 1.9149953126907349, 2.0143930912017822, 2.11379075050354, 2.213188648223877, 2.3125863075256348, 2.4119839668273926, 2.5113818645477295, 2.6107795238494873, 2.710177421569824, 2.809575080871582]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 8.0, 6.0, 6.0, 21.0, 23.0, 40.0, 61.0, 103.0, 176.0, 307.0, 511.0, 1014.0, 1928.0, 4167.0, 10615.0, 34432.0, 154086.0, 522390.0, 242538.0, 51263.0, 14499.0, 5367.0, 2344.0, 1180.0, 646.0, 332.0, 199.0, 97.0, 67.0, 47.0, 25.0, 20.0, 8.0, 15.0, 5.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.368408203125, -0.3545799255371094, -0.34075164794921875, -0.3269233703613281, -0.3130950927734375, -0.2992668151855469, -0.28543853759765625, -0.2716102600097656, -0.257781982421875, -0.24395370483398438, -0.23012542724609375, -0.21629714965820312, -0.2024688720703125, -0.18864059448242188, -0.17481231689453125, -0.16098403930664062, -0.14715576171875, -0.13332748413085938, -0.11949920654296875, -0.10567092895507812, -0.0918426513671875, -0.07801437377929688, -0.06418609619140625, -0.050357818603515625, -0.036529541015625, -0.022701263427734375, -0.00887298583984375, 0.004955291748046875, 0.0187835693359375, 0.032611846923828125, 0.04644012451171875, 0.060268402099609375, 0.0740966796875, 0.08792495727539062, 0.10175323486328125, 0.11558151245117188, 0.1294097900390625, 0.14323806762695312, 0.15706634521484375, 0.17089462280273438, 0.184722900390625, 0.19855117797851562, 0.21237945556640625, 0.22620773315429688, 0.2400360107421875, 0.2538642883300781, 0.26769256591796875, 0.2815208435058594, 0.29534912109375, 0.3091773986816406, 0.32300567626953125, 0.3368339538574219, 0.3506622314453125, 0.3644905090332031, 0.37831878662109375, 0.3921470642089844, 0.405975341796875, 0.4198036193847656, 0.43363189697265625, 0.4474601745605469, 0.4612884521484375, 0.4751167297363281, 0.48894500732421875, 0.5027732849121094, 0.5166015625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 1.0, 4.0, 5.0, 7.0, 10.0, 6.0, 13.0, 12.0, 10.0, 18.0, 19.0, 14.0, 31.0, 38.0, 36.0, 43.0, 29.0, 46.0, 51.0, 54.0, 59.0, 44.0, 54.0, 43.0, 48.0, 37.0, 35.0, 32.0, 31.0, 26.0, 27.0, 20.0, 24.0, 13.0, 22.0, 10.0, 11.0, 8.0, 6.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26904296875, -0.2608680725097656, -0.25269317626953125, -0.24451828002929688, -0.2363433837890625, -0.22816848754882812, -0.21999359130859375, -0.21181869506835938, -0.203643798828125, -0.19546890258789062, -0.18729400634765625, -0.17911911010742188, -0.1709442138671875, -0.16276931762695312, -0.15459442138671875, -0.14641952514648438, -0.13824462890625, -0.13006973266601562, -0.12189483642578125, -0.11371994018554688, -0.1055450439453125, -0.09737014770507812, -0.08919525146484375, -0.08102035522460938, -0.072845458984375, -0.06467056274414062, -0.05649566650390625, -0.048320770263671875, -0.0401458740234375, -0.031970977783203125, -0.02379608154296875, -0.015621185302734375, -0.0074462890625, 0.000728607177734375, 0.00890350341796875, 0.017078399658203125, 0.0252532958984375, 0.033428192138671875, 0.04160308837890625, 0.049777984619140625, 0.057952880859375, 0.06612777709960938, 0.07430267333984375, 0.08247756958007812, 0.0906524658203125, 0.09882736206054688, 0.10700225830078125, 0.11517715454101562, 0.12335205078125, 0.13152694702148438, 0.13970184326171875, 0.14787673950195312, 0.1560516357421875, 0.16422653198242188, 0.17240142822265625, 0.18057632446289062, 0.188751220703125, 0.19692611694335938, 0.20510101318359375, 0.21327590942382812, 0.2214508056640625, 0.22962570190429688, 0.23780059814453125, 0.24597549438476562, 0.254150390625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 8.0, 7.0, 2.0, 6.0, 14.0, 17.0, 32.0, 39.0, 65.0, 78.0, 161.0, 317.0, 581.0, 1405.0, 4554.0, 28023.0, 639693.0, 346679.0, 20694.0, 3736.0, 1234.0, 517.0, 273.0, 139.0, 80.0, 61.0, 45.0, 22.0, 18.0, 21.0, 12.0, 8.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.009765625, -0.9831466674804688, -0.9565277099609375, -0.9299087524414062, -0.903289794921875, -0.8766708374023438, -0.8500518798828125, -0.8234329223632812, -0.79681396484375, -0.7701950073242188, -0.7435760498046875, -0.7169570922851562, -0.690338134765625, -0.6637191772460938, -0.6371002197265625, -0.6104812622070312, -0.5838623046875, -0.5572433471679688, -0.5306243896484375, -0.5040054321289062, -0.477386474609375, -0.45076751708984375, -0.4241485595703125, -0.39752960205078125, -0.37091064453125, -0.34429168701171875, -0.3176727294921875, -0.29105377197265625, -0.264434814453125, -0.23781585693359375, -0.2111968994140625, -0.18457794189453125, -0.157958984375, -0.13134002685546875, -0.1047210693359375, -0.07810211181640625, -0.051483154296875, -0.02486419677734375, 0.0017547607421875, 0.02837371826171875, 0.05499267578125, 0.08161163330078125, 0.1082305908203125, 0.13484954833984375, 0.161468505859375, 0.18808746337890625, 0.2147064208984375, 0.24132537841796875, 0.2679443359375, 0.29456329345703125, 0.3211822509765625, 0.34780120849609375, 0.374420166015625, 0.40103912353515625, 0.4276580810546875, 0.45427703857421875, 0.48089599609375, 0.5075149536132812, 0.5341339111328125, 0.5607528686523438, 0.587371826171875, 0.6139907836914062, 0.6406097412109375, 0.6672286987304688, 0.69384765625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 4.0, 4.0, 8.0, 8.0, 10.0, 6.0, 14.0, 11.0, 22.0, 29.0, 33.0, 28.0, 41.0, 49.0, 51.0, 46.0, 61.0, 62.0, 63.0, 34.0, 42.0, 52.0, 67.0, 37.0, 38.0, 32.0, 28.0, 24.0, 20.0, 20.0, 18.0, 12.0, 6.0, 7.0, 5.0, 1.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.107421875, -1.0734100341796875, -1.039398193359375, -1.0053863525390625, -0.97137451171875, -0.9373626708984375, -0.903350830078125, -0.8693389892578125, -0.8353271484375, -0.8013153076171875, -0.767303466796875, -0.7332916259765625, -0.69927978515625, -0.6652679443359375, -0.631256103515625, -0.5972442626953125, -0.563232421875, -0.5292205810546875, -0.495208740234375, -0.4611968994140625, -0.42718505859375, -0.3931732177734375, -0.359161376953125, -0.3251495361328125, -0.2911376953125, -0.2571258544921875, -0.223114013671875, -0.1891021728515625, -0.15509033203125, -0.1210784912109375, -0.087066650390625, -0.0530548095703125, -0.01904296875, 0.0149688720703125, 0.048980712890625, 0.0829925537109375, 0.11700439453125, 0.1510162353515625, 0.185028076171875, 0.2190399169921875, 0.2530517578125, 0.2870635986328125, 0.321075439453125, 0.3550872802734375, 0.38909912109375, 0.4231109619140625, 0.457122802734375, 0.4911346435546875, 0.525146484375, 0.5591583251953125, 0.593170166015625, 0.6271820068359375, 0.66119384765625, 0.6952056884765625, 0.729217529296875, 0.7632293701171875, 0.7972412109375, 0.8312530517578125, 0.865264892578125, 0.8992767333984375, 0.93328857421875, 0.9673004150390625, 1.001312255859375, 1.0353240966796875, 1.0693359375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 5.0, 6.0, 10.0, 13.0, 21.0, 37.0, 62.0, 100.0, 231.0, 631.0, 2159.0, 10039.0, 79986.0, 846373.0, 94092.0, 11218.0, 2382.0, 681.0, 251.0, 102.0, 50.0, 35.0, 23.0, 22.0, 8.0, 4.0, 4.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.402587890625, -0.3898200988769531, -0.37705230712890625, -0.3642845153808594, -0.3515167236328125, -0.3387489318847656, -0.32598114013671875, -0.3132133483886719, -0.300445556640625, -0.2876777648925781, -0.27490997314453125, -0.2621421813964844, -0.2493743896484375, -0.23660659790039062, -0.22383880615234375, -0.21107101440429688, -0.19830322265625, -0.18553543090820312, -0.17276763916015625, -0.15999984741210938, -0.1472320556640625, -0.13446426391601562, -0.12169647216796875, -0.10892868041992188, -0.096160888671875, -0.08339309692382812, -0.07062530517578125, -0.057857513427734375, -0.0450897216796875, -0.032321929931640625, -0.01955413818359375, -0.006786346435546875, 0.0059814453125, 0.018749237060546875, 0.03151702880859375, 0.044284820556640625, 0.0570526123046875, 0.06982040405273438, 0.08258819580078125, 0.09535598754882812, 0.108123779296875, 0.12089157104492188, 0.13365936279296875, 0.14642715454101562, 0.1591949462890625, 0.17196273803710938, 0.18473052978515625, 0.19749832153320312, 0.21026611328125, 0.22303390502929688, 0.23580169677734375, 0.24856948852539062, 0.2613372802734375, 0.2741050720214844, 0.28687286376953125, 0.2996406555175781, 0.312408447265625, 0.3251762390136719, 0.33794403076171875, 0.3507118225097656, 0.3634796142578125, 0.3762474060058594, 0.38901519775390625, 0.4017829895019531, 0.41455078125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 2.0, 7.0, 4.0, 8.0, 5.0, 14.0, 20.0, 28.0, 32.0, 58.0, 66.0, 86.0, 106.0, 112.0, 91.0, 90.0, 74.0, 62.0, 33.0, 25.0, 20.0, 8.0, 11.0, 2.0, 5.0, 4.0, 7.0, 2.0, 1.0, 5.0, 1.0, 0.0, 5.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.888938903808594e-05, -5.667004734277725e-05, -5.445070564746857e-05, -5.223136395215988e-05, -5.0012022256851196e-05, -4.779268056154251e-05, -4.5573338866233826e-05, -4.335399717092514e-05, -4.1134655475616455e-05, -3.891531378030777e-05, -3.6695972084999084e-05, -3.44766303896904e-05, -3.2257288694381714e-05, -3.003794699907303e-05, -2.7818605303764343e-05, -2.5599263608455658e-05, -2.3379921913146973e-05, -2.1160580217838287e-05, -1.8941238522529602e-05, -1.6721896827220917e-05, -1.4502555131912231e-05, -1.2283213436603546e-05, -1.006387174129486e-05, -7.844530045986176e-06, -5.62518835067749e-06, -3.405846655368805e-06, -1.1865049600601196e-06, 1.0328367352485657e-06, 3.252178430557251e-06, 5.471520125865936e-06, 7.690861821174622e-06, 9.910203516483307e-06, 1.2129545211791992e-05, 1.4348886907100677e-05, 1.6568228602409363e-05, 1.8787570297718048e-05, 2.1006911993026733e-05, 2.322625368833542e-05, 2.5445595383644104e-05, 2.766493707895279e-05, 2.9884278774261475e-05, 3.210362046957016e-05, 3.4322962164878845e-05, 3.654230386018753e-05, 3.8761645555496216e-05, 4.09809872508049e-05, 4.3200328946113586e-05, 4.541967064142227e-05, 4.763901233673096e-05, 4.985835403203964e-05, 5.207769572734833e-05, 5.429703742265701e-05, 5.65163791179657e-05, 5.8735720813274384e-05, 6.095506250858307e-05, 6.317440420389175e-05, 6.539374589920044e-05, 6.761308759450912e-05, 6.983242928981781e-05, 7.20517709851265e-05, 7.427111268043518e-05, 7.649045437574387e-05, 7.870979607105255e-05, 8.092913776636124e-05, 8.314847946166992e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 7.0, 12.0, 12.0, 24.0, 35.0, 52.0, 94.0, 172.0, 325.0, 707.0, 1772.0, 6139.0, 30827.0, 279569.0, 666567.0, 49169.0, 8866.0, 2438.0, 866.0, 403.0, 224.0, 103.0, 61.0, 37.0, 19.0, 11.0, 9.0, 10.0, 6.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.400390625, -0.3896064758300781, -0.37882232666015625, -0.3680381774902344, -0.3572540283203125, -0.3464698791503906, -0.33568572998046875, -0.3249015808105469, -0.314117431640625, -0.3033332824707031, -0.29254913330078125, -0.2817649841308594, -0.2709808349609375, -0.2601966857910156, -0.24941253662109375, -0.23862838745117188, -0.22784423828125, -0.21706008911132812, -0.20627593994140625, -0.19549179077148438, -0.1847076416015625, -0.17392349243164062, -0.16313934326171875, -0.15235519409179688, -0.141571044921875, -0.13078689575195312, -0.12000274658203125, -0.10921859741210938, -0.0984344482421875, -0.08765029907226562, -0.07686614990234375, -0.06608200073242188, -0.0552978515625, -0.044513702392578125, -0.03372955322265625, -0.022945404052734375, -0.0121612548828125, -0.001377105712890625, 0.00940704345703125, 0.020191192626953125, 0.030975341796875, 0.041759490966796875, 0.05254364013671875, 0.06332778930664062, 0.0741119384765625, 0.08489608764648438, 0.09568023681640625, 0.10646438598632812, 0.11724853515625, 0.12803268432617188, 0.13881683349609375, 0.14960098266601562, 0.1603851318359375, 0.17116928100585938, 0.18195343017578125, 0.19273757934570312, 0.203521728515625, 0.21430587768554688, 0.22509002685546875, 0.23587417602539062, 0.2466583251953125, 0.2574424743652344, 0.26822662353515625, 0.2790107727050781, 0.289794921875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 6.0, 5.0, 3.0, 2.0, 6.0, 8.0, 8.0, 8.0, 17.0, 13.0, 29.0, 25.0, 36.0, 57.0, 57.0, 82.0, 99.0, 109.0, 81.0, 78.0, 59.0, 50.0, 24.0, 21.0, 20.0, 16.0, 19.0, 15.0, 8.0, 5.0, 8.0, 8.0, 1.0, 2.0, 4.0, 9.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2093505859375, -0.2024211883544922, -0.19549179077148438, -0.18856239318847656, -0.18163299560546875, -0.17470359802246094, -0.16777420043945312, -0.1608448028564453, -0.1539154052734375, -0.1469860076904297, -0.14005661010742188, -0.13312721252441406, -0.12619781494140625, -0.11926841735839844, -0.11233901977539062, -0.10540962219238281, -0.098480224609375, -0.09155082702636719, -0.08462142944335938, -0.07769203186035156, -0.07076263427734375, -0.06383323669433594, -0.056903839111328125, -0.04997444152832031, -0.0430450439453125, -0.03611564636230469, -0.029186248779296875, -0.022256851196289062, -0.01532745361328125, -0.008398056030273438, -0.001468658447265625, 0.0054607391357421875, 0.01239013671875, 0.019319534301757812, 0.026248931884765625, 0.03317832946777344, 0.04010772705078125, 0.04703712463378906, 0.053966522216796875, 0.06089591979980469, 0.0678253173828125, 0.07475471496582031, 0.08168411254882812, 0.08861351013183594, 0.09554290771484375, 0.10247230529785156, 0.10940170288085938, 0.11633110046386719, 0.123260498046875, 0.1301898956298828, 0.13711929321289062, 0.14404869079589844, 0.15097808837890625, 0.15790748596191406, 0.16483688354492188, 0.1717662811279297, 0.1786956787109375, 0.1856250762939453, 0.19255447387695312, 0.19948387145996094, 0.20641326904296875, 0.21334266662597656, 0.22027206420898438, 0.2272014617919922, 0.234130859375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 8.0, 11.0, 9.0, 28.0, 58.0, 137.0, 286.0, 247.0, 114.0, 48.0, 21.0, 11.0, 5.0, 4.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.16749095916748, -7.952314376831055, -7.737137794494629, -7.521961212158203, -7.306784152984619, -7.091607570648193, -6.876430988311768, -6.661254405975342, -6.446077346801758, -6.230900764465332, -6.015724182128906, -5.8005475997924805, -5.5853705406188965, -5.370193958282471, -5.155017375946045, -4.939840793609619, -4.724664211273193, -4.509487628936768, -4.294311046600342, -4.079133987426758, -3.863957405090332, -3.6487808227539062, -3.4336042404174805, -3.2184276580810547, -3.00325083732605, -2.788074254989624, -2.572897434234619, -2.3577208518981934, -2.1425442695617676, -1.9273674488067627, -1.712190866470337, -1.4970141649246216, -1.2818374633789062, -1.066660761833191, -0.8514841198921204, -0.6363074779510498, -0.4211307764053345, -0.20595407485961914, 0.00922250747680664, 0.22439920902252197, 0.4395759105682373, 0.6547526121139526, 0.8699292540550232, 1.0851058959960938, 1.300282597541809, 1.5154592990875244, 1.7306358814239502, 1.9458125829696655, 2.160989284515381, 2.3761658668518066, 2.5913426876068115, 2.8065192699432373, 3.021696090698242, 3.236872673034668, 3.4520492553710938, 3.6672258377075195, 3.8824026584625244, 4.097579479217529, 4.312756061553955, 4.527932643890381, 4.743109226226807, 4.958286285400391, 5.173462867736816, 5.388639450073242, 5.603816032409668]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 3.0, 4.0, 5.0, 13.0, 13.0, 20.0, 16.0, 18.0, 19.0, 29.0, 30.0, 40.0, 32.0, 56.0, 46.0, 64.0, 87.0, 79.0, 67.0, 57.0, 48.0, 43.0, 33.0, 27.0, 32.0, 17.0, 16.0, 23.0, 12.0, 13.0, 9.0, 13.0, 5.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8827619552612305, -3.7477450370788574, -3.6127278804779053, -3.4777109622955322, -3.34269380569458, -3.207676887512207, -3.072659969329834, -2.937643051147461, -2.802625894546509, -2.6676089763641357, -2.5325918197631836, -2.3975749015808105, -2.2625579833984375, -2.1275408267974854, -1.9925239086151123, -1.8575068712234497, -1.722489833831787, -1.5874727964401245, -1.452455759048462, -1.3174388408660889, -1.1824218034744263, -1.0474047660827637, -0.9123877882957458, -0.777370810508728, -0.6423537731170654, -0.5073367357254028, -0.372319757938385, -0.2373027503490448, -0.10228574275970459, 0.03273129463195801, 0.16774827241897583, 0.30276525020599365, 0.43778228759765625, 0.5727993249893188, 0.7078163027763367, 0.8428332805633545, 0.9778503179550171, 1.1128673553466797, 1.2478842735290527, 1.3829013109207153, 1.517918348312378, 1.6529353857040405, 1.7879524230957031, 1.9229693412780762, 2.057986259460449, 2.1930034160614014, 2.3280203342437744, 2.4630374908447266, 2.5980544090270996, 2.7330713272094727, 2.868088483810425, 3.003105401992798, 3.13812255859375, 3.273139476776123, 3.408156394958496, 3.543173313140869, 3.6781904697418213, 3.8132073879241943, 3.9482245445251465, 4.0832414627075195, 4.218258380889893, 4.353275299072266, 4.488292694091797, 4.62330961227417, 4.758326530456543]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 4.0, 10.0, 22.0, 25.0, 60.0, 83.0, 187.0, 335.0, 697.0, 1531.0, 3462.0, 8750.0, 26803.0, 118352.0, 947042.0, 2619838.0, 380489.0, 59667.0, 16126.0, 5845.0, 2595.0, 1102.0, 552.0, 319.0, 148.0, 98.0, 52.0, 31.0, 19.0, 15.0, 8.0, 7.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.353759765625, -0.3431358337402344, -0.33251190185546875, -0.3218879699707031, -0.3112640380859375, -0.3006401062011719, -0.29001617431640625, -0.2793922424316406, -0.268768310546875, -0.2581443786621094, -0.24752044677734375, -0.23689651489257812, -0.2262725830078125, -0.21564865112304688, -0.20502471923828125, -0.19440078735351562, -0.18377685546875, -0.17315292358398438, -0.16252899169921875, -0.15190505981445312, -0.1412811279296875, -0.13065719604492188, -0.12003326416015625, -0.10940933227539062, -0.098785400390625, -0.08816146850585938, -0.07753753662109375, -0.06691360473632812, -0.0562896728515625, -0.045665740966796875, -0.03504180908203125, -0.024417877197265625, -0.0137939453125, -0.003170013427734375, 0.00745391845703125, 0.018077850341796875, 0.0287017822265625, 0.039325714111328125, 0.04994964599609375, 0.060573577880859375, 0.071197509765625, 0.08182144165039062, 0.09244537353515625, 0.10306930541992188, 0.1136932373046875, 0.12431716918945312, 0.13494110107421875, 0.14556503295898438, 0.15618896484375, 0.16681289672851562, 0.17743682861328125, 0.18806076049804688, 0.1986846923828125, 0.20930862426757812, 0.21993255615234375, 0.23055648803710938, 0.241180419921875, 0.2518043518066406, 0.26242828369140625, 0.2730522155761719, 0.2836761474609375, 0.2943000793457031, 0.30492401123046875, 0.3155479431152344, 0.326171875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 8.0, 4.0, 5.0, 14.0, 9.0, 16.0, 14.0, 17.0, 21.0, 31.0, 33.0, 32.0, 44.0, 45.0, 56.0, 37.0, 57.0, 60.0, 52.0, 50.0, 61.0, 50.0, 39.0, 41.0, 31.0, 27.0, 31.0, 18.0, 18.0, 18.0, 15.0, 10.0, 2.0, 9.0, 9.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.228515625, -0.22054290771484375, -0.2125701904296875, -0.20459747314453125, -0.196624755859375, -0.18865203857421875, -0.1806793212890625, -0.17270660400390625, -0.16473388671875, -0.15676116943359375, -0.1487884521484375, -0.14081573486328125, -0.132843017578125, -0.12487030029296875, -0.1168975830078125, -0.10892486572265625, -0.1009521484375, -0.09297943115234375, -0.0850067138671875, -0.07703399658203125, -0.069061279296875, -0.06108856201171875, -0.0531158447265625, -0.04514312744140625, -0.03717041015625, -0.02919769287109375, -0.0212249755859375, -0.01325225830078125, -0.005279541015625, 0.00269317626953125, 0.0106658935546875, 0.01863861083984375, 0.026611328125, 0.03458404541015625, 0.0425567626953125, 0.05052947998046875, 0.058502197265625, 0.06647491455078125, 0.0744476318359375, 0.08242034912109375, 0.09039306640625, 0.09836578369140625, 0.1063385009765625, 0.11431121826171875, 0.122283935546875, 0.13025665283203125, 0.1382293701171875, 0.14620208740234375, 0.1541748046875, 0.16214752197265625, 0.1701202392578125, 0.17809295654296875, 0.186065673828125, 0.19403839111328125, 0.2020111083984375, 0.20998382568359375, 0.21795654296875, 0.22592926025390625, 0.2339019775390625, 0.24187469482421875, 0.249847412109375, 0.25782012939453125, 0.2657928466796875, 0.27376556396484375, 0.28173828125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 7.0, 17.0, 25.0, 54.0, 191.0, 1206.0, 49802.0, 4133012.0, 9062.0, 674.0, 151.0, 44.0, 20.0, 14.0, 3.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.169921875, -3.091339111328125, -3.01275634765625, -2.934173583984375, -2.8555908203125, -2.777008056640625, -2.69842529296875, -2.619842529296875, -2.541259765625, -2.462677001953125, -2.38409423828125, -2.305511474609375, -2.2269287109375, -2.148345947265625, -2.06976318359375, -1.991180419921875, -1.91259765625, -1.834014892578125, -1.75543212890625, -1.676849365234375, -1.5982666015625, -1.519683837890625, -1.44110107421875, -1.362518310546875, -1.283935546875, -1.205352783203125, -1.12677001953125, -1.048187255859375, -0.9696044921875, -0.891021728515625, -0.81243896484375, -0.733856201171875, -0.6552734375, -0.576690673828125, -0.49810791015625, -0.419525146484375, -0.3409423828125, -0.262359619140625, -0.18377685546875, -0.105194091796875, -0.026611328125, 0.051971435546875, 0.13055419921875, 0.209136962890625, 0.2877197265625, 0.366302490234375, 0.44488525390625, 0.523468017578125, 0.60205078125, 0.680633544921875, 0.75921630859375, 0.837799072265625, 0.9163818359375, 0.994964599609375, 1.07354736328125, 1.152130126953125, 1.230712890625, 1.309295654296875, 1.38787841796875, 1.466461181640625, 1.5450439453125, 1.623626708984375, 1.70220947265625, 1.780792236328125, 1.859375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 9.0, 10.0, 23.0, 33.0, 49.0, 84.0, 158.0, 375.0, 788.0, 1126.0, 697.0, 342.0, 151.0, 78.0, 51.0, 32.0, 23.0, 17.0, 10.0, 3.0, 6.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.70556640625, -0.6798324584960938, -0.6540985107421875, -0.6283645629882812, -0.602630615234375, -0.5768966674804688, -0.5511627197265625, -0.5254287719726562, -0.49969482421875, -0.47396087646484375, -0.4482269287109375, -0.42249298095703125, -0.396759033203125, -0.37102508544921875, -0.3452911376953125, -0.31955718994140625, -0.2938232421875, -0.26808929443359375, -0.2423553466796875, -0.21662139892578125, -0.190887451171875, -0.16515350341796875, -0.1394195556640625, -0.11368560791015625, -0.08795166015625, -0.06221771240234375, -0.0364837646484375, -0.01074981689453125, 0.014984130859375, 0.04071807861328125, 0.0664520263671875, 0.09218597412109375, 0.117919921875, 0.14365386962890625, 0.1693878173828125, 0.19512176513671875, 0.220855712890625, 0.24658966064453125, 0.2723236083984375, 0.29805755615234375, 0.32379150390625, 0.34952545166015625, 0.3752593994140625, 0.40099334716796875, 0.426727294921875, 0.45246124267578125, 0.4781951904296875, 0.5039291381835938, 0.5296630859375, 0.5553970336914062, 0.5811309814453125, 0.6068649291992188, 0.632598876953125, 0.6583328247070312, 0.6840667724609375, 0.7098007202148438, 0.73553466796875, 0.7612686157226562, 0.7870025634765625, 0.8127365112304688, 0.838470458984375, 0.8642044067382812, 0.8899383544921875, 0.9156723022460938, 0.94140625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 7.0, 10.0, 17.0, 42.0, 73.0, 147.0, 210.0, 189.0, 126.0, 74.0, 51.0, 24.0, 9.0, 8.0, 5.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2516441345214844, -2.073621988296509, -1.8955998420715332, -1.7175776958465576, -1.539555549621582, -1.3615334033966064, -1.1835112571716309, -1.0054891109466553, -0.8274669647216797, -0.6494448184967041, -0.4714226722717285, -0.29340052604675293, -0.11537837982177734, 0.06264376640319824, 0.24066591262817383, 0.4186880588531494, 0.596710205078125, 0.7747323513031006, 0.9527544975280762, 1.1307766437530518, 1.3087987899780273, 1.486820936203003, 1.6648430824279785, 1.842865228652954, 2.0208873748779297, 2.1989095211029053, 2.376931667327881, 2.5549538135528564, 2.732975959777832, 2.9109981060028076, 3.089020252227783, 3.267042398452759, 3.4450645446777344, 3.62308669090271, 3.8011088371276855, 3.979130983352661, 4.157153129577637, 4.335175514221191, 4.513197422027588, 4.691219329833984, 4.869241714477539, 5.047264099121094, 5.22528600692749, 5.403307914733887, 5.581330299377441, 5.759352684020996, 5.937374591827393, 6.115396499633789, 6.293418884277344, 6.471441268920898, 6.649463176727295, 6.827485084533691, 7.005507469177246, 7.183529853820801, 7.361551761627197, 7.539573669433594, 7.717596054077148, 7.895618438720703, 8.073640823364258, 8.251662254333496, 8.42968463897705, 8.607707023620605, 8.785728454589844, 8.963750839233398, 9.141773223876953]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 4.0, 7.0, 5.0, 7.0, 11.0, 14.0, 14.0, 18.0, 16.0, 23.0, 34.0, 25.0, 29.0, 36.0, 34.0, 35.0, 44.0, 31.0, 35.0, 39.0, 41.0, 40.0, 29.0, 41.0, 35.0, 31.0, 38.0, 37.0, 35.0, 34.0, 20.0, 28.0, 19.0, 15.0, 11.0, 15.0, 13.0, 10.0, 12.0, 8.0, 6.0, 2.0, 2.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-1.8771250247955322, -1.817053198814392, -1.7569814920425415, -1.6969096660614014, -1.6368379592895508, -1.5767661333084106, -1.5166943073272705, -1.45662260055542, -1.3965507745742798, -1.3364789485931396, -1.276407241821289, -1.216335415840149, -1.1562635898590088, -1.0961918830871582, -1.036120057106018, -0.9760482907295227, -0.9159765243530273, -0.855904757976532, -0.7958329916000366, -0.7357611656188965, -0.6756893992424011, -0.6156176328659058, -0.5555458068847656, -0.49547404050827026, -0.4354022741317749, -0.37533050775527954, -0.3152587115764618, -0.25518691539764404, -0.19511514902114868, -0.13504338264465332, -0.07497158646583557, -0.014899790287017822, 0.04517197608947754, 0.1052437573671341, 0.16531553864479065, 0.2253873199224472, 0.28545910120010376, 0.3455308675765991, 0.40560266375541687, 0.4656744599342346, 0.52574622631073, 0.5858179926872253, 0.6458897590637207, 0.7059615850448608, 0.7660333514213562, 0.8261051177978516, 0.8861769437789917, 0.9462487101554871, 1.0063204765319824, 1.0663923025131226, 1.1264640092849731, 1.1865358352661133, 1.2466075420379639, 1.306679368019104, 1.3667511940002441, 1.4268229007720947, 1.4868947267532349, 1.546966552734375, 1.6070382595062256, 1.6671100854873657, 1.7271819114685059, 1.7872536182403564, 1.8473254442214966, 1.9073972702026367, 1.9674689769744873]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 4.0, 9.0, 5.0, 16.0, 11.0, 12.0, 17.0, 44.0, 50.0, 83.0, 108.0, 194.0, 274.0, 467.0, 710.0, 1217.0, 2119.0, 3899.0, 8271.0, 20516.0, 64180.0, 259589.0, 472065.0, 147519.0, 39896.0, 13924.0, 6064.0, 3006.0, 1655.0, 997.0, 560.0, 359.0, 238.0, 144.0, 98.0, 61.0, 49.0, 44.0, 24.0, 21.0, 9.0, 14.0, 3.0, 4.0, 3.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.40185546875, -0.390472412109375, -0.37908935546875, -0.367706298828125, -0.3563232421875, -0.344940185546875, -0.33355712890625, -0.322174072265625, -0.310791015625, -0.299407958984375, -0.28802490234375, -0.276641845703125, -0.2652587890625, -0.253875732421875, -0.24249267578125, -0.231109619140625, -0.2197265625, -0.208343505859375, -0.19696044921875, -0.185577392578125, -0.1741943359375, -0.162811279296875, -0.15142822265625, -0.140045166015625, -0.128662109375, -0.117279052734375, -0.10589599609375, -0.094512939453125, -0.0831298828125, -0.071746826171875, -0.06036376953125, -0.048980712890625, -0.03759765625, -0.026214599609375, -0.01483154296875, -0.003448486328125, 0.0079345703125, 0.019317626953125, 0.03070068359375, 0.042083740234375, 0.053466796875, 0.064849853515625, 0.07623291015625, 0.087615966796875, 0.0989990234375, 0.110382080078125, 0.12176513671875, 0.133148193359375, 0.14453125, 0.155914306640625, 0.16729736328125, 0.178680419921875, 0.1900634765625, 0.201446533203125, 0.21282958984375, 0.224212646484375, 0.235595703125, 0.246978759765625, 0.25836181640625, 0.269744873046875, 0.2811279296875, 0.292510986328125, 0.30389404296875, 0.315277099609375, 0.32666015625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 3.0, 5.0, 4.0, 8.0, 6.0, 8.0, 7.0, 16.0, 12.0, 19.0, 20.0, 24.0, 36.0, 39.0, 33.0, 43.0, 37.0, 23.0, 43.0, 52.0, 65.0, 56.0, 50.0, 46.0, 55.0, 38.0, 51.0, 29.0, 35.0, 25.0, 23.0, 19.0, 18.0, 12.0, 8.0, 9.0, 7.0, 9.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.269287109375, -0.2607879638671875, -0.252288818359375, -0.2437896728515625, -0.23529052734375, -0.2267913818359375, -0.218292236328125, -0.2097930908203125, -0.2012939453125, -0.1927947998046875, -0.184295654296875, -0.1757965087890625, -0.16729736328125, -0.1587982177734375, -0.150299072265625, -0.1417999267578125, -0.13330078125, -0.1248016357421875, -0.116302490234375, -0.1078033447265625, -0.09930419921875, -0.0908050537109375, -0.082305908203125, -0.0738067626953125, -0.0653076171875, -0.0568084716796875, -0.048309326171875, -0.0398101806640625, -0.03131103515625, -0.0228118896484375, -0.014312744140625, -0.0058135986328125, 0.002685546875, 0.0111846923828125, 0.019683837890625, 0.0281829833984375, 0.03668212890625, 0.0451812744140625, 0.053680419921875, 0.0621795654296875, 0.0706787109375, 0.0791778564453125, 0.087677001953125, 0.0961761474609375, 0.10467529296875, 0.1131744384765625, 0.121673583984375, 0.1301727294921875, 0.138671875, 0.1471710205078125, 0.155670166015625, 0.1641693115234375, 0.17266845703125, 0.1811676025390625, 0.189666748046875, 0.1981658935546875, 0.2066650390625, 0.2151641845703125, 0.223663330078125, 0.2321624755859375, 0.24066162109375, 0.2491607666015625, 0.257659912109375, 0.2661590576171875, 0.274658203125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 5.0, 6.0, 16.0, 11.0, 14.0, 27.0, 33.0, 56.0, 85.0, 136.0, 225.0, 436.0, 982.0, 2751.0, 12795.0, 199045.0, 793344.0, 31138.0, 4724.0, 1391.0, 558.0, 296.0, 169.0, 101.0, 52.0, 35.0, 34.0, 24.0, 13.0, 17.0, 6.0, 8.0, 4.0, 6.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.068359375, -1.0403900146484375, -1.012420654296875, -0.9844512939453125, -0.95648193359375, -0.9285125732421875, -0.900543212890625, -0.8725738525390625, -0.8446044921875, -0.8166351318359375, -0.788665771484375, -0.7606964111328125, -0.73272705078125, -0.7047576904296875, -0.676788330078125, -0.6488189697265625, -0.620849609375, -0.5928802490234375, -0.564910888671875, -0.5369415283203125, -0.50897216796875, -0.4810028076171875, -0.453033447265625, -0.4250640869140625, -0.3970947265625, -0.3691253662109375, -0.341156005859375, -0.3131866455078125, -0.28521728515625, -0.2572479248046875, -0.229278564453125, -0.2013092041015625, -0.17333984375, -0.1453704833984375, -0.117401123046875, -0.0894317626953125, -0.06146240234375, -0.0334930419921875, -0.005523681640625, 0.0224456787109375, 0.0504150390625, 0.0783843994140625, 0.106353759765625, 0.1343231201171875, 0.16229248046875, 0.1902618408203125, 0.218231201171875, 0.2462005615234375, 0.274169921875, 0.3021392822265625, 0.330108642578125, 0.3580780029296875, 0.38604736328125, 0.4140167236328125, 0.441986083984375, 0.4699554443359375, 0.4979248046875, 0.5258941650390625, 0.553863525390625, 0.5818328857421875, 0.60980224609375, 0.6377716064453125, 0.665740966796875, 0.6937103271484375, 0.7216796875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 0.0, 4.0, 6.0, 7.0, 8.0, 8.0, 10.0, 11.0, 10.0, 26.0, 27.0, 22.0, 37.0, 43.0, 35.0, 41.0, 52.0, 44.0, 55.0, 39.0, 60.0, 62.0, 46.0, 37.0, 42.0, 43.0, 24.0, 37.0, 27.0, 19.0, 15.0, 24.0, 18.0, 9.0, 14.0, 9.0, 5.0, 5.0, 5.0, 4.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.044921875, -1.0133895874023438, -0.9818572998046875, -0.9503250122070312, -0.918792724609375, -0.8872604370117188, -0.8557281494140625, -0.8241958618164062, -0.79266357421875, -0.7611312866210938, -0.7295989990234375, -0.6980667114257812, -0.666534423828125, -0.6350021362304688, -0.6034698486328125, -0.5719375610351562, -0.5404052734375, -0.5088729858398438, -0.4773406982421875, -0.44580841064453125, -0.414276123046875, -0.38274383544921875, -0.3512115478515625, -0.31967926025390625, -0.28814697265625, -0.25661468505859375, -0.2250823974609375, -0.19355010986328125, -0.162017822265625, -0.13048553466796875, -0.0989532470703125, -0.06742095947265625, -0.035888671875, -0.00435638427734375, 0.0271759033203125, 0.05870819091796875, 0.090240478515625, 0.12177276611328125, 0.1533050537109375, 0.18483734130859375, 0.21636962890625, 0.24790191650390625, 0.2794342041015625, 0.31096649169921875, 0.342498779296875, 0.37403106689453125, 0.4055633544921875, 0.43709564208984375, 0.4686279296875, 0.5001602172851562, 0.5316925048828125, 0.5632247924804688, 0.594757080078125, 0.6262893676757812, 0.6578216552734375, 0.6893539428710938, 0.72088623046875, 0.7524185180664062, 0.7839508056640625, 0.8154830932617188, 0.847015380859375, 0.8785476684570312, 0.9100799560546875, 0.9416122436523438, 0.97314453125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 2.0, 5.0, 8.0, 6.0, 15.0, 17.0, 35.0, 40.0, 57.0, 74.0, 104.0, 189.0, 377.0, 786.0, 1718.0, 4551.0, 14908.0, 75367.0, 784279.0, 133937.0, 21743.0, 6024.0, 2224.0, 986.0, 436.0, 231.0, 164.0, 96.0, 53.0, 42.0, 31.0, 12.0, 10.0, 4.0, 4.0, 3.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.2222900390625, -0.21478843688964844, -0.20728683471679688, -0.1997852325439453, -0.19228363037109375, -0.1847820281982422, -0.17728042602539062, -0.16977882385253906, -0.1622772216796875, -0.15477561950683594, -0.14727401733398438, -0.1397724151611328, -0.13227081298828125, -0.12476921081542969, -0.11726760864257812, -0.10976600646972656, -0.102264404296875, -0.09476280212402344, -0.08726119995117188, -0.07975959777832031, -0.07225799560546875, -0.06475639343261719, -0.057254791259765625, -0.04975318908691406, -0.0422515869140625, -0.03474998474121094, -0.027248382568359375, -0.019746780395507812, -0.01224517822265625, -0.0047435760498046875, 0.002758026123046875, 0.010259628295898438, 0.01776123046875, 0.025262832641601562, 0.032764434814453125, 0.04026603698730469, 0.04776763916015625, 0.05526924133300781, 0.06277084350585938, 0.07027244567871094, 0.0777740478515625, 0.08527565002441406, 0.09277725219726562, 0.10027885437011719, 0.10778045654296875, 0.11528205871582031, 0.12278366088867188, 0.13028526306152344, 0.137786865234375, 0.14528846740722656, 0.15279006958007812, 0.1602916717529297, 0.16779327392578125, 0.1752948760986328, 0.18279647827148438, 0.19029808044433594, 0.1977996826171875, 0.20530128479003906, 0.21280288696289062, 0.2203044891357422, 0.22780609130859375, 0.2353076934814453, 0.24280929565429688, 0.25031089782714844, 0.2578125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 5.0, 4.0, 9.0, 15.0, 13.0, 31.0, 56.0, 83.0, 88.0, 147.0, 151.0, 127.0, 66.0, 75.0, 52.0, 27.0, 13.0, 10.0, 3.0, 7.0, 7.0, 4.0, 0.0, 0.0, 0.0, 5.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.101629257202148e-05, -8.857715874910355e-05, -8.613802492618561e-05, -8.369889110326767e-05, -8.125975728034973e-05, -7.882062345743179e-05, -7.638148963451385e-05, -7.394235581159592e-05, -7.150322198867798e-05, -6.906408816576004e-05, -6.66249543428421e-05, -6.418582051992416e-05, -6.174668669700623e-05, -5.930755287408829e-05, -5.686841905117035e-05, -5.442928522825241e-05, -5.199015140533447e-05, -4.9551017582416534e-05, -4.7111883759498596e-05, -4.467274993658066e-05, -4.223361611366272e-05, -3.979448229074478e-05, -3.735534846782684e-05, -3.4916214644908905e-05, -3.247708082199097e-05, -3.003794699907303e-05, -2.759881317615509e-05, -2.5159679353237152e-05, -2.2720545530319214e-05, -2.0281411707401276e-05, -1.7842277884483337e-05, -1.54031440615654e-05, -1.2964010238647461e-05, -1.0524876415729523e-05, -8.085742592811584e-06, -5.646608769893646e-06, -3.207474946975708e-06, -7.683411240577698e-07, 1.6707926988601685e-06, 4.109926521778107e-06, 6.549060344696045e-06, 8.988194167613983e-06, 1.1427327990531921e-05, 1.386646181344986e-05, 1.6305595636367798e-05, 1.8744729459285736e-05, 2.1183863282203674e-05, 2.3622997105121613e-05, 2.606213092803955e-05, 2.850126475095749e-05, 3.094039857387543e-05, 3.3379532396793365e-05, 3.5818666219711304e-05, 3.825780004262924e-05, 4.069693386554718e-05, 4.313606768846512e-05, 4.557520151138306e-05, 4.8014335334300995e-05, 5.045346915721893e-05, 5.289260298013687e-05, 5.533173680305481e-05, 5.777087062597275e-05, 6.0210004448890686e-05, 6.264913827180862e-05, 6.508827209472656e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 5.0, 6.0, 16.0, 19.0, 25.0, 25.0, 45.0, 69.0, 96.0, 164.0, 278.0, 578.0, 1212.0, 2934.0, 8979.0, 37281.0, 324208.0, 613273.0, 43375.0, 10025.0, 3243.0, 1248.0, 594.0, 331.0, 184.0, 119.0, 70.0, 40.0, 25.0, 29.0, 15.0, 11.0, 12.0, 3.0, 3.0, 7.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.200927734375, -0.19321441650390625, -0.1855010986328125, -0.17778778076171875, -0.170074462890625, -0.16236114501953125, -0.1546478271484375, -0.14693450927734375, -0.13922119140625, -0.13150787353515625, -0.1237945556640625, -0.11608123779296875, -0.108367919921875, -0.10065460205078125, -0.0929412841796875, -0.08522796630859375, -0.0775146484375, -0.06980133056640625, -0.0620880126953125, -0.05437469482421875, -0.046661376953125, -0.03894805908203125, -0.0312347412109375, -0.02352142333984375, -0.01580810546875, -0.00809478759765625, -0.0003814697265625, 0.00733184814453125, 0.015045166015625, 0.02275848388671875, 0.0304718017578125, 0.03818511962890625, 0.0458984375, 0.05361175537109375, 0.0613250732421875, 0.06903839111328125, 0.076751708984375, 0.08446502685546875, 0.0921783447265625, 0.09989166259765625, 0.10760498046875, 0.11531829833984375, 0.1230316162109375, 0.13074493408203125, 0.138458251953125, 0.14617156982421875, 0.1538848876953125, 0.16159820556640625, 0.1693115234375, 0.17702484130859375, 0.1847381591796875, 0.19245147705078125, 0.200164794921875, 0.20787811279296875, 0.2155914306640625, 0.22330474853515625, 0.23101806640625, 0.23873138427734375, 0.2464447021484375, 0.25415802001953125, 0.261871337890625, 0.26958465576171875, 0.2772979736328125, 0.28501129150390625, 0.292724609375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 4.0, 9.0, 11.0, 5.0, 17.0, 11.0, 27.0, 41.0, 47.0, 49.0, 82.0, 98.0, 129.0, 103.0, 101.0, 61.0, 37.0, 41.0, 20.0, 25.0, 18.0, 16.0, 9.0, 11.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.205078125, -0.19840240478515625, -0.1917266845703125, -0.18505096435546875, -0.178375244140625, -0.17169952392578125, -0.1650238037109375, -0.15834808349609375, -0.15167236328125, -0.14499664306640625, -0.1383209228515625, -0.13164520263671875, -0.124969482421875, -0.11829376220703125, -0.1116180419921875, -0.10494232177734375, -0.0982666015625, -0.09159088134765625, -0.0849151611328125, -0.07823944091796875, -0.071563720703125, -0.06488800048828125, -0.0582122802734375, -0.05153656005859375, -0.04486083984375, -0.03818511962890625, -0.0315093994140625, -0.02483367919921875, -0.018157958984375, -0.01148223876953125, -0.0048065185546875, 0.00186920166015625, 0.008544921875, 0.01522064208984375, 0.0218963623046875, 0.02857208251953125, 0.035247802734375, 0.04192352294921875, 0.0485992431640625, 0.05527496337890625, 0.06195068359375, 0.06862640380859375, 0.0753021240234375, 0.08197784423828125, 0.088653564453125, 0.09532928466796875, 0.1020050048828125, 0.10868072509765625, 0.1153564453125, 0.12203216552734375, 0.1287078857421875, 0.13538360595703125, 0.142059326171875, 0.14873504638671875, 0.1554107666015625, 0.16208648681640625, 0.16876220703125, 0.17543792724609375, 0.1821136474609375, 0.18878936767578125, 0.195465087890625, 0.20214080810546875, 0.2088165283203125, 0.21549224853515625, 0.22216796875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 5.0, 6.0, 24.0, 52.0, 152.0, 420.0, 180.0, 100.0, 35.0, 11.0, 8.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.260405540466309, -8.021198272705078, -7.781991004943848, -7.542784214019775, -7.303576946258545, -7.0643696784973145, -6.825162410736084, -6.585955619812012, -6.346748352050781, -6.107541084289551, -5.86833381652832, -5.629127025604248, -5.389919757843018, -5.150712490081787, -4.911505222320557, -4.672298431396484, -4.433091163635254, -4.193883895874023, -3.954676866531372, -3.7154695987701416, -3.4762625694274902, -3.2370553016662598, -2.9978480339050293, -2.758641004562378, -2.5194334983825684, -2.280226230621338, -2.0410192012786865, -1.801811933517456, -1.5626049041748047, -1.3233976364135742, -1.0841904878616333, -0.8449833393096924, -0.605776309967041, -0.3665691614151001, -0.1273619830608368, 0.11184519529342651, 0.35105234384536743, 0.5902595520019531, 0.829466700553894, 1.068673849105835, 1.3078809976577759, 1.5470881462097168, 1.7862952947616577, 2.0255024433135986, 2.264709711074829, 2.5039167404174805, 2.743124008178711, 2.9823312759399414, 3.2215383052825928, 3.4607455730438232, 3.6999526023864746, 3.939159870147705, 4.1783671379089355, 4.417573928833008, 4.656781196594238, 4.895988464355469, 5.135195732116699, 5.37440299987793, 5.61361026763916, 5.852817058563232, 6.092024326324463, 6.331231594085693, 6.570438861846924, 6.809645652770996, 7.048852920532227]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 5.0, 2.0, 8.0, 6.0, 8.0, 9.0, 9.0, 15.0, 13.0, 13.0, 15.0, 26.0, 31.0, 28.0, 31.0, 30.0, 40.0, 40.0, 65.0, 67.0, 83.0, 77.0, 57.0, 45.0, 44.0, 37.0, 41.0, 26.0, 29.0, 19.0, 22.0, 9.0, 8.0, 10.0, 8.0, 5.0, 7.0, 3.0, 5.0, 2.0, 7.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0791754722595215, -2.9541518688201904, -2.8291280269622803, -2.704104423522949, -2.579080581665039, -2.454056978225708, -2.329033374786377, -2.204009532928467, -2.0789859294891357, -1.9539622068405151, -1.8289384841918945, -1.7039148807525635, -1.5788911581039429, -1.4538674354553223, -1.3288438320159912, -1.2038201093673706, -1.07879638671875, -0.9537726640701294, -0.8287490010261536, -0.7037253379821777, -0.5787016153335571, -0.4536778926849365, -0.3286542296409607, -0.20363056659698486, -0.07860684394836426, 0.04641684889793396, 0.17144054174423218, 0.2964642345905304, 0.4214879274368286, 0.5465116500854492, 0.671535313129425, 0.7965589761734009, 0.9215826988220215, 1.046606421470642, 1.1716301441192627, 1.2966537475585938, 1.4216774702072144, 1.546701192855835, 1.671724796295166, 1.7967485189437866, 1.9217722415924072, 2.0467958450317383, 2.1718196868896484, 2.2968432903289795, 2.4218668937683105, 2.5468907356262207, 2.6719143390655518, 2.796937942504883, 2.921961784362793, 3.046985387802124, 3.172009229660034, 3.2970328330993652, 3.4220566749572754, 3.5470802783966064, 3.6721038818359375, 3.7971277236938477, 3.9221513271331787, 4.04717493057251, 4.17219877243042, 4.29722261428833, 4.422245979309082, 4.547269821166992, 4.672293663024902, 4.797317028045654, 4.9223408699035645]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 10.0, 11.0, 13.0, 25.0, 55.0, 48.0, 99.0, 168.0, 269.0, 467.0, 911.0, 1771.0, 3979.0, 10318.0, 35348.0, 174758.0, 1200977.0, 2308878.0, 364592.0, 63651.0, 16752.0, 5890.0, 2585.0, 1171.0, 636.0, 366.0, 195.0, 135.0, 88.0, 45.0, 32.0, 11.0, 10.0, 7.0, 9.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.322265625, -0.3122596740722656, -0.30225372314453125, -0.2922477722167969, -0.2822418212890625, -0.2722358703613281, -0.26222991943359375, -0.2522239685058594, -0.242218017578125, -0.23221206665039062, -0.22220611572265625, -0.21220016479492188, -0.2021942138671875, -0.19218826293945312, -0.18218231201171875, -0.17217636108398438, -0.16217041015625, -0.15216445922851562, -0.14215850830078125, -0.13215255737304688, -0.1221466064453125, -0.11214065551757812, -0.10213470458984375, -0.09212875366210938, -0.082122802734375, -0.07211685180664062, -0.06211090087890625, -0.052104949951171875, -0.0420989990234375, -0.032093048095703125, -0.02208709716796875, -0.012081146240234375, -0.0020751953125, 0.007930755615234375, 0.01793670654296875, 0.027942657470703125, 0.0379486083984375, 0.047954559326171875, 0.05796051025390625, 0.06796646118164062, 0.077972412109375, 0.08797836303710938, 0.09798431396484375, 0.10799026489257812, 0.1179962158203125, 0.12800216674804688, 0.13800811767578125, 0.14801406860351562, 0.15802001953125, 0.16802597045898438, 0.17803192138671875, 0.18803787231445312, 0.1980438232421875, 0.20804977416992188, 0.21805572509765625, 0.22806167602539062, 0.238067626953125, 0.24807357788085938, 0.25807952880859375, 0.2680854797363281, 0.2780914306640625, 0.2880973815917969, 0.29810333251953125, 0.3081092834472656, 0.318115234375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 2.0, 6.0, 11.0, 10.0, 15.0, 14.0, 20.0, 16.0, 23.0, 25.0, 23.0, 28.0, 29.0, 41.0, 40.0, 52.0, 37.0, 50.0, 61.0, 53.0, 47.0, 47.0, 45.0, 43.0, 34.0, 37.0, 33.0, 30.0, 25.0, 21.0, 12.0, 17.0, 12.0, 6.0, 10.0, 8.0, 5.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.281982421875, -0.27381324768066406, -0.2656440734863281, -0.2574748992919922, -0.24930572509765625, -0.2411365509033203, -0.23296737670898438, -0.22479820251464844, -0.2166290283203125, -0.20845985412597656, -0.20029067993164062, -0.1921215057373047, -0.18395233154296875, -0.1757831573486328, -0.16761398315429688, -0.15944480895996094, -0.151275634765625, -0.14310646057128906, -0.13493728637695312, -0.1267681121826172, -0.11859893798828125, -0.11042976379394531, -0.10226058959960938, -0.09409141540527344, -0.0859222412109375, -0.07775306701660156, -0.06958389282226562, -0.06141471862792969, -0.05324554443359375, -0.04507637023925781, -0.036907196044921875, -0.028738021850585938, -0.02056884765625, -0.012399673461914062, -0.004230499267578125, 0.0039386749267578125, 0.01210784912109375, 0.020277023315429688, 0.028446197509765625, 0.03661537170410156, 0.0447845458984375, 0.05295372009277344, 0.061122894287109375, 0.06929206848144531, 0.07746124267578125, 0.08563041687011719, 0.09379959106445312, 0.10196876525878906, 0.110137939453125, 0.11830711364746094, 0.12647628784179688, 0.1346454620361328, 0.14281463623046875, 0.1509838104248047, 0.15915298461914062, 0.16732215881347656, 0.1754913330078125, 0.18366050720214844, 0.19182968139648438, 0.1999988555908203, 0.20816802978515625, 0.2163372039794922, 0.22450637817382812, 0.23267555236816406, 0.2408447265625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 9.0, 12.0, 31.0, 108.0, 552.0, 6243.0, 3934442.0, 250120.0, 2320.0, 301.0, 84.0, 29.0, 15.0, 7.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8876953125, -1.8222198486328125, -1.756744384765625, -1.6912689208984375, -1.62579345703125, -1.5603179931640625, -1.494842529296875, -1.4293670654296875, -1.3638916015625, -1.2984161376953125, -1.232940673828125, -1.1674652099609375, -1.10198974609375, -1.0365142822265625, -0.971038818359375, -0.9055633544921875, -0.840087890625, -0.7746124267578125, -0.709136962890625, -0.6436614990234375, -0.57818603515625, -0.5127105712890625, -0.447235107421875, -0.3817596435546875, -0.3162841796875, -0.2508087158203125, -0.185333251953125, -0.1198577880859375, -0.05438232421875, 0.0110931396484375, 0.076568603515625, 0.1420440673828125, 0.20751953125, 0.2729949951171875, 0.338470458984375, 0.4039459228515625, 0.46942138671875, 0.5348968505859375, 0.600372314453125, 0.6658477783203125, 0.7313232421875, 0.7967987060546875, 0.862274169921875, 0.9277496337890625, 0.99322509765625, 1.0587005615234375, 1.124176025390625, 1.1896514892578125, 1.255126953125, 1.3206024169921875, 1.386077880859375, 1.4515533447265625, 1.51702880859375, 1.5825042724609375, 1.647979736328125, 1.7134552001953125, 1.7789306640625, 1.8444061279296875, 1.909881591796875, 1.9753570556640625, 2.04083251953125, 2.1063079833984375, 2.171783447265625, 2.2372589111328125, 2.302734375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 10.0, 7.0, 10.0, 20.0, 33.0, 39.0, 69.0, 107.0, 232.0, 456.0, 831.0, 983.0, 577.0, 298.0, 151.0, 91.0, 61.0, 28.0, 22.0, 14.0, 12.0, 11.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68408203125, -0.66143798828125, -0.6387939453125, -0.61614990234375, -0.593505859375, -0.57086181640625, -0.5482177734375, -0.52557373046875, -0.5029296875, -0.48028564453125, -0.4576416015625, -0.43499755859375, -0.412353515625, -0.38970947265625, -0.3670654296875, -0.34442138671875, -0.32177734375, -0.29913330078125, -0.2764892578125, -0.25384521484375, -0.231201171875, -0.20855712890625, -0.1859130859375, -0.16326904296875, -0.140625, -0.11798095703125, -0.0953369140625, -0.07269287109375, -0.050048828125, -0.02740478515625, -0.0047607421875, 0.01788330078125, 0.04052734375, 0.06317138671875, 0.0858154296875, 0.10845947265625, 0.131103515625, 0.15374755859375, 0.1763916015625, 0.19903564453125, 0.2216796875, 0.24432373046875, 0.2669677734375, 0.28961181640625, 0.312255859375, 0.33489990234375, 0.3575439453125, 0.38018798828125, 0.40283203125, 0.42547607421875, 0.4481201171875, 0.47076416015625, 0.493408203125, 0.51605224609375, 0.5386962890625, 0.56134033203125, 0.583984375, 0.60662841796875, 0.6292724609375, 0.65191650390625, 0.674560546875, 0.69720458984375, 0.7198486328125, 0.74249267578125, 0.76513671875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 7.0, 12.0, 18.0, 23.0, 39.0, 62.0, 89.0, 131.0, 143.0, 159.0, 112.0, 76.0, 40.0, 31.0, 16.0, 12.0, 6.0, 7.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5388402938842773, -2.4306893348693848, -2.322538137435913, -2.2143871784210205, -2.106235980987549, -1.9980850219726562, -1.8899340629577637, -1.7817829847335815, -1.6736319065093994, -1.5654808282852173, -1.4573297500610352, -1.3491787910461426, -1.2410277128219604, -1.1328766345977783, -1.0247256755828857, -0.9165745973587036, -0.8084235191345215, -0.7002724409103394, -0.592121422290802, -0.48397037386894226, -0.3758193254470825, -0.2676682472229004, -0.15951722860336304, -0.051366209983825684, 0.056784868240356445, 0.1649359166622162, 0.2730869650840759, 0.38123801350593567, 0.4893890619277954, 0.5975401401519775, 0.7056911587715149, 0.8138421773910522, 0.9219932556152344, 1.0301443338394165, 1.1382954120635986, 1.2464463710784912, 1.3545974493026733, 1.4627485275268555, 1.570899486541748, 1.6790505647659302, 1.7872016429901123, 1.8953527212142944, 2.0035037994384766, 2.111654758453369, 2.2198057174682617, 2.3279569149017334, 2.436107873916626, 2.5442590713500977, 2.6524100303649902, 2.760560989379883, 2.8687121868133545, 2.976863145828247, 3.0850143432617188, 3.1931653022766113, 3.301316261291504, 3.4094672203063965, 3.517618417739868, 3.6257693767547607, 3.7339205741882324, 3.842071533203125, 3.9502224922180176, 4.05837345123291, 4.166524887084961, 4.2746758460998535, 4.382826805114746]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 15.0, 3.0, 10.0, 17.0, 15.0, 18.0, 28.0, 25.0, 39.0, 32.0, 37.0, 50.0, 54.0, 74.0, 72.0, 57.0, 54.0, 46.0, 47.0, 38.0, 42.0, 40.0, 27.0, 25.0, 22.0, 18.0, 27.0, 14.0, 11.0, 15.0, 10.0, 5.0, 1.0, 1.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.853916645050049, -2.7687692642211914, -2.683621883392334, -2.5984745025634766, -2.51332688331604, -2.4281795024871826, -2.343032121658325, -2.2578847408294678, -2.1727373600006104, -2.087589979171753, -2.0024425983428955, -1.9172950983047485, -1.8321477174758911, -1.7470002174377441, -1.6618528366088867, -1.5767054557800293, -1.4915579557418823, -1.406410574913025, -1.321263074874878, -1.2361156940460205, -1.150968313217163, -1.0658209323883057, -0.9806734323501587, -0.8955260515213013, -0.8103786110877991, -0.7252311706542969, -0.6400837898254395, -0.5549363493919373, -0.46978893876075745, -0.38464152812957764, -0.29949408769607544, -0.21434670686721802, -0.12919926643371582, -0.044051848351955414, 0.04109556972980499, 0.126242995262146, 0.2113904058933258, 0.2965378165245056, 0.3816852569580078, 0.46683263778686523, 0.5519800782203674, 0.6371275186538696, 0.722274899482727, 0.8074223399162292, 0.8925697803497314, 0.9777171611785889, 1.0628645420074463, 1.1480119228363037, 1.2331594228744507, 1.318306803703308, 1.403454303741455, 1.4886016845703125, 1.57374906539917, 1.6588964462280273, 1.7440439462661743, 1.8291913270950317, 1.9143388271331787, 1.9994862079620361, 2.0846335887908936, 2.16978120803833, 2.2549285888671875, 2.340075969696045, 2.4252233505249023, 2.5103707313537598, 2.595518112182617]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 4.0, 5.0, 8.0, 13.0, 18.0, 30.0, 33.0, 33.0, 61.0, 104.0, 180.0, 216.0, 408.0, 671.0, 1210.0, 2245.0, 4590.0, 10402.0, 24352.0, 64518.0, 210695.0, 452918.0, 179071.0, 56675.0, 21801.0, 9141.0, 4306.0, 2101.0, 1093.0, 648.0, 362.0, 248.0, 127.0, 90.0, 69.0, 37.0, 23.0, 17.0, 10.0, 6.0, 8.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.354248046875, -0.3433265686035156, -0.33240509033203125, -0.3214836120605469, -0.3105621337890625, -0.2996406555175781, -0.28871917724609375, -0.2777976989746094, -0.266876220703125, -0.2559547424316406, -0.24503326416015625, -0.23411178588867188, -0.2231903076171875, -0.21226882934570312, -0.20134735107421875, -0.19042587280273438, -0.17950439453125, -0.16858291625976562, -0.15766143798828125, -0.14673995971679688, -0.1358184814453125, -0.12489700317382812, -0.11397552490234375, -0.10305404663085938, -0.092132568359375, -0.08121109008789062, -0.07028961181640625, -0.059368133544921875, -0.0484466552734375, -0.037525177001953125, -0.02660369873046875, -0.015682220458984375, -0.0047607421875, 0.006160736083984375, 0.01708221435546875, 0.028003692626953125, 0.0389251708984375, 0.049846649169921875, 0.06076812744140625, 0.07168960571289062, 0.082611083984375, 0.09353256225585938, 0.10445404052734375, 0.11537551879882812, 0.1262969970703125, 0.13721847534179688, 0.14813995361328125, 0.15906143188476562, 0.16998291015625, 0.18090438842773438, 0.19182586669921875, 0.20274734497070312, 0.2136688232421875, 0.22459030151367188, 0.23551177978515625, 0.24643325805664062, 0.257354736328125, 0.2682762145996094, 0.27919769287109375, 0.2901191711425781, 0.3010406494140625, 0.3119621276855469, 0.32288360595703125, 0.3338050842285156, 0.3447265625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 2.0, 2.0, 7.0, 10.0, 18.0, 11.0, 23.0, 16.0, 28.0, 28.0, 27.0, 37.0, 40.0, 42.0, 50.0, 47.0, 54.0, 64.0, 64.0, 48.0, 58.0, 64.0, 45.0, 33.0, 36.0, 29.0, 29.0, 31.0, 11.0, 14.0, 10.0, 7.0, 4.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.347412109375, -0.3376502990722656, -0.32788848876953125, -0.3181266784667969, -0.3083648681640625, -0.2986030578613281, -0.28884124755859375, -0.2790794372558594, -0.269317626953125, -0.2595558166503906, -0.24979400634765625, -0.24003219604492188, -0.2302703857421875, -0.22050857543945312, -0.21074676513671875, -0.20098495483398438, -0.19122314453125, -0.18146133422851562, -0.17169952392578125, -0.16193771362304688, -0.1521759033203125, -0.14241409301757812, -0.13265228271484375, -0.12289047241210938, -0.113128662109375, -0.10336685180664062, -0.09360504150390625, -0.08384323120117188, -0.0740814208984375, -0.06431961059570312, -0.05455780029296875, -0.044795989990234375, -0.0350341796875, -0.025272369384765625, -0.01551055908203125, -0.005748748779296875, 0.0040130615234375, 0.013774871826171875, 0.02353668212890625, 0.033298492431640625, 0.043060302734375, 0.052822113037109375, 0.06258392333984375, 0.07234573364257812, 0.0821075439453125, 0.09186935424804688, 0.10163116455078125, 0.11139297485351562, 0.12115478515625, 0.13091659545898438, 0.14067840576171875, 0.15044021606445312, 0.1602020263671875, 0.16996383666992188, 0.17972564697265625, 0.18948745727539062, 0.199249267578125, 0.20901107788085938, 0.21877288818359375, 0.22853469848632812, 0.2382965087890625, 0.24805831909179688, 0.25782012939453125, 0.2675819396972656, 0.27734375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 4.0, 8.0, 5.0, 14.0, 15.0, 28.0, 29.0, 57.0, 79.0, 133.0, 224.0, 464.0, 874.0, 2344.0, 9693.0, 89059.0, 869624.0, 64054.0, 8080.0, 1985.0, 774.0, 403.0, 213.0, 137.0, 71.0, 58.0, 30.0, 32.0, 13.0, 9.0, 10.0, 7.0, 6.0, 7.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.99365234375, -0.9663848876953125, -0.939117431640625, -0.9118499755859375, -0.88458251953125, -0.8573150634765625, -0.830047607421875, -0.8027801513671875, -0.7755126953125, -0.7482452392578125, -0.720977783203125, -0.6937103271484375, -0.66644287109375, -0.6391754150390625, -0.611907958984375, -0.5846405029296875, -0.557373046875, -0.5301055908203125, -0.502838134765625, -0.4755706787109375, -0.44830322265625, -0.4210357666015625, -0.393768310546875, -0.3665008544921875, -0.3392333984375, -0.3119659423828125, -0.284698486328125, -0.2574310302734375, -0.23016357421875, -0.2028961181640625, -0.175628662109375, -0.1483612060546875, -0.12109375, -0.0938262939453125, -0.066558837890625, -0.0392913818359375, -0.01202392578125, 0.0152435302734375, 0.042510986328125, 0.0697784423828125, 0.0970458984375, 0.1243133544921875, 0.151580810546875, 0.1788482666015625, 0.20611572265625, 0.2333831787109375, 0.260650634765625, 0.2879180908203125, 0.315185546875, 0.3424530029296875, 0.369720458984375, 0.3969879150390625, 0.42425537109375, 0.4515228271484375, 0.478790283203125, 0.5060577392578125, 0.5333251953125, 0.5605926513671875, 0.587860107421875, 0.6151275634765625, 0.64239501953125, 0.6696624755859375, 0.696929931640625, 0.7241973876953125, 0.75146484375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 9.0, 10.0, 7.0, 9.0, 8.0, 14.0, 16.0, 19.0, 20.0, 29.0, 30.0, 45.0, 50.0, 53.0, 56.0, 62.0, 52.0, 63.0, 52.0, 53.0, 43.0, 39.0, 31.0, 24.0, 45.0, 22.0, 24.0, 14.0, 27.0, 21.0, 12.0, 7.0, 4.0, 4.0, 6.0, 3.0, 5.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1435546875, -1.1089630126953125, -1.074371337890625, -1.0397796630859375, -1.00518798828125, -0.9705963134765625, -0.936004638671875, -0.9014129638671875, -0.8668212890625, -0.8322296142578125, -0.797637939453125, -0.7630462646484375, -0.72845458984375, -0.6938629150390625, -0.659271240234375, -0.6246795654296875, -0.590087890625, -0.5554962158203125, -0.520904541015625, -0.4863128662109375, -0.45172119140625, -0.4171295166015625, -0.382537841796875, -0.3479461669921875, -0.3133544921875, -0.2787628173828125, -0.244171142578125, -0.2095794677734375, -0.17498779296875, -0.1403961181640625, -0.105804443359375, -0.0712127685546875, -0.03662109375, -0.0020294189453125, 0.032562255859375, 0.0671539306640625, 0.10174560546875, 0.1363372802734375, 0.170928955078125, 0.2055206298828125, 0.2401123046875, 0.2747039794921875, 0.309295654296875, 0.3438873291015625, 0.37847900390625, 0.4130706787109375, 0.447662353515625, 0.4822540283203125, 0.516845703125, 0.5514373779296875, 0.586029052734375, 0.6206207275390625, 0.65521240234375, 0.6898040771484375, 0.724395751953125, 0.7589874267578125, 0.7935791015625, 0.8281707763671875, 0.862762451171875, 0.8973541259765625, 0.93194580078125, 0.9665374755859375, 1.001129150390625, 1.0357208251953125, 1.0703125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 5.0, 3.0, 4.0, 8.0, 7.0, 9.0, 4.0, 16.0, 18.0, 30.0, 50.0, 82.0, 117.0, 216.0, 470.0, 1265.0, 3535.0, 12451.0, 64402.0, 806059.0, 132405.0, 19207.0, 5170.0, 1676.0, 615.0, 287.0, 155.0, 88.0, 50.0, 38.0, 22.0, 20.0, 14.0, 9.0, 10.0, 12.0, 5.0, 1.0, 2.0, 3.0, 4.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.2232666015625, -0.21663284301757812, -0.20999908447265625, -0.20336532592773438, -0.1967315673828125, -0.19009780883789062, -0.18346405029296875, -0.17683029174804688, -0.170196533203125, -0.16356277465820312, -0.15692901611328125, -0.15029525756835938, -0.1436614990234375, -0.13702774047851562, -0.13039398193359375, -0.12376022338867188, -0.11712646484375, -0.11049270629882812, -0.10385894775390625, -0.09722518920898438, -0.0905914306640625, -0.08395767211914062, -0.07732391357421875, -0.07069015502929688, -0.064056396484375, -0.057422637939453125, -0.05078887939453125, -0.044155120849609375, -0.0375213623046875, -0.030887603759765625, -0.02425384521484375, -0.017620086669921875, -0.010986328125, -0.004352569580078125, 0.00228118896484375, 0.008914947509765625, 0.0155487060546875, 0.022182464599609375, 0.02881622314453125, 0.035449981689453125, 0.042083740234375, 0.048717498779296875, 0.05535125732421875, 0.061985015869140625, 0.0686187744140625, 0.07525253295898438, 0.08188629150390625, 0.08852005004882812, 0.09515380859375, 0.10178756713867188, 0.10842132568359375, 0.11505508422851562, 0.1216888427734375, 0.12832260131835938, 0.13495635986328125, 0.14159011840820312, 0.148223876953125, 0.15485763549804688, 0.16149139404296875, 0.16812515258789062, 0.1747589111328125, 0.18139266967773438, 0.18802642822265625, 0.19466018676757812, 0.2012939453125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 1.0, 3.0, 7.0, 3.0, 11.0, 10.0, 16.0, 20.0, 32.0, 44.0, 89.0, 140.0, 174.0, 186.0, 98.0, 55.0, 40.0, 21.0, 17.0, 4.0, 9.0, 8.0, 4.0, 1.0, 5.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.617473602294922e-05, -7.296167314052582e-05, -6.974861025810242e-05, -6.653554737567902e-05, -6.332248449325562e-05, -6.0109421610832214e-05, -5.6896358728408813e-05, -5.368329584598541e-05, -5.047023296356201e-05, -4.725717008113861e-05, -4.404410719871521e-05, -4.083104431629181e-05, -3.761798143386841e-05, -3.440491855144501e-05, -3.1191855669021606e-05, -2.7978792786598206e-05, -2.4765729904174805e-05, -2.1552667021751404e-05, -1.8339604139328003e-05, -1.5126541256904602e-05, -1.1913478374481201e-05, -8.7004154920578e-06, -5.487352609634399e-06, -2.2742897272109985e-06, 9.387731552124023e-07, 4.151836037635803e-06, 7.364898920059204e-06, 1.0577961802482605e-05, 1.3791024684906006e-05, 1.7004087567329407e-05, 2.0217150449752808e-05, 2.343021333217621e-05, 2.664327621459961e-05, 2.985633909702301e-05, 3.306940197944641e-05, 3.628246486186981e-05, 3.949552774429321e-05, 4.2708590626716614e-05, 4.5921653509140015e-05, 4.9134716391563416e-05, 5.2347779273986816e-05, 5.556084215641022e-05, 5.877390503883362e-05, 6.198696792125702e-05, 6.520003080368042e-05, 6.841309368610382e-05, 7.162615656852722e-05, 7.483921945095062e-05, 7.805228233337402e-05, 8.126534521579742e-05, 8.447840809822083e-05, 8.769147098064423e-05, 9.090453386306763e-05, 9.411759674549103e-05, 9.733065962791443e-05, 0.00010054372251033783, 0.00010375678539276123, 0.00010696984827518463, 0.00011018291115760803, 0.00011339597404003143, 0.00011660903692245483, 0.00011982209980487823, 0.00012303516268730164, 0.00012624822556972504, 0.00012946128845214844]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 6.0, 3.0, 12.0, 11.0, 25.0, 24.0, 43.0, 62.0, 116.0, 197.0, 341.0, 696.0, 1490.0, 4054.0, 14013.0, 72486.0, 755738.0, 163064.0, 25443.0, 6534.0, 2168.0, 901.0, 460.0, 245.0, 153.0, 97.0, 58.0, 43.0, 26.0, 17.0, 8.0, 4.0, 6.0, 0.0, 6.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2064208984375, -0.20010757446289062, -0.19379425048828125, -0.18748092651367188, -0.1811676025390625, -0.17485427856445312, -0.16854095458984375, -0.16222763061523438, -0.155914306640625, -0.14960098266601562, -0.14328765869140625, -0.13697433471679688, -0.1306610107421875, -0.12434768676757812, -0.11803436279296875, -0.11172103881835938, -0.10540771484375, -0.09909439086914062, -0.09278106689453125, -0.08646774291992188, -0.0801544189453125, -0.07384109497070312, -0.06752777099609375, -0.061214447021484375, -0.054901123046875, -0.048587799072265625, -0.04227447509765625, -0.035961151123046875, -0.0296478271484375, -0.023334503173828125, -0.01702117919921875, -0.010707855224609375, -0.00439453125, 0.001918792724609375, 0.00823211669921875, 0.014545440673828125, 0.0208587646484375, 0.027172088623046875, 0.03348541259765625, 0.039798736572265625, 0.046112060546875, 0.052425384521484375, 0.05873870849609375, 0.06505203247070312, 0.0713653564453125, 0.07767868041992188, 0.08399200439453125, 0.09030532836914062, 0.09661865234375, 0.10293197631835938, 0.10924530029296875, 0.11555862426757812, 0.1218719482421875, 0.12818527221679688, 0.13449859619140625, 0.14081192016601562, 0.147125244140625, 0.15343856811523438, 0.15975189208984375, 0.16606521606445312, 0.1723785400390625, 0.17869186401367188, 0.18500518798828125, 0.19131851196289062, 0.1976318359375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 5.0, 1.0, 3.0, 4.0, 4.0, 7.0, 10.0, 6.0, 11.0, 7.0, 5.0, 16.0, 17.0, 23.0, 18.0, 34.0, 27.0, 54.0, 64.0, 86.0, 99.0, 86.0, 89.0, 74.0, 59.0, 41.0, 25.0, 32.0, 22.0, 8.0, 9.0, 10.0, 10.0, 6.0, 9.0, 6.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1591796875, -0.15387916564941406, -0.14857864379882812, -0.1432781219482422, -0.13797760009765625, -0.1326770782470703, -0.12737655639648438, -0.12207603454589844, -0.1167755126953125, -0.11147499084472656, -0.10617446899414062, -0.10087394714355469, -0.09557342529296875, -0.09027290344238281, -0.08497238159179688, -0.07967185974121094, -0.074371337890625, -0.06907081604003906, -0.06377029418945312, -0.05846977233886719, -0.05316925048828125, -0.04786872863769531, -0.042568206787109375, -0.03726768493652344, -0.0319671630859375, -0.026666641235351562, -0.021366119384765625, -0.016065597534179688, -0.01076507568359375, -0.0054645538330078125, -0.000164031982421875, 0.0051364898681640625, 0.01043701171875, 0.015737533569335938, 0.021038055419921875, 0.026338577270507812, 0.03163909912109375, 0.03693962097167969, 0.042240142822265625, 0.04754066467285156, 0.0528411865234375, 0.05814170837402344, 0.06344223022460938, 0.06874275207519531, 0.07404327392578125, 0.07934379577636719, 0.08464431762695312, 0.08994483947753906, 0.095245361328125, 0.10054588317871094, 0.10584640502929688, 0.11114692687988281, 0.11644744873046875, 0.12174797058105469, 0.12704849243164062, 0.13234901428222656, 0.1376495361328125, 0.14295005798339844, 0.14825057983398438, 0.1535511016845703, 0.15885162353515625, 0.1641521453857422, 0.16945266723632812, 0.17475318908691406, 0.1800537109375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 8.0, 13.0, 42.0, 139.0, 482.0, 227.0, 62.0, 19.0, 8.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.384860038757324, -8.045254707336426, -7.7056498527526855, -7.366044998168945, -7.026439666748047, -6.686834335327148, -6.347229480743408, -6.007624626159668, -5.6680192947387695, -5.328413963317871, -4.988809108734131, -4.649204254150391, -4.309598922729492, -3.969993829727173, -3.6303887367248535, -3.290783643722534, -2.951178550720215, -2.6115734577178955, -2.271968364715576, -1.9323632717132568, -1.5927581787109375, -1.2531530857086182, -0.9135479927062988, -0.5739428997039795, -0.23433780670166016, 0.10526728630065918, 0.4448723793029785, 0.7844774723052979, 1.1240825653076172, 1.4636876583099365, 1.8032927513122559, 2.142897844314575, 2.482501983642578, 2.8221070766448975, 3.161712169647217, 3.501317262649536, 3.8409223556518555, 4.180527687072754, 4.520132541656494, 4.859737396240234, 5.199342727661133, 5.538948059082031, 5.8785529136657715, 6.218157768249512, 6.55776309967041, 6.897368431091309, 7.236973285675049, 7.576578140258789, 7.9161834716796875, 8.255788803100586, 8.595394134521484, 8.934998512268066, 9.274603843688965, 9.614209175109863, 9.953813552856445, 10.293418884277344, 10.633024215698242, 10.97262954711914, 11.312234878540039, 11.651839256286621, 11.99144458770752, 12.331049919128418, 12.670654296875, 13.010259628295898, 13.349864959716797]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 4.0, 6.0, 5.0, 7.0, 7.0, 9.0, 14.0, 13.0, 17.0, 23.0, 21.0, 32.0, 30.0, 30.0, 54.0, 57.0, 85.0, 114.0, 108.0, 66.0, 44.0, 28.0, 31.0, 31.0, 26.0, 26.0, 15.0, 29.0, 13.0, 8.0, 10.0, 8.0, 8.0, 6.0, 5.0, 2.0, 4.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.308422565460205, -4.158952236175537, -4.009481906890869, -3.8600118160247803, -3.7105417251586914, -3.5610713958740234, -3.4116010665893555, -3.2621307373046875, -3.1126606464385986, -2.9631903171539307, -2.813720226287842, -2.664249897003174, -2.514779567718506, -2.365309476852417, -2.215839147567749, -2.06636905670166, -1.9168987274169922, -1.7674285173416138, -1.6179583072662354, -1.4684879779815674, -1.319017767906189, -1.1695475578308105, -1.0200772285461426, -0.8706070184707642, -0.7211368083953857, -0.5716665983200073, -0.42219632863998413, -0.2727260887622833, -0.12325584888458252, 0.0262143611907959, 0.1756846308708191, 0.3251549005508423, 0.4746255874633789, 0.6240957975387573, 0.7735660672187805, 0.9230363368988037, 1.0725065469741821, 1.2219767570495605, 1.3714470863342285, 1.520917296409607, 1.6703875064849854, 1.8198577165603638, 1.9693279266357422, 2.11879825592041, 2.268268585205078, 2.417738676071167, 2.567209005355835, 2.716679096221924, 2.866149425506592, 3.0156197547912598, 3.1650898456573486, 3.3145601749420166, 3.4640302658081055, 3.6135005950927734, 3.7629709243774414, 3.9124412536621094, 4.061911582946777, 4.211381912231445, 4.360852241516113, 4.510322093963623, 4.659792423248291, 4.809262752532959, 4.958733081817627, 5.108203411102295, 5.257673263549805]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 12.0, 17.0, 11.0, 37.0, 43.0, 89.0, 128.0, 234.0, 444.0, 821.0, 1814.0, 4525.0, 13142.0, 50328.0, 301216.0, 2157424.0, 1432920.0, 179593.0, 34435.0, 10140.0, 3633.0, 1560.0, 776.0, 408.0, 204.0, 125.0, 88.0, 32.0, 27.0, 24.0, 9.0, 6.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7275390625, -0.7078094482421875, -0.688079833984375, -0.6683502197265625, -0.64862060546875, -0.6288909912109375, -0.609161376953125, -0.5894317626953125, -0.5697021484375, -0.5499725341796875, -0.530242919921875, -0.5105133056640625, -0.49078369140625, -0.4710540771484375, -0.451324462890625, -0.4315948486328125, -0.411865234375, -0.3921356201171875, -0.372406005859375, -0.3526763916015625, -0.33294677734375, -0.3132171630859375, -0.293487548828125, -0.2737579345703125, -0.2540283203125, -0.2342987060546875, -0.214569091796875, -0.1948394775390625, -0.17510986328125, -0.1553802490234375, -0.135650634765625, -0.1159210205078125, -0.09619140625, -0.0764617919921875, -0.056732177734375, -0.0370025634765625, -0.01727294921875, 0.0024566650390625, 0.022186279296875, 0.0419158935546875, 0.0616455078125, 0.0813751220703125, 0.101104736328125, 0.1208343505859375, 0.14056396484375, 0.1602935791015625, 0.180023193359375, 0.1997528076171875, 0.219482421875, 0.2392120361328125, 0.258941650390625, 0.2786712646484375, 0.29840087890625, 0.3181304931640625, 0.337860107421875, 0.3575897216796875, 0.3773193359375, 0.3970489501953125, 0.416778564453125, 0.4365081787109375, 0.45623779296875, 0.4759674072265625, 0.495697021484375, 0.5154266357421875, 0.53515625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 12.0, 4.0, 12.0, 18.0, 14.0, 21.0, 17.0, 23.0, 24.0, 25.0, 35.0, 30.0, 34.0, 36.0, 42.0, 40.0, 52.0, 36.0, 59.0, 47.0, 44.0, 46.0, 41.0, 33.0, 33.0, 41.0, 28.0, 28.0, 27.0, 23.0, 12.0, 16.0, 14.0, 11.0, 7.0, 7.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2061767578125, -0.1982555389404297, -0.19033432006835938, -0.18241310119628906, -0.17449188232421875, -0.16657066345214844, -0.15864944458007812, -0.1507282257080078, -0.1428070068359375, -0.1348857879638672, -0.12696456909179688, -0.11904335021972656, -0.11112213134765625, -0.10320091247558594, -0.09527969360351562, -0.08735847473144531, -0.079437255859375, -0.07151603698730469, -0.06359481811523438, -0.05567359924316406, -0.04775238037109375, -0.03983116149902344, -0.031909942626953125, -0.023988723754882812, -0.0160675048828125, -0.008146286010742188, -0.000225067138671875, 0.0076961517333984375, 0.01561737060546875, 0.023538589477539062, 0.031459808349609375, 0.03938102722167969, 0.04730224609375, 0.05522346496582031, 0.06314468383789062, 0.07106590270996094, 0.07898712158203125, 0.08690834045410156, 0.09482955932617188, 0.10275077819824219, 0.1106719970703125, 0.11859321594238281, 0.12651443481445312, 0.13443565368652344, 0.14235687255859375, 0.15027809143066406, 0.15819931030273438, 0.1661205291748047, 0.174041748046875, 0.1819629669189453, 0.18988418579101562, 0.19780540466308594, 0.20572662353515625, 0.21364784240722656, 0.22156906127929688, 0.2294902801513672, 0.2374114990234375, 0.2453327178955078, 0.2532539367675781, 0.26117515563964844, 0.26909637451171875, 0.27701759338378906, 0.2849388122558594, 0.2928600311279297, 0.30078125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 5.0, 3.0, 1.0, 6.0, 8.0, 10.0, 24.0, 35.0, 85.0, 199.0, 645.0, 4463.0, 4133694.0, 53065.0, 1440.0, 325.0, 136.0, 64.0, 31.0, 16.0, 12.0, 8.0, 5.0, 1.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.09765625, -3.92510986328125, -3.7525634765625, -3.58001708984375, -3.407470703125, -3.23492431640625, -3.0623779296875, -2.88983154296875, -2.71728515625, -2.54473876953125, -2.3721923828125, -2.19964599609375, -2.027099609375, -1.85455322265625, -1.6820068359375, -1.50946044921875, -1.3369140625, -1.16436767578125, -0.9918212890625, -0.81927490234375, -0.646728515625, -0.47418212890625, -0.3016357421875, -0.12908935546875, 0.04345703125, 0.21600341796875, 0.3885498046875, 0.56109619140625, 0.733642578125, 0.90618896484375, 1.0787353515625, 1.25128173828125, 1.423828125, 1.59637451171875, 1.7689208984375, 1.94146728515625, 2.114013671875, 2.28656005859375, 2.4591064453125, 2.63165283203125, 2.80419921875, 2.97674560546875, 3.1492919921875, 3.32183837890625, 3.494384765625, 3.66693115234375, 3.8394775390625, 4.01202392578125, 4.1845703125, 4.35711669921875, 4.5296630859375, 4.70220947265625, 4.874755859375, 5.04730224609375, 5.2198486328125, 5.39239501953125, 5.56494140625, 5.73748779296875, 5.9100341796875, 6.08258056640625, 6.255126953125, 6.42767333984375, 6.6002197265625, 6.77276611328125, 6.9453125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 3.0, 4.0, 12.0, 19.0, 21.0, 31.0, 47.0, 61.0, 94.0, 155.0, 240.0, 381.0, 595.0, 746.0, 572.0, 368.0, 237.0, 152.0, 99.0, 75.0, 50.0, 32.0, 22.0, 13.0, 11.0, 8.0, 6.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.97119140625, -0.9344253540039062, -0.8976593017578125, -0.8608932495117188, -0.824127197265625, -0.7873611450195312, -0.7505950927734375, -0.7138290405273438, -0.67706298828125, -0.6402969360351562, -0.6035308837890625, -0.5667648315429688, -0.529998779296875, -0.49323272705078125, -0.4564666748046875, -0.41970062255859375, -0.3829345703125, -0.34616851806640625, -0.3094024658203125, -0.27263641357421875, -0.235870361328125, -0.19910430908203125, -0.1623382568359375, -0.12557220458984375, -0.08880615234375, -0.05204010009765625, -0.0152740478515625, 0.02149200439453125, 0.058258056640625, 0.09502410888671875, 0.1317901611328125, 0.16855621337890625, 0.205322265625, 0.24208831787109375, 0.2788543701171875, 0.31562042236328125, 0.352386474609375, 0.38915252685546875, 0.4259185791015625, 0.46268463134765625, 0.49945068359375, 0.5362167358398438, 0.5729827880859375, 0.6097488403320312, 0.646514892578125, 0.6832809448242188, 0.7200469970703125, 0.7568130493164062, 0.7935791015625, 0.8303451538085938, 0.8671112060546875, 0.9038772583007812, 0.940643310546875, 0.9774093627929688, 1.0141754150390625, 1.0509414672851562, 1.08770751953125, 1.1244735717773438, 1.1612396240234375, 1.1980056762695312, 1.234771728515625, 1.2715377807617188, 1.3083038330078125, 1.3450698852539062, 1.3818359375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 8.0, 11.0, 24.0, 88.0, 222.0, 312.0, 200.0, 70.0, 40.0, 12.0, 6.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.941831588745117, -27.28297233581543, -26.624113082885742, -25.965255737304688, -25.306396484375, -24.647537231445312, -23.988677978515625, -23.329818725585938, -22.67095947265625, -22.012100219726562, -21.353240966796875, -20.69438362121582, -20.035524368286133, -19.376665115356445, -18.717805862426758, -18.05894660949707, -17.400089263916016, -16.741230010986328, -16.08237075805664, -15.42351245880127, -14.764654159545898, -14.105794906616211, -13.446935653686523, -12.788076400756836, -12.129218101501465, -11.470358848571777, -10.811500549316406, -10.152641296386719, -9.493782043457031, -8.83492374420166, -8.176064491271973, -7.517205715179443, -6.858345031738281, -6.199486255645752, -5.540627479553223, -4.881768226623535, -4.222909450531006, -3.5640506744384766, -2.905191659927368, -2.2463326454162598, -1.5874738693237305, -0.9286149740219116, -0.2697560787200928, 0.3891028165817261, 1.047961711883545, 1.7068204879760742, 2.3656795024871826, 3.024538516998291, 3.6833972930908203, 4.34225606918335, 5.001114845275879, 5.659974098205566, 6.318832874298096, 6.977691650390625, 7.6365509033203125, 8.29541015625, 8.954268455505371, 9.613127708435059, 10.27198600769043, 10.930845260620117, 11.589704513549805, 12.248562812805176, 12.907422065734863, 13.566280364990234, 14.225139617919922]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 8.0, 5.0, 10.0, 2.0, 14.0, 12.0, 9.0, 11.0, 20.0, 29.0, 20.0, 32.0, 28.0, 41.0, 42.0, 44.0, 49.0, 47.0, 58.0, 60.0, 50.0, 51.0, 53.0, 40.0, 40.0, 30.0, 31.0, 31.0, 28.0, 20.0, 15.0, 15.0, 11.0, 4.0, 6.0, 5.0, 9.0, 4.0, 2.0, 6.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.890759468078613, -5.7161126136779785, -5.541465759277344, -5.366818904876709, -5.192172050476074, -5.0175251960754395, -4.842878341674805, -4.66823148727417, -4.493584632873535, -4.3189377784729, -4.144290924072266, -3.969644069671631, -3.794997215270996, -3.6203503608703613, -3.4457035064697266, -3.271056652069092, -3.096410036087036, -2.9217631816864014, -2.7471163272857666, -2.572469472885132, -2.397822618484497, -2.2231757640838623, -2.0485291481018066, -1.8738821744918823, -1.6992353200912476, -1.5245884656906128, -1.349941611289978, -1.1752948760986328, -1.000648021697998, -0.8260011076927185, -0.6513543128967285, -0.47670745849609375, -0.302060604095459, -0.1274137645959854, 0.04723307490348816, 0.22187989950180054, 0.3965267539024353, 0.5711736083030701, 0.7458204030990601, 0.9204672574996948, 1.0951141119003296, 1.2697609663009644, 1.4444078207015991, 1.6190545558929443, 1.793701410293579, 1.9683482646942139, 2.1429951190948486, 2.3176419734954834, 2.492288827896118, 2.666935682296753, 2.8415825366973877, 3.0162293910980225, 3.1908762454986572, 3.365523099899292, 3.5401697158813477, 3.7148165702819824, 3.889463424682617, 4.064110279083252, 4.238757133483887, 4.4134039878845215, 4.588050842285156, 4.762697696685791, 4.937344551086426, 5.1119914054870605, 5.286638259887695]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 10.0, 10.0, 21.0, 16.0, 46.0, 46.0, 96.0, 139.0, 184.0, 327.0, 556.0, 910.0, 1785.0, 3675.0, 8717.0, 24748.0, 93215.0, 564590.0, 269628.0, 51946.0, 15957.0, 5978.0, 2768.0, 1288.0, 722.0, 419.0, 259.0, 167.0, 108.0, 74.0, 49.0, 39.0, 17.0, 9.0, 11.0, 3.0, 5.0, 7.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.478271484375, -0.4632301330566406, -0.44818878173828125, -0.4331474304199219, -0.4181060791015625, -0.4030647277832031, -0.38802337646484375, -0.3729820251464844, -0.357940673828125, -0.3428993225097656, -0.32785797119140625, -0.3128166198730469, -0.2977752685546875, -0.2827339172363281, -0.26769256591796875, -0.2526512145996094, -0.23760986328125, -0.22256851196289062, -0.20752716064453125, -0.19248580932617188, -0.1774444580078125, -0.16240310668945312, -0.14736175537109375, -0.13232040405273438, -0.117279052734375, -0.10223770141601562, -0.08719635009765625, -0.07215499877929688, -0.0571136474609375, -0.042072296142578125, -0.02703094482421875, -0.011989593505859375, 0.0030517578125, 0.018093109130859375, 0.03313446044921875, 0.048175811767578125, 0.0632171630859375, 0.07825851440429688, 0.09329986572265625, 0.10834121704101562, 0.123382568359375, 0.13842391967773438, 0.15346527099609375, 0.16850662231445312, 0.1835479736328125, 0.19858932495117188, 0.21363067626953125, 0.22867202758789062, 0.24371337890625, 0.2587547302246094, 0.27379608154296875, 0.2888374328613281, 0.3038787841796875, 0.3189201354980469, 0.33396148681640625, 0.3490028381347656, 0.364044189453125, 0.3790855407714844, 0.39412689208984375, 0.4091682434082031, 0.4242095947265625, 0.4392509460449219, 0.45429229736328125, 0.4693336486816406, 0.484375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 3.0, 3.0, 7.0, 4.0, 9.0, 13.0, 11.0, 11.0, 18.0, 24.0, 24.0, 27.0, 35.0, 32.0, 37.0, 47.0, 55.0, 54.0, 43.0, 56.0, 72.0, 47.0, 62.0, 42.0, 44.0, 43.0, 35.0, 18.0, 19.0, 22.0, 15.0, 13.0, 9.0, 9.0, 12.0, 3.0, 4.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.430419921875, -0.4156761169433594, -0.40093231201171875, -0.3861885070800781, -0.3714447021484375, -0.3567008972167969, -0.34195709228515625, -0.3272132873535156, -0.312469482421875, -0.2977256774902344, -0.28298187255859375, -0.2682380676269531, -0.2534942626953125, -0.23875045776367188, -0.22400665283203125, -0.20926284790039062, -0.19451904296875, -0.17977523803710938, -0.16503143310546875, -0.15028762817382812, -0.1355438232421875, -0.12080001831054688, -0.10605621337890625, -0.09131240844726562, -0.076568603515625, -0.061824798583984375, -0.04708099365234375, -0.032337188720703125, -0.0175933837890625, -0.002849578857421875, 0.01189422607421875, 0.026638031005859375, 0.0413818359375, 0.056125640869140625, 0.07086944580078125, 0.08561325073242188, 0.1003570556640625, 0.11510086059570312, 0.12984466552734375, 0.14458847045898438, 0.159332275390625, 0.17407608032226562, 0.18881988525390625, 0.20356369018554688, 0.2183074951171875, 0.23305130004882812, 0.24779510498046875, 0.2625389099121094, 0.27728271484375, 0.2920265197753906, 0.30677032470703125, 0.3215141296386719, 0.3362579345703125, 0.3510017395019531, 0.36574554443359375, 0.3804893493652344, 0.395233154296875, 0.4099769592285156, 0.42472076416015625, 0.4394645690917969, 0.4542083740234375, 0.4689521789550781, 0.48369598388671875, 0.4984397888183594, 0.51318359375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 10.0, 9.0, 16.0, 22.0, 28.0, 68.0, 108.0, 157.0, 336.0, 839.0, 2558.0, 13864.0, 232703.0, 775370.0, 17671.0, 3041.0, 936.0, 381.0, 182.0, 102.0, 53.0, 38.0, 22.0, 9.0, 13.0, 6.0, 5.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7021484375, -0.67413330078125, -0.6461181640625, -0.61810302734375, -0.590087890625, -0.56207275390625, -0.5340576171875, -0.50604248046875, -0.47802734375, -0.45001220703125, -0.4219970703125, -0.39398193359375, -0.365966796875, -0.33795166015625, -0.3099365234375, -0.28192138671875, -0.25390625, -0.22589111328125, -0.1978759765625, -0.16986083984375, -0.141845703125, -0.11383056640625, -0.0858154296875, -0.05780029296875, -0.02978515625, -0.00177001953125, 0.0262451171875, 0.05426025390625, 0.082275390625, 0.11029052734375, 0.1383056640625, 0.16632080078125, 0.1943359375, 0.22235107421875, 0.2503662109375, 0.27838134765625, 0.306396484375, 0.33441162109375, 0.3624267578125, 0.39044189453125, 0.41845703125, 0.44647216796875, 0.4744873046875, 0.50250244140625, 0.530517578125, 0.55853271484375, 0.5865478515625, 0.61456298828125, 0.642578125, 0.67059326171875, 0.6986083984375, 0.72662353515625, 0.754638671875, 0.78265380859375, 0.8106689453125, 0.83868408203125, 0.86669921875, 0.89471435546875, 0.9227294921875, 0.95074462890625, 0.978759765625, 1.00677490234375, 1.0347900390625, 1.06280517578125, 1.0908203125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 6.0, 4.0, 8.0, 7.0, 16.0, 7.0, 18.0, 24.0, 16.0, 25.0, 42.0, 41.0, 60.0, 67.0, 75.0, 94.0, 92.0, 77.0, 72.0, 51.0, 46.0, 36.0, 24.0, 17.0, 13.0, 25.0, 6.0, 8.0, 13.0, 5.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.68359375, -1.616058349609375, -1.54852294921875, -1.480987548828125, -1.4134521484375, -1.345916748046875, -1.27838134765625, -1.210845947265625, -1.143310546875, -1.075775146484375, -1.00823974609375, -0.940704345703125, -0.8731689453125, -0.805633544921875, -0.73809814453125, -0.670562744140625, -0.60302734375, -0.535491943359375, -0.46795654296875, -0.400421142578125, -0.3328857421875, -0.265350341796875, -0.19781494140625, -0.130279541015625, -0.062744140625, 0.004791259765625, 0.07232666015625, 0.139862060546875, 0.2073974609375, 0.274932861328125, 0.34246826171875, 0.410003662109375, 0.4775390625, 0.545074462890625, 0.61260986328125, 0.680145263671875, 0.7476806640625, 0.815216064453125, 0.88275146484375, 0.950286865234375, 1.017822265625, 1.085357666015625, 1.15289306640625, 1.220428466796875, 1.2879638671875, 1.355499267578125, 1.42303466796875, 1.490570068359375, 1.55810546875, 1.625640869140625, 1.69317626953125, 1.760711669921875, 1.8282470703125, 1.895782470703125, 1.96331787109375, 2.030853271484375, 2.098388671875, 2.165924072265625, 2.23345947265625, 2.300994873046875, 2.3685302734375, 2.436065673828125, 2.50360107421875, 2.571136474609375, 2.638671875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 5.0, 9.0, 11.0, 21.0, 23.0, 36.0, 40.0, 64.0, 119.0, 159.0, 277.0, 451.0, 1004.0, 2345.0, 6581.0, 26226.0, 238226.0, 730183.0, 30650.0, 7249.0, 2502.0, 1022.0, 516.0, 276.0, 167.0, 120.0, 77.0, 49.0, 44.0, 22.0, 23.0, 14.0, 16.0, 13.0, 1.0, 3.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11279296875, -0.109039306640625, -0.10528564453125, -0.101531982421875, -0.0977783203125, -0.094024658203125, -0.09027099609375, -0.086517333984375, -0.082763671875, -0.079010009765625, -0.07525634765625, -0.071502685546875, -0.0677490234375, -0.063995361328125, -0.06024169921875, -0.056488037109375, -0.052734375, -0.048980712890625, -0.04522705078125, -0.041473388671875, -0.0377197265625, -0.033966064453125, -0.03021240234375, -0.026458740234375, -0.022705078125, -0.018951416015625, -0.01519775390625, -0.011444091796875, -0.0076904296875, -0.003936767578125, -0.00018310546875, 0.003570556640625, 0.00732421875, 0.011077880859375, 0.01483154296875, 0.018585205078125, 0.0223388671875, 0.026092529296875, 0.02984619140625, 0.033599853515625, 0.037353515625, 0.041107177734375, 0.04486083984375, 0.048614501953125, 0.0523681640625, 0.056121826171875, 0.05987548828125, 0.063629150390625, 0.0673828125, 0.071136474609375, 0.07489013671875, 0.078643798828125, 0.0823974609375, 0.086151123046875, 0.08990478515625, 0.093658447265625, 0.097412109375, 0.101165771484375, 0.10491943359375, 0.108673095703125, 0.1124267578125, 0.116180419921875, 0.11993408203125, 0.123687744140625, 0.12744140625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 1.0, 5.0, 9.0, 2.0, 1.0, 2.0, 3.0, 13.0, 16.0, 12.0, 24.0, 43.0, 22.0, 58.0, 59.0, 87.0, 103.0, 89.0, 99.0, 63.0, 62.0, 62.0, 31.0, 22.0, 24.0, 18.0, 17.0, 18.0, 9.0, 5.0, 4.0, 2.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.49879264831543e-05, -3.394670784473419e-05, -3.290548920631409e-05, -3.186427056789398e-05, -3.082305192947388e-05, -2.9781833291053772e-05, -2.8740614652633667e-05, -2.7699396014213562e-05, -2.6658177375793457e-05, -2.5616958737373352e-05, -2.4575740098953247e-05, -2.3534521460533142e-05, -2.2493302822113037e-05, -2.1452084183692932e-05, -2.0410865545272827e-05, -1.9369646906852722e-05, -1.8328428268432617e-05, -1.7287209630012512e-05, -1.6245990991592407e-05, -1.5204772353172302e-05, -1.4163553714752197e-05, -1.3122335076332092e-05, -1.2081116437911987e-05, -1.1039897799491882e-05, -9.998679161071777e-06, -8.957460522651672e-06, -7.916241884231567e-06, -6.875023245811462e-06, -5.833804607391357e-06, -4.7925859689712524e-06, -3.7513673305511475e-06, -2.7101486921310425e-06, -1.6689300537109375e-06, -6.277114152908325e-07, 4.1350722312927246e-07, 1.4547258615493774e-06, 2.4959444999694824e-06, 3.5371631383895874e-06, 4.578381776809692e-06, 5.619600415229797e-06, 6.660819053649902e-06, 7.702037692070007e-06, 8.743256330490112e-06, 9.784474968910217e-06, 1.0825693607330322e-05, 1.1866912245750427e-05, 1.2908130884170532e-05, 1.3949349522590637e-05, 1.4990568161010742e-05, 1.6031786799430847e-05, 1.7073005437850952e-05, 1.8114224076271057e-05, 1.9155442714691162e-05, 2.0196661353111267e-05, 2.1237879991531372e-05, 2.2279098629951477e-05, 2.3320317268371582e-05, 2.4361535906791687e-05, 2.5402754545211792e-05, 2.6443973183631897e-05, 2.7485191822052002e-05, 2.8526410460472107e-05, 2.9567629098892212e-05, 3.060884773731232e-05, 3.165006637573242e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 5.0, 5.0, 8.0, 5.0, 2.0, 3.0, 8.0, 10.0, 13.0, 10.0, 22.0, 28.0, 35.0, 40.0, 61.0, 95.0, 173.0, 249.0, 441.0, 837.0, 1678.0, 4093.0, 11000.0, 45005.0, 829688.0, 123472.0, 20139.0, 6206.0, 2586.0, 1146.0, 569.0, 319.0, 200.0, 103.0, 96.0, 55.0, 35.0, 33.0, 17.0, 11.0, 14.0, 9.0, 9.0, 6.0, 9.0, 2.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1396484375, -0.13478851318359375, -0.1299285888671875, -0.12506866455078125, -0.120208740234375, -0.11534881591796875, -0.1104888916015625, -0.10562896728515625, -0.10076904296875, -0.09590911865234375, -0.0910491943359375, -0.08618927001953125, -0.081329345703125, -0.07646942138671875, -0.0716094970703125, -0.06674957275390625, -0.0618896484375, -0.05702972412109375, -0.0521697998046875, -0.04730987548828125, -0.042449951171875, -0.03759002685546875, -0.0327301025390625, -0.02787017822265625, -0.02301025390625, -0.01815032958984375, -0.0132904052734375, -0.00843048095703125, -0.003570556640625, 0.00128936767578125, 0.0061492919921875, 0.01100921630859375, 0.015869140625, 0.02072906494140625, 0.0255889892578125, 0.03044891357421875, 0.035308837890625, 0.04016876220703125, 0.0450286865234375, 0.04988861083984375, 0.05474853515625, 0.05960845947265625, 0.0644683837890625, 0.06932830810546875, 0.074188232421875, 0.07904815673828125, 0.0839080810546875, 0.08876800537109375, 0.0936279296875, 0.09848785400390625, 0.1033477783203125, 0.10820770263671875, 0.113067626953125, 0.11792755126953125, 0.1227874755859375, 0.12764739990234375, 0.13250732421875, 0.13736724853515625, 0.1422271728515625, 0.14708709716796875, 0.151947021484375, 0.15680694580078125, 0.1616668701171875, 0.16652679443359375, 0.17138671875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 2.0, 4.0, 2.0, 11.0, 5.0, 11.0, 5.0, 7.0, 15.0, 16.0, 8.0, 16.0, 22.0, 49.0, 53.0, 92.0, 118.0, 110.0, 112.0, 75.0, 82.0, 55.0, 41.0, 20.0, 16.0, 10.0, 5.0, 7.0, 8.0, 5.0, 5.0, 5.0, 1.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1302490234375, -0.12499427795410156, -0.11973953247070312, -0.11448478698730469, -0.10923004150390625, -0.10397529602050781, -0.09872055053710938, -0.09346580505371094, -0.0882110595703125, -0.08295631408691406, -0.07770156860351562, -0.07244682312011719, -0.06719207763671875, -0.06193733215332031, -0.056682586669921875, -0.05142784118652344, -0.046173095703125, -0.04091835021972656, -0.035663604736328125, -0.030408859252929688, -0.02515411376953125, -0.019899368286132812, -0.014644622802734375, -0.009389877319335938, -0.0041351318359375, 0.0011196136474609375, 0.006374359130859375, 0.011629104614257812, 0.01688385009765625, 0.022138595581054688, 0.027393341064453125, 0.03264808654785156, 0.03790283203125, 0.04315757751464844, 0.048412322998046875, 0.05366706848144531, 0.05892181396484375, 0.06417655944824219, 0.06943130493164062, 0.07468605041503906, 0.0799407958984375, 0.08519554138183594, 0.09045028686523438, 0.09570503234863281, 0.10095977783203125, 0.10621452331542969, 0.11146926879882812, 0.11672401428222656, 0.121978759765625, 0.12723350524902344, 0.13248825073242188, 0.1377429962158203, 0.14299774169921875, 0.1482524871826172, 0.15350723266601562, 0.15876197814941406, 0.1640167236328125, 0.16927146911621094, 0.17452621459960938, 0.1797809600830078, 0.18503570556640625, 0.1902904510498047, 0.19554519653320312, 0.20079994201660156, 0.2060546875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 9.0, 11.0, 21.0, 20.0, 44.0, 95.0, 123.0, 193.0, 163.0, 128.0, 80.0, 42.0, 18.0, 16.0, 12.0, 9.0, 5.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.456381320953369, -5.315451145172119, -5.174521446228027, -5.033591270446777, -4.892661094665527, -4.7517313957214355, -4.6108012199401855, -4.469871520996094, -4.328941345214844, -4.188011169433594, -4.047081470489502, -3.906151294708252, -3.765221357345581, -3.62429141998291, -3.48336124420166, -3.3424313068389893, -3.2015013694763184, -3.0605714321136475, -2.9196414947509766, -2.7787113189697266, -2.6377813816070557, -2.4968514442443848, -2.3559212684631348, -2.214991331100464, -2.074061393737793, -1.933131456375122, -1.7922013998031616, -1.6512713432312012, -1.5103414058685303, -1.3694114685058594, -1.228481411933899, -1.0875513553619385, -0.9466209411621094, -0.8056909441947937, -0.664760947227478, -0.5238309502601624, -0.3829009532928467, -0.241970956325531, -0.10104095935821533, 0.03988903760910034, 0.18081903457641602, 0.3217490315437317, 0.46267902851104736, 0.603609025478363, 0.7445390224456787, 0.8854690194129944, 1.02639901638031, 1.1673290729522705, 1.3082590103149414, 1.4491889476776123, 1.5901190042495728, 1.7310490608215332, 1.871978998184204, 2.012908935546875, 2.153839111328125, 2.294769048690796, 2.435698986053467, 2.5766289234161377, 2.7175588607788086, 2.8584890365600586, 2.9994189739227295, 3.1403489112854004, 3.2812790870666504, 3.4222090244293213, 3.563138961791992]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 0.0, 5.0, 4.0, 6.0, 9.0, 13.0, 13.0, 16.0, 27.0, 34.0, 66.0, 72.0, 108.0, 82.0, 69.0, 69.0, 81.0, 83.0, 64.0, 58.0, 35.0, 27.0, 9.0, 8.0, 13.0, 12.0, 8.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.703159332275391, -4.507888317108154, -4.312617778778076, -4.11734676361084, -3.9220759868621826, -3.7268052101135254, -3.531534433364868, -3.336263656616211, -3.1409926414489746, -2.9457218647003174, -2.75045108795166, -2.555180072784424, -2.3599092960357666, -2.1646385192871094, -1.9693677425384521, -1.7740968465805054, -1.5788261890411377, -1.3835554122924805, -1.1882845163345337, -0.9930137395858765, -0.7977429032325745, -0.6024720668792725, -0.40720129013061523, -0.21193039417266846, -0.01665961742401123, 0.17861120402812958, 0.3738820254802704, 0.56915283203125, 0.764423668384552, 0.959694504737854, 1.1549652814865112, 1.350236177444458, 1.5455069541931152, 1.7407777309417725, 1.9360486268997192, 2.131319522857666, 2.3265902996063232, 2.5218610763549805, 2.7171318531036377, 2.912402629852295, 3.1076736450195312, 3.3029444217681885, 3.4982151985168457, 3.693486213684082, 3.8887569904327393, 4.0840277671813965, 4.279298782348633, 4.474569320678711, 4.669839859008789, 4.865110874176025, 5.0603814125061035, 5.25565242767334, 5.450922966003418, 5.646193981170654, 5.841464996337891, 6.036735534667969, 6.232006549835205, 6.427277565002441, 6.6225481033325195, 6.817819118499756, 7.013089656829834, 7.20836067199707, 7.403631210327148, 7.598902225494385, 7.794173240661621]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 6.0, 4.0, 7.0, 7.0, 12.0, 10.0, 12.0, 19.0, 18.0, 28.0, 13.0, 25.0, 34.0, 45.0, 35.0, 118.0, 191.0, 114.0, 53.0, 42.0, 39.0, 30.0, 30.0, 22.0, 15.0, 19.0, 14.0, 11.0, 8.0, 3.0, 5.0, 6.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.417724609375, -0.4015007019042969, -0.38527679443359375, -0.3690528869628906, -0.3528289794921875, -0.3366050720214844, -0.32038116455078125, -0.3041572570800781, -0.287933349609375, -0.2717094421386719, -0.25548553466796875, -0.23926162719726562, -0.2230377197265625, -0.20681381225585938, -0.19058990478515625, -0.17436599731445312, -0.15814208984375, -0.14191818237304688, -0.12569427490234375, -0.10947036743164062, -0.0932464599609375, -0.07702255249023438, -0.06079864501953125, -0.044574737548828125, -0.028350830078125, -0.012126922607421875, 0.00409698486328125, 0.020320892333984375, 0.0365447998046875, 0.052768707275390625, 0.06899261474609375, 0.08521652221679688, 0.1014404296875, 0.11766433715820312, 0.13388824462890625, 0.15011215209960938, 0.1663360595703125, 0.18255996704101562, 0.19878387451171875, 0.21500778198242188, 0.231231689453125, 0.24745559692382812, 0.26367950439453125, 0.2799034118652344, 0.2961273193359375, 0.3123512268066406, 0.32857513427734375, 0.3447990417480469, 0.36102294921875, 0.3772468566894531, 0.39347076416015625, 0.4096946716308594, 0.4259185791015625, 0.4421424865722656, 0.45836639404296875, 0.4745903015136719, 0.490814208984375, 0.5070381164550781, 0.5232620239257812, 0.5394859313964844, 0.5557098388671875, 0.5719337463378906, 0.5881576538085938, 0.6043815612792969, 0.62060546875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 9.0, 3.0, 1.0, 0.0, 6.0, 7.0, 8.0, 11.0, 16.0, 15.0, 27.0, 31.0, 70.0, 106.0, 173.0, 348.0, 739.0, 2025.0, 7418.0, 87001.0, 8270184.0, 14789.0, 3390.0, 1210.0, 431.0, 220.0, 115.0, 64.0, 48.0, 31.0, 34.0, 25.0, 14.0, 9.0, 4.0, 1.0, 5.0, 5.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7719508409500122, -1.69874906539917, -1.6255474090576172, -1.5523457527160645, -1.4791439771652222, -1.4059422016143799, -1.3327405452728271, -1.2595388889312744, -1.1863371133804321, -1.1131353378295898, -1.039933681488037, -0.9667319655418396, -0.8935302495956421, -0.8203285336494446, -0.7471268177032471, -0.6739251017570496, -0.600723385810852, -0.5275216698646545, -0.45431995391845703, -0.3811182379722595, -0.307916522026062, -0.2347148060798645, -0.161513090133667, -0.08831137418746948, -0.015109658241271973, 0.05809205770492554, 0.13129377365112305, 0.20449548959732056, 0.27769720554351807, 0.3508989214897156, 0.4241006374359131, 0.4973023533821106, 0.5705041885375977, 0.6437059044837952, 0.7169076204299927, 0.7901093363761902, 0.8633110523223877, 0.9365127682685852, 1.0097144842147827, 1.082916259765625, 1.1561179161071777, 1.2293195724487305, 1.3025213479995728, 1.375723123550415, 1.4489247798919678, 1.5221264362335205, 1.5953282117843628, 1.668529987335205, 1.7417316436767578, 1.8149333000183105, 1.8881350755691528, 1.9613368511199951, 2.034538507461548, 2.1077401638031006, 2.1809420585632324, 2.254143714904785, 2.327345371246338, 2.4005470275878906, 2.4737486839294434, 2.546950578689575, 2.620152235031128, 2.6933538913726807, 2.7665557861328125, 2.8397574424743652, 2.912959098815918]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 2.0, 6.0, 11.0, 9.0, 5.0, 9.0, 4.0, 8.0, 6.0, 2.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.05401086807251, -6.861531734466553, -6.6690521240234375, -6.4765729904174805, -6.284093856811523, -6.091614723205566, -5.899135112762451, -5.706655979156494, -5.514176368713379, -5.321697235107422, -5.129217624664307, -4.93673849105835, -4.744259357452393, -4.551779747009277, -4.35930061340332, -4.166821479797363, -3.9743423461914062, -3.78186297416687, -3.589383840560913, -3.396904468536377, -3.20442533493042, -3.011945962905884, -2.8194665908813477, -2.6269874572753906, -2.4345080852508545, -2.2420287132263184, -2.0495495796203613, -1.8570702075958252, -1.6645909547805786, -1.472111701965332, -1.279632329940796, -1.0871530771255493, -0.8946738243103027, -0.7021945714950562, -0.5097152590751648, -0.31723594665527344, -0.12475669384002686, 0.06772255897521973, 0.26020193099975586, 0.45268118381500244, 0.645160436630249, 0.8376396894454956, 1.0301189422607422, 1.2225983142852783, 1.415077567100525, 1.6075568199157715, 1.8000361919403076, 1.9925154447555542, 2.184994697570801, 2.377474069595337, 2.569953203201294, 2.76243257522583, 2.954911708831787, 3.1473910808563232, 3.3398704528808594, 3.5323495864868164, 3.7248289585113525, 3.9173083305358887, 4.109787464141846, 4.302267074584961, 4.494746208190918, 4.687225341796875, 4.879704475402832, 5.072184085845947, 5.264663219451904]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 4.0, 3.0, 8.0, 13.0, 13.0, 23.0, 36.0, 52.0, 69.0, 77.0, 99.0, 107.0, 109.0, 108.0, 83.0, 44.0, 39.0, 36.0, 29.0, 16.0, 10.0, 10.0, 10.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.8779296875, -0.8552780151367188, -0.8326263427734375, -0.8099746704101562, -0.787322998046875, -0.7646713256835938, -0.7420196533203125, -0.7193679809570312, -0.69671630859375, -0.6740646362304688, -0.6514129638671875, -0.6287612915039062, -0.606109619140625, -0.5834579467773438, -0.5608062744140625, -0.5381546020507812, -0.5155029296875, -0.49285125732421875, -0.4701995849609375, -0.44754791259765625, -0.424896240234375, -0.40224456787109375, -0.3795928955078125, -0.35694122314453125, -0.33428955078125, -0.31163787841796875, -0.2889862060546875, -0.26633453369140625, -0.243682861328125, -0.22103118896484375, -0.1983795166015625, -0.17572784423828125, -0.153076171875, -0.13042449951171875, -0.1077728271484375, -0.08512115478515625, -0.062469482421875, -0.03981781005859375, -0.0171661376953125, 0.00548553466796875, 0.02813720703125, 0.05078887939453125, 0.0734405517578125, 0.09609222412109375, 0.118743896484375, 0.14139556884765625, 0.1640472412109375, 0.18669891357421875, 0.2093505859375, 0.23200225830078125, 0.2546539306640625, 0.27730560302734375, 0.299957275390625, 0.32260894775390625, 0.3452606201171875, 0.36791229248046875, 0.39056396484375, 0.41321563720703125, 0.4358673095703125, 0.45851898193359375, 0.481170654296875, 0.5038223266601562, 0.5264739990234375, 0.5491256713867188, 0.57177734375]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 6.0, 6.0, 7.0, 12.0, 19.0, 31.0, 57.0, 48.0, 124.0, 223.0, 406.0, 909.0, 2133.0, 6195.0, 21820.0, 88006.0, 250257.0, 113975.0, 27525.0, 7694.0, 2574.0, 1087.0, 452.0, 250.0, 163.0, 92.0, 65.0, 46.0, 30.0, 11.0, 13.0, 6.0, 12.0, 7.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.580078125, -2.48980712890625, -2.3995361328125, -2.30926513671875, -2.218994140625, -2.12872314453125, -2.0384521484375, -1.94818115234375, -1.85791015625, -1.76763916015625, -1.6773681640625, -1.58709716796875, -1.496826171875, -1.40655517578125, -1.3162841796875, -1.22601318359375, -1.1357421875, -1.04547119140625, -0.9552001953125, -0.86492919921875, -0.774658203125, -0.68438720703125, -0.5941162109375, -0.50384521484375, -0.41357421875, -0.32330322265625, -0.2330322265625, -0.14276123046875, -0.052490234375, 0.03778076171875, 0.1280517578125, 0.21832275390625, 0.30859375, 0.39886474609375, 0.4891357421875, 0.57940673828125, 0.669677734375, 0.75994873046875, 0.8502197265625, 0.94049072265625, 1.03076171875, 1.12103271484375, 1.2113037109375, 1.30157470703125, 1.391845703125, 1.48211669921875, 1.5723876953125, 1.66265869140625, 1.7529296875, 1.84320068359375, 1.9334716796875, 2.02374267578125, 2.114013671875, 2.20428466796875, 2.2945556640625, 2.38482666015625, 2.47509765625, 2.56536865234375, 2.6556396484375, 2.74591064453125, 2.836181640625, 2.92645263671875, 3.0167236328125, 3.10699462890625, 3.197265625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 11.0, 8.0, 20.0, 23.0, 24.0, 46.0, 42.0, 60.0, 74.0, 95.0, 106.0, 89.0, 87.0, 84.0, 59.0, 51.0, 38.0, 23.0, 30.0, 11.0, 9.0, 10.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39697265625, -0.37873077392578125, -0.3604888916015625, -0.34224700927734375, -0.324005126953125, -0.30576324462890625, -0.2875213623046875, -0.26927947998046875, -0.25103759765625, -0.23279571533203125, -0.2145538330078125, -0.19631195068359375, -0.178070068359375, -0.15982818603515625, -0.1415863037109375, -0.12334442138671875, -0.1051025390625, -0.08686065673828125, -0.0686187744140625, -0.05037689208984375, -0.032135009765625, -0.01389312744140625, 0.0043487548828125, 0.02259063720703125, 0.04083251953125, 0.05907440185546875, 0.0773162841796875, 0.09555816650390625, 0.113800048828125, 0.13204193115234375, 0.1502838134765625, 0.16852569580078125, 0.186767578125, 0.20500946044921875, 0.2232513427734375, 0.24149322509765625, 0.259735107421875, 0.27797698974609375, 0.2962188720703125, 0.31446075439453125, 0.33270263671875, 0.35094451904296875, 0.3691864013671875, 0.38742828369140625, 0.405670166015625, 0.42391204833984375, 0.4421539306640625, 0.46039581298828125, 0.4786376953125, 0.49687957763671875, 0.5151214599609375, 0.5333633422851562, 0.551605224609375, 0.5698471069335938, 0.5880889892578125, 0.6063308715820312, 0.62457275390625, 0.6428146362304688, 0.6610565185546875, 0.6792984008789062, 0.697540283203125, 0.7157821655273438, 0.7340240478515625, 0.7522659301757812, 0.7705078125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 4.0, 4.0, 2.0, 4.0, 7.0, 12.0, 6.0, 9.0, 27.0, 41.0, 69.0, 93.0, 83.0, 49.0, 22.0, 18.0, 4.0, 7.0, 2.0, 3.0, 2.0, 3.0, 6.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.599531650543213, -2.5224297046661377, -2.4453277587890625, -2.3682258129119873, -2.291123867034912, -2.214022159576416, -2.1369199752807617, -2.0598182678222656, -1.9827163219451904, -1.9056143760681152, -1.82851243019104, -1.7514104843139648, -1.6743086576461792, -1.597206711769104, -1.5201047658920288, -1.4430029392242432, -1.3659008741378784, -1.2887989282608032, -1.211696982383728, -1.1345951557159424, -1.0574932098388672, -0.980391263961792, -0.9032893180847168, -0.8261874318122864, -0.7490854859352112, -0.671983540058136, -0.5948816537857056, -0.5177797079086304, -0.44067779183387756, -0.36357587575912476, -0.28647392988204956, -0.20937204360961914, -0.13227009773254395, -0.05516817420721054, 0.021933749318122864, 0.09903568029403687, 0.17613759636878967, 0.2532395124435425, 0.3303414583206177, 0.4074433445930481, 0.4845452904701233, 0.5616472363471985, 0.6387491226196289, 0.7158510684967041, 0.7929530143737793, 0.8700549006462097, 0.9471568465232849, 1.0242587327957153, 1.1013606786727905, 1.1784626245498657, 1.255564570426941, 1.3326663970947266, 1.4097683429718018, 1.486870288848877, 1.5639722347259521, 1.6410741806030273, 1.7181761264801025, 1.7952780723571777, 1.872380018234253, 1.9494819641113281, 2.0265839099884033, 2.1036858558654785, 2.1807875633239746, 2.25788950920105, 2.334991455078125]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 3.0, 1.0, 10.0, 16.0, 16.0, 27.0, 56.0, 72.0, 78.0, 60.0, 42.0, 22.0, 7.0, 6.0, 5.0, 5.0, 3.0, 6.0, 3.0, 8.0, 3.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8594943284988403, -1.7972393035888672, -1.734984278678894, -1.672729253768921, -1.6104743480682373, -1.5482193231582642, -1.485964298248291, -1.4237092733383179, -1.3614542484283447, -1.2991992235183716, -1.2369441986083984, -1.1746892929077148, -1.1124342679977417, -1.0501792430877686, -0.9879242181777954, -0.9256691932678223, -0.8634142875671387, -0.8011592626571655, -0.7389042973518372, -0.676649272441864, -0.6143943071365356, -0.5521392822265625, -0.48988425731658936, -0.4276292622089386, -0.36537426710128784, -0.3031192719936371, -0.24086426198482513, -0.17860925197601318, -0.11635425686836243, -0.05409926176071167, 0.008155763149261475, 0.07041075825691223, 0.13266563415527344, 0.1949206292629242, 0.25717562437057495, 0.3194306492805481, 0.38168564438819885, 0.4439406394958496, 0.5061956644058228, 0.5684506893157959, 0.6307056546211243, 0.6929606795310974, 0.7552156448364258, 0.8174706697463989, 0.8797256946563721, 0.9419806599617004, 1.0042357444763184, 1.066490650177002, 1.128745675086975, 1.1910006999969482, 1.2532557249069214, 1.3155107498168945, 1.3777656555175781, 1.4400206804275513, 1.5022757053375244, 1.5645307302474976, 1.6267857551574707, 1.6890407800674438, 1.751295804977417, 1.8135507106781006, 1.8758057355880737, 1.9380607604980469, 2.0003156661987305, 2.062570810317993, 2.1248257160186768]}, "eval/loss": 0.309664785861969, "eval/wer": 0.09321697738992463, "eval/runtime": 583.4014, "eval/samples_per_second": 4.529, "eval/steps_per_second": 0.567} \ No newline at end of file +{"train/loss": 0.1199, "train/learning_rate": 6.936416184971098e-07, "train/epoch": 5.0, "train/global_step": 2230, "_runtime": 27349, "_timestamp": 1647994104, "_step": 2234, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 12.0, 56.0, 279.0, 497.0, 140.0, 30.0, 5.0], "bins": [-7.940925598144531, -7.809273719787598, -7.677621841430664, -7.5459699630737305, -7.414318084716797, -7.282666206359863, -7.15101432800293, -7.019362449645996, -6.8877105712890625, -6.756058692932129, -6.624406814575195, -6.492754936218262, -6.361103057861328, -6.2294511795043945, -6.097799301147461, -5.966147422790527, -5.834495544433594, -5.70284366607666, -5.571191787719727, -5.439539909362793, -5.307888031005859, -5.176236152648926, -5.044584274291992, -4.912932395935059, -4.781280517578125, -4.649628639221191, -4.517976760864258, -4.386324882507324, -4.254673004150391, -4.123021125793457, -3.9913692474365234, -3.85971736907959, -3.728065013885498, -3.5964131355285645, -3.464761257171631, -3.3331093788146973, -3.2014575004577637, -3.06980562210083, -2.9381537437438965, -2.806501865386963, -2.6748499870300293, -2.5431981086730957, -2.411546230316162, -2.2798943519592285, -2.148242473602295, -2.0165905952453613, -1.8849387168884277, -1.7532868385314941, -1.62163507938385, -1.4899832010269165, -1.358331322669983, -1.2266794443130493, -1.0950275659561157, -0.9633756875991821, -0.8317238092422485, -0.7000719308853149, -0.5684200525283813, -0.43676817417144775, -0.30511629581451416, -0.17346441745758057, -0.04181253910064697, 0.08983933925628662, 0.22149121761322021, 0.3531430959701538, 0.4847949743270874]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 5.0, 3.0, 6.0, 2.0, 5.0, 9.0, 10.0, 15.0, 12.0, 17.0, 16.0, 22.0, 29.0, 39.0, 28.0, 36.0, 29.0, 35.0, 38.0, 45.0, 62.0, 45.0, 49.0, 48.0, 51.0, 40.0, 45.0, 43.0, 33.0, 29.0, 31.0, 30.0, 21.0, 16.0, 17.0, 14.0, 10.0, 9.0, 5.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4662081003189087, -0.44751691818237305, -0.4288257360458374, -0.41013455390930176, -0.3914433717727661, -0.37275218963623047, -0.35406097769737244, -0.3353697955608368, -0.31667861342430115, -0.2979874312877655, -0.27929624915122986, -0.2606050670146942, -0.24191386997699738, -0.22322268784046173, -0.2045314908027649, -0.18584030866622925, -0.1671491265296936, -0.14845794439315796, -0.12976676225662231, -0.11107556521892548, -0.09238438308238983, -0.07369320094585419, -0.055002011358737946, -0.036310821771621704, -0.01761963963508606, 0.0010715462267398834, 0.019762732088565826, 0.03845391795039177, 0.05714510381221771, 0.07583628594875336, 0.0945274755358696, 0.11321866512298584, 0.13190990686416626, 0.1506010890007019, 0.16929227113723755, 0.1879834681749344, 0.20667465031147003, 0.22536583244800568, 0.24405702948570251, 0.26274821162223816, 0.2814393937587738, 0.30013057589530945, 0.3188217580318451, 0.33751294016838074, 0.35620415210723877, 0.3748953342437744, 0.39358651638031006, 0.4122776985168457, 0.43096888065338135, 0.449660062789917, 0.46835124492645264, 0.4870424270629883, 0.5057336091995239, 0.5244247913360596, 0.5431159734725952, 0.5618071556091309, 0.5804983377456665, 0.5991895198822021, 0.6178807020187378, 0.6365718841552734, 0.6552630662918091, 0.6739542484283447, 0.6926454305648804, 0.711336612701416, 0.7300278544425964]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 0.0, 2.0, 4.0, 6.0, 8.0, 7.0, 15.0, 12.0, 27.0, 27.0, 51.0, 58.0, 97.0, 154.0, 252.0, 420.0, 743.0, 1437.0, 3148.0, 8260.0, 35352.0, 952590.0, 3075218.0, 95395.0, 12498.0, 4388.0, 1911.0, 942.0, 493.0, 251.0, 183.0, 104.0, 56.0, 47.0, 33.0, 32.0, 8.0, 18.0, 9.0, 7.0, 7.0, 3.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.841796875, -2.753509521484375, -2.66522216796875, -2.576934814453125, -2.4886474609375, -2.400360107421875, -2.31207275390625, -2.223785400390625, -2.135498046875, -2.047210693359375, -1.95892333984375, -1.870635986328125, -1.7823486328125, -1.694061279296875, -1.60577392578125, -1.517486572265625, -1.42919921875, -1.340911865234375, -1.25262451171875, -1.164337158203125, -1.0760498046875, -0.987762451171875, -0.89947509765625, -0.811187744140625, -0.722900390625, -0.634613037109375, -0.54632568359375, -0.458038330078125, -0.3697509765625, -0.281463623046875, -0.19317626953125, -0.104888916015625, -0.0166015625, 0.071685791015625, 0.15997314453125, 0.248260498046875, 0.3365478515625, 0.424835205078125, 0.51312255859375, 0.601409912109375, 0.689697265625, 0.777984619140625, 0.86627197265625, 0.954559326171875, 1.0428466796875, 1.131134033203125, 1.21942138671875, 1.307708740234375, 1.39599609375, 1.484283447265625, 1.57257080078125, 1.660858154296875, 1.7491455078125, 1.837432861328125, 1.92572021484375, 2.014007568359375, 2.102294921875, 2.190582275390625, 2.27886962890625, 2.367156982421875, 2.4554443359375, 2.543731689453125, 2.63201904296875, 2.720306396484375, 2.80859375]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 7.0, 8.0, 10.0, 4.0, 10.0, 13.0, 10.0, 15.0, 26.0, 12.0, 29.0, 26.0, 29.0, 19.0, 31.0, 37.0, 31.0, 38.0, 52.0, 48.0, 44.0, 45.0, 49.0, 38.0, 35.0, 44.0, 37.0, 35.0, 36.0, 31.0, 20.0, 26.0, 24.0, 19.0, 10.0, 16.0, 10.0, 9.0, 7.0, 6.0, 5.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.87841796875, -0.8500137329101562, -0.8216094970703125, -0.7932052612304688, -0.764801025390625, -0.7363967895507812, -0.7079925537109375, -0.6795883178710938, -0.65118408203125, -0.6227798461914062, -0.5943756103515625, -0.5659713745117188, -0.537567138671875, -0.5091629028320312, -0.4807586669921875, -0.45235443115234375, -0.4239501953125, -0.39554595947265625, -0.3671417236328125, -0.33873748779296875, -0.310333251953125, -0.28192901611328125, -0.2535247802734375, -0.22512054443359375, -0.19671630859375, -0.16831207275390625, -0.1399078369140625, -0.11150360107421875, -0.083099365234375, -0.05469512939453125, -0.0262908935546875, 0.00211334228515625, 0.030517578125, 0.05892181396484375, 0.0873260498046875, 0.11573028564453125, 0.144134521484375, 0.17253875732421875, 0.2009429931640625, 0.22934722900390625, 0.25775146484375, 0.28615570068359375, 0.3145599365234375, 0.34296417236328125, 0.371368408203125, 0.39977264404296875, 0.4281768798828125, 0.45658111572265625, 0.4849853515625, 0.5133895874023438, 0.5417938232421875, 0.5701980590820312, 0.598602294921875, 0.6270065307617188, 0.6554107666015625, 0.6838150024414062, 0.71221923828125, 0.7406234741210938, 0.7690277099609375, 0.7974319458007812, 0.825836181640625, 0.8542404174804688, 0.8826446533203125, 0.9110488891601562, 0.939453125]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 4.0, 13.0, 18.0, 28.0, 46.0, 120.0, 245.0, 876.0, 3459606.0, 732161.0, 799.0, 164.0, 90.0, 37.0, 28.0, 21.0, 6.0, 3.0, 6.0, 2.0, 0.0, 5.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-22.125, -21.6102294921875, -21.095458984375, -20.5806884765625, -20.06591796875, -19.5511474609375, -19.036376953125, -18.5216064453125, -18.0068359375, -17.4920654296875, -16.977294921875, -16.4625244140625, -15.94775390625, -15.4329833984375, -14.918212890625, -14.4034423828125, -13.888671875, -13.3739013671875, -12.859130859375, -12.3443603515625, -11.82958984375, -11.3148193359375, -10.800048828125, -10.2852783203125, -9.7705078125, -9.2557373046875, -8.740966796875, -8.2261962890625, -7.71142578125, -7.1966552734375, -6.681884765625, -6.1671142578125, -5.65234375, -5.1375732421875, -4.622802734375, -4.1080322265625, -3.59326171875, -3.0784912109375, -2.563720703125, -2.0489501953125, -1.5341796875, -1.0194091796875, -0.504638671875, 0.0101318359375, 0.52490234375, 1.0396728515625, 1.554443359375, 2.0692138671875, 2.583984375, 3.0987548828125, 3.613525390625, 4.1282958984375, 4.64306640625, 5.1578369140625, 5.672607421875, 6.1873779296875, 6.7021484375, 7.2169189453125, 7.731689453125, 8.2464599609375, 8.76123046875, 9.2760009765625, 9.790771484375, 10.3055419921875, 10.8203125]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 7.0, 15.0, 14.0, 27.0, 67.0, 102.0, 190.0, 681.0, 1946.0, 665.0, 165.0, 80.0, 41.0, 27.0, 20.0, 9.0, 7.0, 2.0, 4.0, 2.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2822265625, -1.2540359497070312, -1.2258453369140625, -1.1976547241210938, -1.169464111328125, -1.1412734985351562, -1.1130828857421875, -1.0848922729492188, -1.05670166015625, -1.0285110473632812, -1.0003204345703125, -0.9721298217773438, -0.943939208984375, -0.9157485961914062, -0.8875579833984375, -0.8593673706054688, -0.8311767578125, -0.8029861450195312, -0.7747955322265625, -0.7466049194335938, -0.718414306640625, -0.6902236938476562, -0.6620330810546875, -0.6338424682617188, -0.60565185546875, -0.5774612426757812, -0.5492706298828125, -0.5210800170898438, -0.492889404296875, -0.46469879150390625, -0.4365081787109375, -0.40831756591796875, -0.380126953125, -0.35193634033203125, -0.3237457275390625, -0.29555511474609375, -0.267364501953125, -0.23917388916015625, -0.2109832763671875, -0.18279266357421875, -0.15460205078125, -0.12641143798828125, -0.0982208251953125, -0.07003021240234375, -0.041839599609375, -0.01364898681640625, 0.0145416259765625, 0.04273223876953125, 0.0709228515625, 0.09911346435546875, 0.1273040771484375, 0.15549468994140625, 0.183685302734375, 0.21187591552734375, 0.2400665283203125, 0.26825714111328125, 0.29644775390625, 0.32463836669921875, 0.3528289794921875, 0.38101959228515625, 0.409210205078125, 0.43740081787109375, 0.4655914306640625, 0.49378204345703125, 0.52197265625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 2.0, 7.0, 11.0, 11.0, 8.0, 12.0, 24.0, 24.0, 36.0, 47.0, 53.0, 70.0, 79.0, 89.0, 98.0, 87.0, 70.0, 58.0, 48.0, 44.0, 30.0, 24.0, 14.0, 18.0, 13.0, 10.0, 7.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9769927263259888, -0.9347792863845825, -0.8925658464431763, -0.8503524661064148, -0.8081390261650085, -0.7659255862236023, -0.7237122058868408, -0.6814987659454346, -0.6392853260040283, -0.5970718860626221, -0.5548584461212158, -0.5126450657844543, -0.4704316258430481, -0.42821818590164185, -0.386004775762558, -0.3437913656234741, -0.30157792568206787, -0.2593644857406616, -0.21715107560157776, -0.1749376505613327, -0.13272422552108765, -0.09051080048084259, -0.048297375440597534, -0.006083965301513672, 0.03612947463989258, 0.07834289968013763, 0.12055632472038269, 0.16276974976062775, 0.2049831748008728, 0.24719659984111786, 0.2894100248813629, 0.3316234350204468, 0.3738369941711426, 0.41605043411254883, 0.4582638442516327, 0.5004772543907166, 0.5426906943321228, 0.584904134273529, 0.6271175146102905, 0.6693309545516968, 0.711544394493103, 0.7537578344345093, 0.7959712743759155, 0.838184654712677, 0.8803980946540833, 0.9226115345954895, 0.964824914932251, 1.0070383548736572, 1.0492517948150635, 1.0914652347564697, 1.133678674697876, 1.1758921146392822, 1.2181055545806885, 1.2603188753128052, 1.3025323152542114, 1.3447457551956177, 1.386959195137024, 1.4291726350784302, 1.4713860750198364, 1.5135995149612427, 1.5558128356933594, 1.5980262756347656, 1.6402397155761719, 1.6824531555175781, 1.7246665954589844]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 10.0, 8.0, 11.0, 10.0, 11.0, 15.0, 19.0, 12.0, 19.0, 28.0, 28.0, 28.0, 23.0, 36.0, 41.0, 44.0, 36.0, 31.0, 44.0, 47.0, 41.0, 46.0, 37.0, 35.0, 35.0, 35.0, 34.0, 33.0, 26.0, 28.0, 29.0, 26.0, 15.0, 15.0, 17.0, 13.0, 14.0, 10.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7832375168800354, -0.7575938701629639, -0.7319502830505371, -0.7063066363334656, -0.680662989616394, -0.6550193428993225, -0.629375696182251, -0.6037321090698242, -0.5780884623527527, -0.5524448156356812, -0.5268012285232544, -0.5011575818061829, -0.47551393508911133, -0.4498702883720398, -0.42422667145729065, -0.3985830545425415, -0.37293940782546997, -0.34729576110839844, -0.3216521441936493, -0.29600852727890015, -0.2703648805618286, -0.24472124874591827, -0.21907761693000793, -0.1934339851140976, -0.16779035329818726, -0.14214672148227692, -0.11650308966636658, -0.09085945785045624, -0.0652158260345459, -0.03957219421863556, -0.01392856240272522, 0.01171506941318512, 0.037358641624450684, 0.06300227344036102, 0.08864590525627136, 0.1142895370721817, 0.13993316888809204, 0.16557680070400238, 0.19122043251991272, 0.21686406433582306, 0.2425076961517334, 0.26815134286880493, 0.2937949597835541, 0.3194385766983032, 0.34508222341537476, 0.3707258701324463, 0.39636948704719543, 0.4220131039619446, 0.4476567506790161, 0.47330039739608765, 0.4989440143108368, 0.5245876312255859, 0.5502312779426575, 0.575874924659729, 0.6015185117721558, 0.6271621584892273, 0.6528058052062988, 0.6784494519233704, 0.7040930986404419, 0.7297366857528687, 0.7553803324699402, 0.7810239791870117, 0.8066675662994385, 0.83231121301651, 0.8579548597335815]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 4.0, 12.0, 8.0, 31.0, 29.0, 40.0, 50.0, 84.0, 139.0, 185.0, 251.0, 369.0, 555.0, 753.0, 1155.0, 1643.0, 2561.0, 3756.0, 5780.0, 8996.0, 14705.0, 24379.0, 43156.0, 80441.0, 171793.0, 311438.0, 179636.0, 84756.0, 44890.0, 25105.0, 14985.0, 9146.0, 5832.0, 3889.0, 2508.0, 1682.0, 1156.0, 848.0, 535.0, 408.0, 258.0, 189.0, 131.0, 87.0, 62.0, 44.0, 25.0, 19.0, 20.0, 11.0, 9.0, 6.0, 6.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.397216796875, -0.3850059509277344, -0.37279510498046875, -0.3605842590332031, -0.3483734130859375, -0.3361625671386719, -0.32395172119140625, -0.3117408752441406, -0.299530029296875, -0.2873191833496094, -0.27510833740234375, -0.2628974914550781, -0.2506866455078125, -0.23847579956054688, -0.22626495361328125, -0.21405410766601562, -0.20184326171875, -0.18963241577148438, -0.17742156982421875, -0.16521072387695312, -0.1529998779296875, -0.14078903198242188, -0.12857818603515625, -0.11636734008789062, -0.104156494140625, -0.09194564819335938, -0.07973480224609375, -0.06752395629882812, -0.0553131103515625, -0.043102264404296875, -0.03089141845703125, -0.018680572509765625, -0.0064697265625, 0.005741119384765625, 0.01795196533203125, 0.030162811279296875, 0.0423736572265625, 0.054584503173828125, 0.06679534912109375, 0.07900619506835938, 0.091217041015625, 0.10342788696289062, 0.11563873291015625, 0.12784957885742188, 0.1400604248046875, 0.15227127075195312, 0.16448211669921875, 0.17669296264648438, 0.18890380859375, 0.20111465454101562, 0.21332550048828125, 0.22553634643554688, 0.2377471923828125, 0.24995803833007812, 0.26216888427734375, 0.2743797302246094, 0.286590576171875, 0.2988014221191406, 0.31101226806640625, 0.3232231140136719, 0.3354339599609375, 0.3476448059082031, 0.35985565185546875, 0.3720664978027344, 0.38427734375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 6.0, 2.0, 8.0, 6.0, 8.0, 9.0, 7.0, 14.0, 15.0, 21.0, 21.0, 18.0, 28.0, 31.0, 33.0, 24.0, 31.0, 38.0, 44.0, 43.0, 27.0, 45.0, 46.0, 45.0, 40.0, 46.0, 23.0, 39.0, 32.0, 41.0, 31.0, 36.0, 26.0, 21.0, 19.0, 13.0, 10.0, 9.0, 10.0, 10.0, 6.0, 9.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.467529296875, -0.4515571594238281, -0.43558502197265625, -0.4196128845214844, -0.4036407470703125, -0.3876686096191406, -0.37169647216796875, -0.3557243347167969, -0.339752197265625, -0.3237800598144531, -0.30780792236328125, -0.2918357849121094, -0.2758636474609375, -0.2598915100097656, -0.24391937255859375, -0.22794723510742188, -0.21197509765625, -0.19600296020507812, -0.18003082275390625, -0.16405868530273438, -0.1480865478515625, -0.13211441040039062, -0.11614227294921875, -0.10017013549804688, -0.084197998046875, -0.06822586059570312, -0.05225372314453125, -0.036281585693359375, -0.0203094482421875, -0.004337310791015625, 0.01163482666015625, 0.027606964111328125, 0.0435791015625, 0.059551239013671875, 0.07552337646484375, 0.09149551391601562, 0.1074676513671875, 0.12343978881835938, 0.13941192626953125, 0.15538406372070312, 0.171356201171875, 0.18732833862304688, 0.20330047607421875, 0.21927261352539062, 0.2352447509765625, 0.2512168884277344, 0.26718902587890625, 0.2831611633300781, 0.29913330078125, 0.3151054382324219, 0.33107757568359375, 0.3470497131347656, 0.3630218505859375, 0.3789939880371094, 0.39496612548828125, 0.4109382629394531, 0.426910400390625, 0.4428825378417969, 0.45885467529296875, 0.4748268127441406, 0.4907989501953125, 0.5067710876464844, 0.5227432250976562, 0.5387153625488281, 0.5546875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 10.0, 11.0, 15.0, 19.0, 25.0, 40.0, 50.0, 87.0, 121.0, 226.0, 393.0, 770.0, 1604.0, 4019.0, 11302.0, 38684.0, 175614.0, 592346.0, 167750.0, 37173.0, 10984.0, 3846.0, 1645.0, 757.0, 422.0, 216.0, 130.0, 82.0, 70.0, 45.0, 36.0, 21.0, 11.0, 4.0, 9.0, 4.0, 4.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6591796875, -0.6368255615234375, -0.614471435546875, -0.5921173095703125, -0.56976318359375, -0.5474090576171875, -0.525054931640625, -0.5027008056640625, -0.4803466796875, -0.4579925537109375, -0.435638427734375, -0.4132843017578125, -0.39093017578125, -0.3685760498046875, -0.346221923828125, -0.3238677978515625, -0.301513671875, -0.2791595458984375, -0.256805419921875, -0.2344512939453125, -0.21209716796875, -0.1897430419921875, -0.167388916015625, -0.1450347900390625, -0.1226806640625, -0.1003265380859375, -0.077972412109375, -0.0556182861328125, -0.03326416015625, -0.0109100341796875, 0.011444091796875, 0.0337982177734375, 0.05615234375, 0.0785064697265625, 0.100860595703125, 0.1232147216796875, 0.14556884765625, 0.1679229736328125, 0.190277099609375, 0.2126312255859375, 0.2349853515625, 0.2573394775390625, 0.279693603515625, 0.3020477294921875, 0.32440185546875, 0.3467559814453125, 0.369110107421875, 0.3914642333984375, 0.413818359375, 0.4361724853515625, 0.458526611328125, 0.4808807373046875, 0.50323486328125, 0.5255889892578125, 0.547943115234375, 0.5702972412109375, 0.5926513671875, 0.6150054931640625, 0.637359619140625, 0.6597137451171875, 0.68206787109375, 0.7044219970703125, 0.726776123046875, 0.7491302490234375, 0.771484375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 8.0, 2.0, 3.0, 5.0, 4.0, 9.0, 3.0, 15.0, 16.0, 16.0, 11.0, 18.0, 21.0, 20.0, 22.0, 34.0, 28.0, 31.0, 40.0, 30.0, 30.0, 52.0, 46.0, 31.0, 36.0, 37.0, 42.0, 42.0, 39.0, 35.0, 29.0, 35.0, 33.0, 25.0, 22.0, 22.0, 16.0, 12.0, 18.0, 12.0, 11.0, 10.0, 9.0, 7.0, 8.0, 4.0, 3.0, 3.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.97998046875, -0.9475173950195312, -0.9150543212890625, -0.8825912475585938, -0.850128173828125, -0.8176651000976562, -0.7852020263671875, -0.7527389526367188, -0.72027587890625, -0.6878128051757812, -0.6553497314453125, -0.6228866577148438, -0.590423583984375, -0.5579605102539062, -0.5254974365234375, -0.49303436279296875, -0.4605712890625, -0.42810821533203125, -0.3956451416015625, -0.36318206787109375, -0.330718994140625, -0.29825592041015625, -0.2657928466796875, -0.23332977294921875, -0.20086669921875, -0.16840362548828125, -0.1359405517578125, -0.10347747802734375, -0.071014404296875, -0.03855133056640625, -0.0060882568359375, 0.02637481689453125, 0.058837890625, 0.09130096435546875, 0.1237640380859375, 0.15622711181640625, 0.188690185546875, 0.22115325927734375, 0.2536163330078125, 0.28607940673828125, 0.31854248046875, 0.35100555419921875, 0.3834686279296875, 0.41593170166015625, 0.448394775390625, 0.48085784912109375, 0.5133209228515625, 0.5457839965820312, 0.5782470703125, 0.6107101440429688, 0.6431732177734375, 0.6756362915039062, 0.708099365234375, 0.7405624389648438, 0.7730255126953125, 0.8054885864257812, 0.83795166015625, 0.8704147338867188, 0.9028778076171875, 0.9353408813476562, 0.967803955078125, 1.0002670288085938, 1.0327301025390625, 1.0651931762695312, 1.09765625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 2.0, 5.0, 10.0, 9.0, 11.0, 20.0, 26.0, 41.0, 63.0, 89.0, 133.0, 236.0, 383.0, 614.0, 1075.0, 2224.0, 4633.0, 10843.0, 30540.0, 125972.0, 622456.0, 185615.0, 38995.0, 13142.0, 5604.0, 2588.0, 1322.0, 717.0, 435.0, 263.0, 167.0, 99.0, 58.0, 57.0, 30.0, 29.0, 14.0, 12.0, 6.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1253662109375, -0.12152099609375, -0.11767578125, -0.11383056640625, -0.1099853515625, -0.10614013671875, -0.102294921875, -0.09844970703125, -0.0946044921875, -0.09075927734375, -0.0869140625, -0.08306884765625, -0.0792236328125, -0.07537841796875, -0.071533203125, -0.06768798828125, -0.0638427734375, -0.05999755859375, -0.05615234375, -0.05230712890625, -0.0484619140625, -0.04461669921875, -0.040771484375, -0.03692626953125, -0.0330810546875, -0.02923583984375, -0.025390625, -0.02154541015625, -0.0177001953125, -0.01385498046875, -0.010009765625, -0.00616455078125, -0.0023193359375, 0.00152587890625, 0.00537109375, 0.00921630859375, 0.0130615234375, 0.01690673828125, 0.020751953125, 0.02459716796875, 0.0284423828125, 0.03228759765625, 0.0361328125, 0.03997802734375, 0.0438232421875, 0.04766845703125, 0.051513671875, 0.05535888671875, 0.0592041015625, 0.06304931640625, 0.06689453125, 0.07073974609375, 0.0745849609375, 0.07843017578125, 0.082275390625, 0.08612060546875, 0.0899658203125, 0.09381103515625, 0.09765625, 0.10150146484375, 0.1053466796875, 0.10919189453125, 0.113037109375, 0.11688232421875, 0.1207275390625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 3.0, 8.0, 7.0, 22.0, 24.0, 38.0, 94.0, 202.0, 280.0, 168.0, 66.0, 29.0, 17.0, 17.0, 6.0, 8.0, 4.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014853477478027344, -0.0001431051641702652, -0.00013767555356025696, -0.00013224594295024872, -0.00012681633234024048, -0.00012138672173023224, -0.000115957111120224, -0.00011052750051021576, -0.00010509788990020752, -9.966827929019928e-05, -9.423866868019104e-05, -8.88090580701828e-05, -8.337944746017456e-05, -7.794983685016632e-05, -7.252022624015808e-05, -6.709061563014984e-05, -6.16610050201416e-05, -5.623139441013336e-05, -5.080178380012512e-05, -4.537217319011688e-05, -3.994256258010864e-05, -3.45129519701004e-05, -2.9083341360092163e-05, -2.3653730750083923e-05, -1.8224120140075684e-05, -1.2794509530067444e-05, -7.364898920059204e-06, -1.9352883100509644e-06, 3.4943222999572754e-06, 8.923932909965515e-06, 1.4353543519973755e-05, 1.9783154129981995e-05, 2.5212764739990234e-05, 3.0642375349998474e-05, 3.6071985960006714e-05, 4.1501596570014954e-05, 4.693120718002319e-05, 5.236081779003143e-05, 5.779042840003967e-05, 6.322003901004791e-05, 6.864964962005615e-05, 7.407926023006439e-05, 7.950887084007263e-05, 8.493848145008087e-05, 9.036809206008911e-05, 9.579770267009735e-05, 0.00010122731328010559, 0.00010665692389011383, 0.00011208653450012207, 0.00011751614511013031, 0.00012294575572013855, 0.0001283753663301468, 0.00013380497694015503, 0.00013923458755016327, 0.0001446641981601715, 0.00015009380877017975, 0.000155523419380188, 0.00016095302999019623, 0.00016638264060020447, 0.0001718122512102127, 0.00017724186182022095, 0.0001826714724302292, 0.00018810108304023743, 0.00019353069365024567, 0.0001989603042602539]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 2.0, 3.0, 6.0, 9.0, 12.0, 12.0, 20.0, 26.0, 44.0, 53.0, 93.0, 163.0, 472.0, 1708.0, 9062.0, 84776.0, 867065.0, 74046.0, 8568.0, 1576.0, 383.0, 185.0, 83.0, 46.0, 38.0, 23.0, 15.0, 7.0, 10.0, 16.0, 8.0, 1.0, 1.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.255126953125, -0.24584197998046875, -0.2365570068359375, -0.22727203369140625, -0.217987060546875, -0.20870208740234375, -0.1994171142578125, -0.19013214111328125, -0.18084716796875, -0.17156219482421875, -0.1622772216796875, -0.15299224853515625, -0.143707275390625, -0.13442230224609375, -0.1251373291015625, -0.11585235595703125, -0.1065673828125, -0.09728240966796875, -0.0879974365234375, -0.07871246337890625, -0.069427490234375, -0.06014251708984375, -0.0508575439453125, -0.04157257080078125, -0.03228759765625, -0.02300262451171875, -0.0137176513671875, -0.00443267822265625, 0.004852294921875, 0.01413726806640625, 0.0234222412109375, 0.03270721435546875, 0.0419921875, 0.05127716064453125, 0.0605621337890625, 0.06984710693359375, 0.079132080078125, 0.08841705322265625, 0.0977020263671875, 0.10698699951171875, 0.11627197265625, 0.12555694580078125, 0.1348419189453125, 0.14412689208984375, 0.153411865234375, 0.16269683837890625, 0.1719818115234375, 0.18126678466796875, 0.1905517578125, 0.19983673095703125, 0.2091217041015625, 0.21840667724609375, 0.227691650390625, 0.23697662353515625, 0.2462615966796875, 0.25554656982421875, 0.26483154296875, 0.27411651611328125, 0.2834014892578125, 0.29268646240234375, 0.301971435546875, 0.31125640869140625, 0.3205413818359375, 0.32982635498046875, 0.339111328125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 8.0, 0.0, 3.0, 5.0, 6.0, 3.0, 6.0, 9.0, 7.0, 14.0, 17.0, 20.0, 32.0, 38.0, 49.0, 77.0, 86.0, 109.0, 104.0, 98.0, 79.0, 57.0, 52.0, 40.0, 15.0, 7.0, 9.0, 12.0, 5.0, 6.0, 7.0, 7.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0423583984375, -0.040851593017578125, -0.03934478759765625, -0.037837982177734375, -0.0363311767578125, -0.034824371337890625, -0.03331756591796875, -0.031810760498046875, -0.030303955078125, -0.028797149658203125, -0.02729034423828125, -0.025783538818359375, -0.0242767333984375, -0.022769927978515625, -0.02126312255859375, -0.019756317138671875, -0.01824951171875, -0.016742706298828125, -0.01523590087890625, -0.013729095458984375, -0.0122222900390625, -0.010715484619140625, -0.00920867919921875, -0.007701873779296875, -0.006195068359375, -0.004688262939453125, -0.00318145751953125, -0.001674652099609375, -0.0001678466796875, 0.001338958740234375, 0.00284576416015625, 0.004352569580078125, 0.005859375, 0.007366180419921875, 0.00887298583984375, 0.010379791259765625, 0.0118865966796875, 0.013393402099609375, 0.01490020751953125, 0.016407012939453125, 0.017913818359375, 0.019420623779296875, 0.02092742919921875, 0.022434234619140625, 0.0239410400390625, 0.025447845458984375, 0.02695465087890625, 0.028461456298828125, 0.02996826171875, 0.031475067138671875, 0.03298187255859375, 0.034488677978515625, 0.0359954833984375, 0.037502288818359375, 0.03900909423828125, 0.040515899658203125, 0.042022705078125, 0.043529510498046875, 0.04503631591796875, 0.046543121337890625, 0.0480499267578125, 0.049556732177734375, 0.05106353759765625, 0.052570343017578125, 0.0540771484375]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 6.0, 10.0, 13.0, 48.0, 138.0, 300.0, 284.0, 140.0, 53.0, 13.0, 6.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7234145402908325, -1.645379662513733, -1.5673447847366333, -1.4893099069595337, -1.411275029182434, -1.3332401514053345, -1.2552051544189453, -1.1771702766418457, -1.099135398864746, -1.0211005210876465, -0.9430656433105469, -0.8650307655334473, -0.7869958877563477, -0.708961009979248, -0.6309260725975037, -0.552891194820404, -0.4748563766479492, -0.3968214988708496, -0.31878662109375, -0.240751713514328, -0.1627168357372284, -0.08468195796012878, -0.006647050380706787, 0.07138782739639282, 0.14942270517349243, 0.22745758295059204, 0.30549246072769165, 0.38352736830711365, 0.46156224608421326, 0.5395971536636353, 0.6176320314407349, 0.6956669092178345, 0.7737016677856445, 0.8517365455627441, 0.9297714233398438, 1.0078063011169434, 1.085841178894043, 1.1638760566711426, 1.2419109344482422, 1.3199458122253418, 1.3979806900024414, 1.476015567779541, 1.5540504455566406, 1.6320853233337402, 1.7101202011108398, 1.7881550788879395, 1.866189956665039, 1.9442248344421387, 2.0222597122192383, 2.100294589996338, 2.1783294677734375, 2.256364345550537, 2.3343992233276367, 2.4124341011047363, 2.490468978881836, 2.5685038566589355, 2.6465389728546143, 2.724573850631714, 2.8026087284088135, 2.880643606185913, 2.9586784839630127, 3.0367133617401123, 3.114748239517212, 3.1927831172943115, 3.270817995071411]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 7.0, 5.0, 6.0, 10.0, 6.0, 13.0, 22.0, 14.0, 22.0, 17.0, 27.0, 28.0, 24.0, 36.0, 47.0, 33.0, 30.0, 47.0, 44.0, 42.0, 52.0, 45.0, 36.0, 32.0, 32.0, 45.0, 42.0, 34.0, 36.0, 32.0, 35.0, 24.0, 14.0, 12.0, 13.0, 11.0, 11.0, 10.0, 1.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.49540552496910095, -0.47856956720352173, -0.4617336094379425, -0.4448976516723633, -0.42806169390678406, -0.41122573614120483, -0.394389808177948, -0.3775538206100464, -0.36071789264678955, -0.3438819348812103, -0.3270459771156311, -0.3102100193500519, -0.29337406158447266, -0.27653810381889343, -0.2597021460533142, -0.24286620318889618, -0.22603023052215576, -0.20919427275657654, -0.19235831499099731, -0.1755223572254181, -0.15868639945983887, -0.14185044169425964, -0.1250144988298416, -0.10817854106426239, -0.09134258329868317, -0.07450662553310394, -0.05767067149281502, -0.04083471745252609, -0.02399875968694687, -0.007162801921367645, 0.009673148393630981, 0.026509106159210205, 0.043345093727111816, 0.06018105149269104, 0.07701700925827026, 0.09385295957326889, 0.11068891733884811, 0.12752488255500793, 0.14436082541942596, 0.1611967831850052, 0.1780327409505844, 0.19486869871616364, 0.21170465648174286, 0.2285405993461609, 0.2453765571117401, 0.26221251487731934, 0.27904847264289856, 0.2958844304084778, 0.312720388174057, 0.32955634593963623, 0.34639230370521545, 0.3632282614707947, 0.3800642192363739, 0.3969001770019531, 0.41373610496520996, 0.4305720925331116, 0.4474080204963684, 0.46424397826194763, 0.48107993602752686, 0.4979158937931061, 0.5147518515586853, 0.5315877795219421, 0.5484237670898438, 0.5652596950531006, 0.5820956826210022]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 6.0, 8.0, 12.0, 19.0, 17.0, 45.0, 47.0, 66.0, 95.0, 139.0, 223.0, 298.0, 400.0, 542.0, 805.0, 1194.0, 1783.0, 2511.0, 3643.0, 5385.0, 8093.0, 12271.0, 18494.0, 28566.0, 44604.0, 73856.0, 133460.0, 280382.0, 183934.0, 92881.0, 54460.0, 34101.0, 21735.0, 14236.0, 9588.0, 6459.0, 4417.0, 3087.0, 2124.0, 1389.0, 975.0, 658.0, 496.0, 311.0, 253.0, 135.0, 122.0, 72.0, 58.0, 38.0, 29.0, 13.0, 8.0, 9.0, 4.0, 5.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.1849365234375, -0.17910385131835938, -0.17327117919921875, -0.16743850708007812, -0.1616058349609375, -0.15577316284179688, -0.14994049072265625, -0.14410781860351562, -0.138275146484375, -0.13244247436523438, -0.12660980224609375, -0.12077713012695312, -0.1149444580078125, -0.10911178588867188, -0.10327911376953125, -0.09744644165039062, -0.09161376953125, -0.08578109741210938, -0.07994842529296875, -0.07411575317382812, -0.0682830810546875, -0.062450408935546875, -0.05661773681640625, -0.050785064697265625, -0.044952392578125, -0.039119720458984375, -0.03328704833984375, -0.027454376220703125, -0.0216217041015625, -0.015789031982421875, -0.00995635986328125, -0.004123687744140625, 0.001708984375, 0.007541656494140625, 0.01337432861328125, 0.019207000732421875, 0.0250396728515625, 0.030872344970703125, 0.03670501708984375, 0.042537689208984375, 0.048370361328125, 0.054203033447265625, 0.06003570556640625, 0.06586837768554688, 0.0717010498046875, 0.07753372192382812, 0.08336639404296875, 0.08919906616210938, 0.09503173828125, 0.10086441040039062, 0.10669708251953125, 0.11252975463867188, 0.1183624267578125, 0.12419509887695312, 0.13002777099609375, 0.13586044311523438, 0.141693115234375, 0.14752578735351562, 0.15335845947265625, 0.15919113159179688, 0.1650238037109375, 0.17085647583007812, 0.17668914794921875, 0.18252182006835938, 0.1883544921875]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 5.0, 4.0, 9.0, 10.0, 15.0, 11.0, 17.0, 23.0, 22.0, 12.0, 27.0, 16.0, 20.0, 21.0, 24.0, 36.0, 17.0, 36.0, 28.0, 41.0, 52.0, 61.0, 45.0, 36.0, 38.0, 33.0, 45.0, 31.0, 28.0, 22.0, 35.0, 24.0, 24.0, 18.0, 21.0, 17.0, 11.0, 11.0, 10.0, 9.0, 8.0, 7.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.353515625, -3.24029541015625, -3.1270751953125, -3.01385498046875, -2.900634765625, -2.78741455078125, -2.6741943359375, -2.56097412109375, -2.44775390625, -2.33453369140625, -2.2213134765625, -2.10809326171875, -1.994873046875, -1.88165283203125, -1.7684326171875, -1.65521240234375, -1.5419921875, -1.42877197265625, -1.3155517578125, -1.20233154296875, -1.089111328125, -0.97589111328125, -0.8626708984375, -0.74945068359375, -0.63623046875, -0.52301025390625, -0.4097900390625, -0.29656982421875, -0.183349609375, -0.07012939453125, 0.0430908203125, 0.15631103515625, 0.26953125, 0.38275146484375, 0.4959716796875, 0.60919189453125, 0.722412109375, 0.83563232421875, 0.9488525390625, 1.06207275390625, 1.17529296875, 1.28851318359375, 1.4017333984375, 1.51495361328125, 1.628173828125, 1.74139404296875, 1.8546142578125, 1.96783447265625, 2.0810546875, 2.19427490234375, 2.3074951171875, 2.42071533203125, 2.533935546875, 2.64715576171875, 2.7603759765625, 2.87359619140625, 2.98681640625, 3.10003662109375, 3.2132568359375, 3.32647705078125, 3.439697265625, 3.55291748046875, 3.6661376953125, 3.77935791015625, 3.892578125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 2.0, 3.0, 2.0, 4.0, 4.0, 12.0, 9.0, 18.0, 22.0, 19.0, 22.0, 28.0, 30.0, 32.0, 46.0, 62.0, 80.0, 105.0, 150.0, 305.0, 827.0, 15270.0, 1017048.0, 12811.0, 744.0, 322.0, 138.0, 109.0, 56.0, 55.0, 43.0, 34.0, 23.0, 28.0, 19.0, 11.0, 12.0, 10.0, 5.0, 14.0, 4.0, 4.0, 4.0, 2.0, 5.0, 0.0, 1.0, 2.0, 0.0, 3.0], "bins": [-3.357421875, -3.265411376953125, -3.17340087890625, -3.081390380859375, -2.9893798828125, -2.897369384765625, -2.80535888671875, -2.713348388671875, -2.621337890625, -2.529327392578125, -2.43731689453125, -2.345306396484375, -2.2532958984375, -2.161285400390625, -2.06927490234375, -1.977264404296875, -1.88525390625, -1.793243408203125, -1.70123291015625, -1.609222412109375, -1.5172119140625, -1.425201416015625, -1.33319091796875, -1.241180419921875, -1.149169921875, -1.057159423828125, -0.96514892578125, -0.873138427734375, -0.7811279296875, -0.689117431640625, -0.59710693359375, -0.505096435546875, -0.4130859375, -0.321075439453125, -0.22906494140625, -0.137054443359375, -0.0450439453125, 0.046966552734375, 0.13897705078125, 0.230987548828125, 0.322998046875, 0.415008544921875, 0.50701904296875, 0.599029541015625, 0.6910400390625, 0.783050537109375, 0.87506103515625, 0.967071533203125, 1.05908203125, 1.151092529296875, 1.24310302734375, 1.335113525390625, 1.4271240234375, 1.519134521484375, 1.61114501953125, 1.703155517578125, 1.795166015625, 1.887176513671875, 1.97918701171875, 2.071197509765625, 2.1632080078125, 2.255218505859375, 2.34722900390625, 2.439239501953125, 2.53125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 1.0, 3.0, 2.0, 4.0, 5.0, 13.0, 12.0, 16.0, 20.0, 14.0, 26.0, 27.0, 17.0, 28.0, 37.0, 31.0, 35.0, 39.0, 28.0, 46.0, 40.0, 52.0, 53.0, 36.0, 47.0, 45.0, 33.0, 42.0, 28.0, 32.0, 29.0, 27.0, 22.0, 23.0, 19.0, 11.0, 9.0, 10.0, 7.0, 13.0, 4.0, 3.0, 5.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-4.75390625, -4.6231689453125, -4.492431640625, -4.3616943359375, -4.23095703125, -4.1002197265625, -3.969482421875, -3.8387451171875, -3.7080078125, -3.5772705078125, -3.446533203125, -3.3157958984375, -3.18505859375, -3.0543212890625, -2.923583984375, -2.7928466796875, -2.662109375, -2.5313720703125, -2.400634765625, -2.2698974609375, -2.13916015625, -2.0084228515625, -1.877685546875, -1.7469482421875, -1.6162109375, -1.4854736328125, -1.354736328125, -1.2239990234375, -1.09326171875, -0.9625244140625, -0.831787109375, -0.7010498046875, -0.5703125, -0.4395751953125, -0.308837890625, -0.1781005859375, -0.04736328125, 0.0833740234375, 0.214111328125, 0.3448486328125, 0.4755859375, 0.6063232421875, 0.737060546875, 0.8677978515625, 0.99853515625, 1.1292724609375, 1.260009765625, 1.3907470703125, 1.521484375, 1.6522216796875, 1.782958984375, 1.9136962890625, 2.04443359375, 2.1751708984375, 2.305908203125, 2.4366455078125, 2.5673828125, 2.6981201171875, 2.828857421875, 2.9595947265625, 3.09033203125, 3.2210693359375, 3.351806640625, 3.4825439453125, 3.61328125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 6.0, 6.0, 11.0, 17.0, 22.0, 25.0, 34.0, 49.0, 116.0, 174.0, 272.0, 488.0, 868.0, 1627.0, 3866.0, 14039.0, 894249.0, 116665.0, 9632.0, 3118.0, 1449.0, 718.0, 424.0, 255.0, 154.0, 74.0, 55.0, 35.0, 38.0, 18.0, 15.0, 12.0, 3.0, 5.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.2314453125, -0.22517013549804688, -0.21889495849609375, -0.21261978149414062, -0.2063446044921875, -0.20006942749023438, -0.19379425048828125, -0.18751907348632812, -0.181243896484375, -0.17496871948242188, -0.16869354248046875, -0.16241836547851562, -0.1561431884765625, -0.14986801147460938, -0.14359283447265625, -0.13731765747070312, -0.13104248046875, -0.12476730346679688, -0.11849212646484375, -0.11221694946289062, -0.1059417724609375, -0.09966659545898438, -0.09339141845703125, -0.08711624145507812, -0.080841064453125, -0.07456588745117188, -0.06829071044921875, -0.062015533447265625, -0.0557403564453125, -0.049465179443359375, -0.04319000244140625, -0.036914825439453125, -0.0306396484375, -0.024364471435546875, -0.01808929443359375, -0.011814117431640625, -0.0055389404296875, 0.000736236572265625, 0.00701141357421875, 0.013286590576171875, 0.019561767578125, 0.025836944580078125, 0.03211212158203125, 0.038387298583984375, 0.0446624755859375, 0.050937652587890625, 0.05721282958984375, 0.06348800659179688, 0.06976318359375, 0.07603836059570312, 0.08231353759765625, 0.08858871459960938, 0.0948638916015625, 0.10113906860351562, 0.10741424560546875, 0.11368942260742188, 0.119964599609375, 0.12623977661132812, 0.13251495361328125, 0.13879013061523438, 0.1450653076171875, 0.15134048461914062, 0.15761566162109375, 0.16389083862304688, 0.170166015625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 7.0, 8.0, 17.0, 32.0, 215.0, 595.0, 67.0, 20.0, 9.0, 7.0, 8.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5510787963867188e-05, -2.436526119709015e-05, -2.321973443031311e-05, -2.2074207663536072e-05, -2.0928680896759033e-05, -1.9783154129981995e-05, -1.8637627363204956e-05, -1.7492100596427917e-05, -1.634657382965088e-05, -1.520104706287384e-05, -1.4055520296096802e-05, -1.2909993529319763e-05, -1.1764466762542725e-05, -1.0618939995765686e-05, -9.473413228988647e-06, -8.327886462211609e-06, -7.18235969543457e-06, -6.036832928657532e-06, -4.891306161880493e-06, -3.7457793951034546e-06, -2.600252628326416e-06, -1.4547258615493774e-06, -3.0919909477233887e-07, 8.363276720046997e-07, 1.9818544387817383e-06, 3.127381205558777e-06, 4.2729079723358154e-06, 5.418434739112854e-06, 6.563961505889893e-06, 7.709488272666931e-06, 8.85501503944397e-06, 1.0000541806221008e-05, 1.1146068572998047e-05, 1.2291595339775085e-05, 1.3437122106552124e-05, 1.4582648873329163e-05, 1.57281756401062e-05, 1.687370240688324e-05, 1.801922917366028e-05, 1.9164755940437317e-05, 2.0310282707214355e-05, 2.1455809473991394e-05, 2.2601336240768433e-05, 2.374686300754547e-05, 2.489238977432251e-05, 2.603791654109955e-05, 2.7183443307876587e-05, 2.8328970074653625e-05, 2.9474496841430664e-05, 3.06200236082077e-05, 3.176555037498474e-05, 3.291107714176178e-05, 3.405660390853882e-05, 3.520213067531586e-05, 3.6347657442092896e-05, 3.7493184208869934e-05, 3.863871097564697e-05, 3.978423774242401e-05, 4.092976450920105e-05, 4.207529127597809e-05, 4.322081804275513e-05, 4.4366344809532166e-05, 4.5511871576309204e-05, 4.665739834308624e-05, 4.780292510986328e-05]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 12.0, 21.0, 24.0, 21.0, 49.0, 80.0, 103.0, 195.0, 479.0, 973.0, 2485.0, 10857.0, 992173.0, 34409.0, 4017.0, 1347.0, 625.0, 278.0, 170.0, 57.0, 54.0, 38.0, 37.0, 17.0, 12.0, 3.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.3642578125, -0.353759765625, -0.34326171875, -0.332763671875, -0.322265625, -0.311767578125, -0.30126953125, -0.290771484375, -0.2802734375, -0.269775390625, -0.25927734375, -0.248779296875, -0.23828125, -0.227783203125, -0.21728515625, -0.206787109375, -0.1962890625, -0.185791015625, -0.17529296875, -0.164794921875, -0.154296875, -0.143798828125, -0.13330078125, -0.122802734375, -0.1123046875, -0.101806640625, -0.09130859375, -0.080810546875, -0.0703125, -0.059814453125, -0.04931640625, -0.038818359375, -0.0283203125, -0.017822265625, -0.00732421875, 0.003173828125, 0.013671875, 0.024169921875, 0.03466796875, 0.045166015625, 0.0556640625, 0.066162109375, 0.07666015625, 0.087158203125, 0.09765625, 0.108154296875, 0.11865234375, 0.129150390625, 0.1396484375, 0.150146484375, 0.16064453125, 0.171142578125, 0.181640625, 0.192138671875, 0.20263671875, 0.213134765625, 0.2236328125, 0.234130859375, 0.24462890625, 0.255126953125, 0.265625, 0.276123046875, 0.28662109375, 0.297119140625, 0.3076171875]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 15.0, 33.0, 88.0, 694.0, 93.0, 32.0, 20.0, 6.0, 4.0, 4.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.145263671875, -0.14129066467285156, -0.13731765747070312, -0.1333446502685547, -0.12937164306640625, -0.1253986358642578, -0.12142562866210938, -0.11745262145996094, -0.1134796142578125, -0.10950660705566406, -0.10553359985351562, -0.10156059265136719, -0.09758758544921875, -0.09361457824707031, -0.08964157104492188, -0.08566856384277344, -0.081695556640625, -0.07772254943847656, -0.07374954223632812, -0.06977653503417969, -0.06580352783203125, -0.06183052062988281, -0.057857513427734375, -0.05388450622558594, -0.0499114990234375, -0.04593849182128906, -0.041965484619140625, -0.03799247741699219, -0.03401947021484375, -0.030046463012695312, -0.026073455810546875, -0.022100448608398438, -0.01812744140625, -0.014154434204101562, -0.010181427001953125, -0.0062084197998046875, -0.00223541259765625, 0.0017375946044921875, 0.005710601806640625, 0.009683609008789062, 0.0136566162109375, 0.017629623413085938, 0.021602630615234375, 0.025575637817382812, 0.02954864501953125, 0.03352165222167969, 0.037494659423828125, 0.04146766662597656, 0.045440673828125, 0.04941368103027344, 0.053386688232421875, 0.05735969543457031, 0.06133270263671875, 0.06530570983886719, 0.06927871704101562, 0.07325172424316406, 0.0772247314453125, 0.08119773864746094, 0.08517074584960938, 0.08914375305175781, 0.09311676025390625, 0.09708976745605469, 0.10106277465820312, 0.10503578186035156, 0.1090087890625]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 26.0, 929.0, 67.0, 0.0, 0.0, 1.0], "bins": [-40.947471618652344, -40.26072311401367, -39.573974609375, -38.887229919433594, -38.20048141479492, -37.51373291015625, -36.82698440551758, -36.140235900878906, -35.453487396240234, -34.76673889160156, -34.07999038696289, -33.39324188232422, -32.70649719238281, -32.01974868774414, -31.33300018310547, -30.646251678466797, -29.959505081176758, -29.272756576538086, -28.586009979248047, -27.899261474609375, -27.212512969970703, -26.52576446533203, -25.839017868041992, -25.15226936340332, -24.46552276611328, -23.77877426147461, -23.09202766418457, -22.4052791595459, -21.718530654907227, -21.031784057617188, -20.345035552978516, -19.658287048339844, -18.971540451049805, -18.284791946411133, -17.598045349121094, -16.911296844482422, -16.22454833984375, -15.537800788879395, -14.851053237915039, -14.164304733276367, -13.477556228637695, -12.79080867767334, -12.104060173034668, -11.417312622070312, -10.73056411743164, -10.043816566467285, -9.35706901550293, -8.670320510864258, -7.9835734367370605, -7.296825408935547, -6.610077857971191, -5.923329830169678, -5.236581802368164, -4.54983377456665, -3.863086223602295, -3.1763381958007812, -2.4895901679992676, -1.8028422594070435, -1.1160943508148193, -0.42934656143188477, 0.2574014663696289, 0.9441494941711426, 1.630897045135498, 2.3176450729370117, 3.0043931007385254]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 5.0, 5.0, 2.0, 8.0, 7.0, 12.0, 12.0, 14.0, 18.0, 22.0, 21.0, 28.0, 25.0, 21.0, 26.0, 33.0, 38.0, 40.0, 43.0, 43.0, 41.0, 40.0, 46.0, 50.0, 37.0, 35.0, 47.0, 24.0, 43.0, 27.0, 20.0, 29.0, 26.0, 24.0, 17.0, 17.0, 11.0, 8.0, 8.0, 12.0, 5.0, 4.0, 3.0, 1.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.156064033508301, -5.960081100463867, -5.764098644256592, -5.568115711212158, -5.372132778167725, -5.176150321960449, -4.980167388916016, -4.784184455871582, -4.588201999664307, -4.392219066619873, -4.196236610412598, -4.000253677368164, -3.8042709827423096, -3.608288288116455, -3.4123053550720215, -3.216322660446167, -3.0203397274017334, -2.824357032775879, -2.6283740997314453, -2.432391405105591, -2.2364087104797363, -2.0404257774353027, -1.8444430828094482, -1.6484603881835938, -1.4524775743484497, -1.2564947605133057, -1.0605120658874512, -0.8645292520523071, -0.6685464978218079, -0.4725637435913086, -0.27658092975616455, -0.08059823513031006, 0.11538457870483398, 0.31136733293533325, 0.5073500871658325, 0.7033329010009766, 0.8993156552314758, 1.095298409461975, 1.2912812232971191, 1.4872639179229736, 1.6832467317581177, 1.8792295455932617, 2.075212240219116, 2.2711949348449707, 2.4671778678894043, 2.663160562515259, 2.8591432571411133, 3.055126190185547, 3.2511088848114014, 3.447091579437256, 3.6430745124816895, 3.839057207107544, 4.035039901733398, 4.231022834777832, 4.427005767822266, 4.622988224029541, 4.818971157073975, 5.014954090118408, 5.210936546325684, 5.406919479370117, 5.602902412414551, 5.798884868621826, 5.99486780166626, 6.190850257873535, 6.386833190917969]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 1.0, 4.0, 2.0, 6.0, 4.0, 10.0, 8.0, 14.0, 13.0, 18.0, 24.0, 22.0, 26.0, 24.0, 50.0, 47.0, 87.0, 184.0, 441.0, 1176.0, 4386.0, 21286.0, 874982.0, 3238203.0, 43019.0, 7062.0, 1899.0, 622.0, 256.0, 109.0, 60.0, 41.0, 36.0, 35.0, 21.0, 19.0, 19.0, 17.0, 13.0, 8.0, 5.0, 5.0, 3.0, 7.0, 3.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.84375, -1.782623291015625, -1.72149658203125, -1.660369873046875, -1.5992431640625, -1.538116455078125, -1.47698974609375, -1.415863037109375, -1.354736328125, -1.293609619140625, -1.23248291015625, -1.171356201171875, -1.1102294921875, -1.049102783203125, -0.98797607421875, -0.926849365234375, -0.86572265625, -0.804595947265625, -0.74346923828125, -0.682342529296875, -0.6212158203125, -0.560089111328125, -0.49896240234375, -0.437835693359375, -0.376708984375, -0.315582275390625, -0.25445556640625, -0.193328857421875, -0.1322021484375, -0.071075439453125, -0.00994873046875, 0.051177978515625, 0.1123046875, 0.173431396484375, 0.23455810546875, 0.295684814453125, 0.3568115234375, 0.417938232421875, 0.47906494140625, 0.540191650390625, 0.601318359375, 0.662445068359375, 0.72357177734375, 0.784698486328125, 0.8458251953125, 0.906951904296875, 0.96807861328125, 1.029205322265625, 1.09033203125, 1.151458740234375, 1.21258544921875, 1.273712158203125, 1.3348388671875, 1.395965576171875, 1.45709228515625, 1.518218994140625, 1.579345703125, 1.640472412109375, 1.70159912109375, 1.762725830078125, 1.8238525390625, 1.884979248046875, 1.94610595703125, 2.007232666015625, 2.068359375]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 11.0, 14.0, 9.0, 14.0, 15.0, 17.0, 20.0, 29.0, 35.0, 44.0, 47.0, 39.0, 52.0, 54.0, 61.0, 56.0, 50.0, 67.0, 56.0, 51.0, 57.0, 40.0, 38.0, 32.0, 24.0, 14.0, 19.0, 12.0, 9.0, 7.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.447998046875, -0.4272346496582031, -0.40647125244140625, -0.3857078552246094, -0.3649444580078125, -0.3441810607910156, -0.32341766357421875, -0.3026542663574219, -0.281890869140625, -0.2611274719238281, -0.24036407470703125, -0.21960067749023438, -0.1988372802734375, -0.17807388305664062, -0.15731048583984375, -0.13654708862304688, -0.11578369140625, -0.09502029418945312, -0.07425689697265625, -0.053493499755859375, -0.0327301025390625, -0.011966705322265625, 0.00879669189453125, 0.029560089111328125, 0.050323486328125, 0.07108688354492188, 0.09185028076171875, 0.11261367797851562, 0.1333770751953125, 0.15414047241210938, 0.17490386962890625, 0.19566726684570312, 0.2164306640625, 0.23719406127929688, 0.25795745849609375, 0.2787208557128906, 0.2994842529296875, 0.3202476501464844, 0.34101104736328125, 0.3617744445800781, 0.382537841796875, 0.4033012390136719, 0.42406463623046875, 0.4448280334472656, 0.4655914306640625, 0.4863548278808594, 0.5071182250976562, 0.5278816223144531, 0.54864501953125, 0.5694084167480469, 0.5901718139648438, 0.6109352111816406, 0.6316986083984375, 0.6524620056152344, 0.6732254028320312, 0.6939888000488281, 0.714752197265625, 0.7355155944824219, 0.7562789916992188, 0.7770423889160156, 0.7978057861328125, 0.8185691833496094, 0.8393325805664062, 0.8600959777832031, 0.880859375]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 8.0, 22.0, 101.0, 4193788.0, 310.0, 37.0, 11.0, 11.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.2421875, -13.4971923828125, -11.752197265625, -10.0072021484375, -8.26220703125, -6.5172119140625, -4.772216796875, -3.0272216796875, -1.2822265625, 0.4627685546875, 2.207763671875, 3.9527587890625, 5.69775390625, 7.4427490234375, 9.187744140625, 10.9327392578125, 12.677734375, 14.4227294921875, 16.167724609375, 17.9127197265625, 19.65771484375, 21.4027099609375, 23.147705078125, 24.8927001953125, 26.6376953125, 28.3826904296875, 30.127685546875, 31.8726806640625, 33.61767578125, 35.3626708984375, 37.107666015625, 38.8526611328125, 40.59765625, 42.3426513671875, 44.087646484375, 45.8326416015625, 47.57763671875, 49.3226318359375, 51.067626953125, 52.8126220703125, 54.5576171875, 56.3026123046875, 58.047607421875, 59.7926025390625, 61.53759765625, 63.2825927734375, 65.027587890625, 66.7725830078125, 68.517578125, 70.2625732421875, 72.007568359375, 73.7525634765625, 75.49755859375, 77.2425537109375, 78.987548828125, 80.7325439453125, 82.4775390625, 84.2225341796875, 85.967529296875, 87.7125244140625, 89.45751953125, 91.2025146484375, 92.947509765625, 94.6925048828125, 96.4375]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 5.0, 7.0, 21.0, 21.0, 30.0, 39.0, 74.0, 127.0, 311.0, 957.0, 1422.0, 588.0, 196.0, 113.0, 62.0, 38.0, 26.0, 17.0, 10.0, 6.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.296875, -0.282928466796875, -0.26898193359375, -0.255035400390625, -0.2410888671875, -0.227142333984375, -0.21319580078125, -0.199249267578125, -0.185302734375, -0.171356201171875, -0.15740966796875, -0.143463134765625, -0.1295166015625, -0.115570068359375, -0.10162353515625, -0.087677001953125, -0.07373046875, -0.059783935546875, -0.04583740234375, -0.031890869140625, -0.0179443359375, -0.003997802734375, 0.00994873046875, 0.023895263671875, 0.037841796875, 0.051788330078125, 0.06573486328125, 0.079681396484375, 0.0936279296875, 0.107574462890625, 0.12152099609375, 0.135467529296875, 0.1494140625, 0.163360595703125, 0.17730712890625, 0.191253662109375, 0.2052001953125, 0.219146728515625, 0.23309326171875, 0.247039794921875, 0.260986328125, 0.274932861328125, 0.28887939453125, 0.302825927734375, 0.3167724609375, 0.330718994140625, 0.34466552734375, 0.358612060546875, 0.37255859375, 0.386505126953125, 0.40045166015625, 0.414398193359375, 0.4283447265625, 0.442291259765625, 0.45623779296875, 0.470184326171875, 0.484130859375, 0.498077392578125, 0.51202392578125, 0.525970458984375, 0.5399169921875, 0.553863525390625, 0.56781005859375, 0.581756591796875, 0.595703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 5.0, 4.0, 9.0, 15.0, 27.0, 42.0, 60.0, 104.0, 142.0, 186.0, 165.0, 99.0, 57.0, 31.0, 26.0, 23.0, 12.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5449100136756897, -0.5015302300453186, -0.4581504464149475, -0.4147706627845764, -0.3713908791542053, -0.32801109552383423, -0.28463128209114075, -0.24125149846076965, -0.19787171483039856, -0.15449193120002747, -0.11111214011907578, -0.06773234903812408, -0.02435256540775299, 0.019027218222618103, 0.06240701675415039, 0.10578680038452148, 0.14916658401489258, 0.19254636764526367, 0.23592615127563477, 0.27930593490600586, 0.32268571853637695, 0.36606550216674805, 0.40944531559944153, 0.4528250992298126, 0.4962048828601837, 0.5395846962928772, 0.5829644799232483, 0.6263442635536194, 0.6697240471839905, 0.7131038308143616, 0.7564836144447327, 0.7998633980751038, 0.8432432413101196, 0.8866230249404907, 0.9300028085708618, 0.9733825922012329, 1.016762375831604, 1.060142159461975, 1.1035219430923462, 1.1469017267227173, 1.1902815103530884, 1.2336612939834595, 1.2770410776138306, 1.3204208612442017, 1.3638006448745728, 1.4071804285049438, 1.450560212135315, 1.493939995765686, 1.5373198986053467, 1.5806996822357178, 1.6240794658660889, 1.66745924949646, 1.710839033126831, 1.7542188167572021, 1.7975986003875732, 1.8409783840179443, 1.8843581676483154, 1.9277379512786865, 1.9711177349090576, 2.0144975185394287, 2.0578773021698, 2.101257085800171, 2.144636869430542, 2.188016653060913, 2.231396436691284]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 5.0, 3.0, 6.0, 10.0, 10.0, 11.0, 15.0, 19.0, 23.0, 24.0, 32.0, 35.0, 34.0, 31.0, 29.0, 32.0, 49.0, 38.0, 44.0, 48.0, 57.0, 48.0, 34.0, 43.0, 50.0, 33.0, 27.0, 40.0, 30.0, 24.0, 20.0, 18.0, 16.0, 17.0, 8.0, 11.0, 12.0, 4.0, 5.0, 3.0, 3.0, 1.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5113065838813782, -0.49378257989883423, -0.47625860571861267, -0.4587346315383911, -0.44121062755584717, -0.4236866235733032, -0.40616264939308167, -0.3886386752128601, -0.37111467123031616, -0.3535906672477722, -0.33606669306755066, -0.3185427188873291, -0.30101871490478516, -0.2834947109222412, -0.26597073674201965, -0.2484467476606369, -0.23092275857925415, -0.2133987694978714, -0.19587478041648865, -0.1783507913351059, -0.16082680225372314, -0.1433028131723404, -0.12577882409095764, -0.10825483500957489, -0.09073084592819214, -0.07320685684680939, -0.055682867765426636, -0.038158878684043884, -0.020634889602661133, -0.0031109005212783813, 0.01441308856010437, 0.03193707764148712, 0.0494610071182251, 0.06698499619960785, 0.0845089852809906, 0.10203297436237335, 0.1195569634437561, 0.13708095252513885, 0.1546049416065216, 0.17212893068790436, 0.1896529197692871, 0.20717690885066986, 0.2247008979320526, 0.24222488701343536, 0.2597488760948181, 0.27727288007736206, 0.2947968542575836, 0.3123208284378052, 0.3298448324203491, 0.34736883640289307, 0.3648928105831146, 0.3824167847633362, 0.3999407887458801, 0.4174647927284241, 0.43498876690864563, 0.4525127410888672, 0.47003674507141113, 0.4875607490539551, 0.505084753036499, 0.5226086974143982, 0.5401327013969421, 0.5576567053794861, 0.5751806497573853, 0.5927046537399292, 0.6102286577224731]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 9.0, 11.0, 11.0, 20.0, 30.0, 35.0, 60.0, 91.0, 157.0, 229.0, 345.0, 525.0, 852.0, 1356.0, 2300.0, 3898.0, 7022.0, 13536.0, 28545.0, 64499.0, 172676.0, 395900.0, 211852.0, 76748.0, 32839.0, 15962.0, 8160.0, 4315.0, 2485.0, 1489.0, 932.0, 587.0, 385.0, 228.0, 147.0, 100.0, 73.0, 49.0, 35.0, 23.0, 19.0, 9.0, 10.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.293212890625, -0.28421783447265625, -0.2752227783203125, -0.26622772216796875, -0.257232666015625, -0.24823760986328125, -0.2392425537109375, -0.23024749755859375, -0.22125244140625, -0.21225738525390625, -0.2032623291015625, -0.19426727294921875, -0.185272216796875, -0.17627716064453125, -0.1672821044921875, -0.15828704833984375, -0.1492919921875, -0.14029693603515625, -0.1313018798828125, -0.12230682373046875, -0.113311767578125, -0.10431671142578125, -0.0953216552734375, -0.08632659912109375, -0.07733154296875, -0.06833648681640625, -0.0593414306640625, -0.05034637451171875, -0.041351318359375, -0.03235626220703125, -0.0233612060546875, -0.01436614990234375, -0.00537109375, 0.00362396240234375, 0.0126190185546875, 0.02161407470703125, 0.030609130859375, 0.03960418701171875, 0.0485992431640625, 0.05759429931640625, 0.06658935546875, 0.07558441162109375, 0.0845794677734375, 0.09357452392578125, 0.102569580078125, 0.11156463623046875, 0.1205596923828125, 0.12955474853515625, 0.1385498046875, 0.14754486083984375, 0.1565399169921875, 0.16553497314453125, 0.174530029296875, 0.18352508544921875, 0.1925201416015625, 0.20151519775390625, 0.21051025390625, 0.21950531005859375, 0.2285003662109375, 0.23749542236328125, 0.246490478515625, 0.25548553466796875, 0.2644805908203125, 0.27347564697265625, 0.282470703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 5.0, 2.0, 8.0, 10.0, 9.0, 17.0, 12.0, 21.0, 24.0, 31.0, 41.0, 33.0, 31.0, 36.0, 36.0, 34.0, 57.0, 59.0, 59.0, 41.0, 53.0, 45.0, 51.0, 41.0, 34.0, 35.0, 43.0, 30.0, 20.0, 19.0, 18.0, 7.0, 18.0, 3.0, 9.0, 3.0, 3.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.339111328125, -0.32689666748046875, -0.3146820068359375, -0.30246734619140625, -0.290252685546875, -0.27803802490234375, -0.2658233642578125, -0.25360870361328125, -0.24139404296875, -0.22917938232421875, -0.2169647216796875, -0.20475006103515625, -0.192535400390625, -0.18032073974609375, -0.1681060791015625, -0.15589141845703125, -0.1436767578125, -0.13146209716796875, -0.1192474365234375, -0.10703277587890625, -0.094818115234375, -0.08260345458984375, -0.0703887939453125, -0.05817413330078125, -0.04595947265625, -0.03374481201171875, -0.0215301513671875, -0.00931549072265625, 0.002899169921875, 0.01511383056640625, 0.0273284912109375, 0.03954315185546875, 0.0517578125, 0.06397247314453125, 0.0761871337890625, 0.08840179443359375, 0.100616455078125, 0.11283111572265625, 0.1250457763671875, 0.13726043701171875, 0.14947509765625, 0.16168975830078125, 0.1739044189453125, 0.18611907958984375, 0.198333740234375, 0.21054840087890625, 0.2227630615234375, 0.23497772216796875, 0.2471923828125, 0.25940704345703125, 0.2716217041015625, 0.28383636474609375, 0.296051025390625, 0.30826568603515625, 0.3204803466796875, 0.33269500732421875, 0.34490966796875, 0.35712432861328125, 0.3693389892578125, 0.38155364990234375, 0.393768310546875, 0.40598297119140625, 0.4181976318359375, 0.43041229248046875, 0.442626953125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 2.0, 3.0, 4.0, 4.0, 6.0, 14.0, 11.0, 8.0, 22.0, 33.0, 49.0, 95.0, 123.0, 216.0, 392.0, 681.0, 1404.0, 3334.0, 8996.0, 28500.0, 113722.0, 499199.0, 299948.0, 63492.0, 17577.0, 5957.0, 2388.0, 1051.0, 529.0, 297.0, 171.0, 100.0, 68.0, 47.0, 26.0, 30.0, 14.0, 10.0, 9.0, 9.0, 6.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.392578125, -0.3812980651855469, -0.37001800537109375, -0.3587379455566406, -0.3474578857421875, -0.3361778259277344, -0.32489776611328125, -0.3136177062988281, -0.302337646484375, -0.2910575866699219, -0.27977752685546875, -0.2684974670410156, -0.2572174072265625, -0.24593734741210938, -0.23465728759765625, -0.22337722778320312, -0.21209716796875, -0.20081710815429688, -0.18953704833984375, -0.17825698852539062, -0.1669769287109375, -0.15569686889648438, -0.14441680908203125, -0.13313674926757812, -0.121856689453125, -0.11057662963867188, -0.09929656982421875, -0.08801651000976562, -0.0767364501953125, -0.06545639038085938, -0.05417633056640625, -0.042896270751953125, -0.0316162109375, -0.020336151123046875, -0.00905609130859375, 0.002223968505859375, 0.0135040283203125, 0.024784088134765625, 0.03606414794921875, 0.047344207763671875, 0.058624267578125, 0.06990432739257812, 0.08118438720703125, 0.09246444702148438, 0.1037445068359375, 0.11502456665039062, 0.12630462646484375, 0.13758468627929688, 0.14886474609375, 0.16014480590820312, 0.17142486572265625, 0.18270492553710938, 0.1939849853515625, 0.20526504516601562, 0.21654510498046875, 0.22782516479492188, 0.239105224609375, 0.2503852844238281, 0.26166534423828125, 0.2729454040527344, 0.2842254638671875, 0.2955055236816406, 0.30678558349609375, 0.3180656433105469, 0.329345703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 4.0, 8.0, 6.0, 10.0, 15.0, 10.0, 16.0, 14.0, 17.0, 17.0, 21.0, 32.0, 30.0, 32.0, 28.0, 33.0, 43.0, 42.0, 54.0, 40.0, 29.0, 47.0, 50.0, 30.0, 33.0, 33.0, 34.0, 29.0, 13.0, 19.0, 22.0, 21.0, 26.0, 16.0, 20.0, 14.0, 20.0, 9.0, 16.0, 13.0, 3.0, 12.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.57666015625, -0.5589218139648438, -0.5411834716796875, -0.5234451293945312, -0.505706787109375, -0.48796844482421875, -0.4702301025390625, -0.45249176025390625, -0.43475341796875, -0.41701507568359375, -0.3992767333984375, -0.38153839111328125, -0.363800048828125, -0.34606170654296875, -0.3283233642578125, -0.31058502197265625, -0.2928466796875, -0.27510833740234375, -0.2573699951171875, -0.23963165283203125, -0.221893310546875, -0.20415496826171875, -0.1864166259765625, -0.16867828369140625, -0.15093994140625, -0.13320159912109375, -0.1154632568359375, -0.09772491455078125, -0.079986572265625, -0.06224822998046875, -0.0445098876953125, -0.02677154541015625, -0.009033203125, 0.00870513916015625, 0.0264434814453125, 0.04418182373046875, 0.061920166015625, 0.07965850830078125, 0.0973968505859375, 0.11513519287109375, 0.13287353515625, 0.15061187744140625, 0.1683502197265625, 0.18608856201171875, 0.203826904296875, 0.22156524658203125, 0.2393035888671875, 0.25704193115234375, 0.2747802734375, 0.29251861572265625, 0.3102569580078125, 0.32799530029296875, 0.345733642578125, 0.36347198486328125, 0.3812103271484375, 0.39894866943359375, 0.41668701171875, 0.43442535400390625, 0.4521636962890625, 0.46990203857421875, 0.487640380859375, 0.5053787231445312, 0.5231170654296875, 0.5408554077148438, 0.55859375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 9.0, 12.0, 10.0, 20.0, 33.0, 41.0, 46.0, 79.0, 118.0, 180.0, 309.0, 586.0, 1259.0, 2802.0, 7479.0, 25836.0, 123278.0, 604784.0, 222153.0, 41322.0, 10983.0, 3818.0, 1578.0, 833.0, 389.0, 247.0, 121.0, 85.0, 50.0, 27.0, 16.0, 12.0, 17.0, 7.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.1011962890625, -0.09857845306396484, -0.09596061706542969, -0.09334278106689453, -0.09072494506835938, -0.08810710906982422, -0.08548927307128906, -0.0828714370727539, -0.08025360107421875, -0.0776357650756836, -0.07501792907714844, -0.07240009307861328, -0.06978225708007812, -0.06716442108154297, -0.06454658508300781, -0.061928749084472656, -0.0593109130859375, -0.056693077087402344, -0.05407524108886719, -0.05145740509033203, -0.048839569091796875, -0.04622173309326172, -0.04360389709472656, -0.040986061096191406, -0.03836822509765625, -0.035750389099121094, -0.03313255310058594, -0.03051471710205078, -0.027896881103515625, -0.02527904510498047, -0.022661209106445312, -0.020043373107910156, -0.017425537109375, -0.014807701110839844, -0.012189865112304688, -0.009572029113769531, -0.006954193115234375, -0.004336357116699219, -0.0017185211181640625, 0.0008993148803710938, 0.00351715087890625, 0.006134986877441406, 0.008752822875976562, 0.011370658874511719, 0.013988494873046875, 0.01660633087158203, 0.019224166870117188, 0.021842002868652344, 0.0244598388671875, 0.027077674865722656, 0.029695510864257812, 0.03231334686279297, 0.034931182861328125, 0.03754901885986328, 0.04016685485839844, 0.042784690856933594, 0.04540252685546875, 0.048020362854003906, 0.05063819885253906, 0.05325603485107422, 0.055873870849609375, 0.05849170684814453, 0.06110954284667969, 0.06372737884521484, 0.06634521484375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 6.0, 4.0, 10.0, 10.0, 10.0, 20.0, 24.0, 29.0, 38.0, 47.0, 88.0, 100.0, 136.0, 122.0, 86.0, 71.0, 53.0, 34.0, 36.0, 20.0, 9.0, 4.0, 6.0, 11.0, 3.0, 5.0, 10.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.404783248901367e-05, -4.2280182242393494e-05, -4.0512531995773315e-05, -3.874488174915314e-05, -3.697723150253296e-05, -3.520958125591278e-05, -3.34419310092926e-05, -3.1674280762672424e-05, -2.9906630516052246e-05, -2.8138980269432068e-05, -2.637133002281189e-05, -2.460367977619171e-05, -2.2836029529571533e-05, -2.1068379282951355e-05, -1.9300729036331177e-05, -1.7533078789711e-05, -1.576542854309082e-05, -1.3997778296470642e-05, -1.2230128049850464e-05, -1.0462477803230286e-05, -8.694827556610107e-06, -6.927177309989929e-06, -5.159527063369751e-06, -3.3918768167495728e-06, -1.6242265701293945e-06, 1.434236764907837e-07, 1.911073923110962e-06, 3.67872416973114e-06, 5.446374416351318e-06, 7.214024662971497e-06, 8.981674909591675e-06, 1.0749325156211853e-05, 1.2516975402832031e-05, 1.428462564945221e-05, 1.6052275896072388e-05, 1.7819926142692566e-05, 1.9587576389312744e-05, 2.1355226635932922e-05, 2.31228768825531e-05, 2.489052712917328e-05, 2.6658177375793457e-05, 2.8425827622413635e-05, 3.0193477869033813e-05, 3.196112811565399e-05, 3.372877836227417e-05, 3.549642860889435e-05, 3.7264078855514526e-05, 3.9031729102134705e-05, 4.079937934875488e-05, 4.256702959537506e-05, 4.433467984199524e-05, 4.610233008861542e-05, 4.7869980335235596e-05, 4.9637630581855774e-05, 5.140528082847595e-05, 5.317293107509613e-05, 5.494058132171631e-05, 5.670823156833649e-05, 5.8475881814956665e-05, 6.024353206157684e-05, 6.201118230819702e-05, 6.37788325548172e-05, 6.554648280143738e-05, 6.731413304805756e-05, 6.908178329467773e-05]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 8.0, 2.0, 7.0, 3.0, 4.0, 2.0, 5.0, 10.0, 25.0, 13.0, 21.0, 23.0, 22.0, 37.0, 51.0, 70.0, 241.0, 14388.0, 1029056.0, 4094.0, 149.0, 79.0, 48.0, 25.0, 34.0, 28.0, 15.0, 10.0, 14.0, 12.0, 7.0, 10.0, 6.0, 4.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.396484375, -0.38385772705078125, -0.3712310791015625, -0.35860443115234375, -0.345977783203125, -0.33335113525390625, -0.3207244873046875, -0.30809783935546875, -0.29547119140625, -0.28284454345703125, -0.2702178955078125, -0.25759124755859375, -0.244964599609375, -0.23233795166015625, -0.2197113037109375, -0.20708465576171875, -0.1944580078125, -0.18183135986328125, -0.1692047119140625, -0.15657806396484375, -0.143951416015625, -0.13132476806640625, -0.1186981201171875, -0.10607147216796875, -0.09344482421875, -0.08081817626953125, -0.0681915283203125, -0.05556488037109375, -0.042938232421875, -0.03031158447265625, -0.0176849365234375, -0.00505828857421875, 0.007568359375, 0.02019500732421875, 0.0328216552734375, 0.04544830322265625, 0.058074951171875, 0.07070159912109375, 0.0833282470703125, 0.09595489501953125, 0.10858154296875, 0.12120819091796875, 0.1338348388671875, 0.14646148681640625, 0.159088134765625, 0.17171478271484375, 0.1843414306640625, 0.19696807861328125, 0.2095947265625, 0.22222137451171875, 0.2348480224609375, 0.24747467041015625, 0.260101318359375, 0.27272796630859375, 0.2853546142578125, 0.29798126220703125, 0.31060791015625, 0.32323455810546875, 0.3358612060546875, 0.34848785400390625, 0.361114501953125, 0.37374114990234375, 0.3863677978515625, 0.39899444580078125, 0.41162109375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 1.0, 3.0, 4.0, 6.0, 14.0, 8.0, 7.0, 8.0, 13.0, 19.0, 27.0, 33.0, 33.0, 46.0, 49.0, 49.0, 55.0, 67.0, 53.0, 73.0, 59.0, 52.0, 61.0, 47.0, 34.0, 27.0, 24.0, 26.0, 17.0, 17.0, 13.0, 10.0, 9.0, 7.0, 8.0, 4.0, 6.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0164337158203125, -0.015799522399902344, -0.015165328979492188, -0.014531135559082031, -0.013896942138671875, -0.013262748718261719, -0.012628555297851562, -0.011994361877441406, -0.01136016845703125, -0.010725975036621094, -0.010091781616210938, -0.009457588195800781, -0.008823394775390625, -0.008189201354980469, -0.0075550079345703125, -0.006920814514160156, -0.00628662109375, -0.005652427673339844, -0.0050182342529296875, -0.004384040832519531, -0.003749847412109375, -0.0031156539916992188, -0.0024814605712890625, -0.0018472671508789062, -0.00121307373046875, -0.0005788803100585938, 5.53131103515625e-05, 0.0006895065307617188, 0.001323699951171875, 0.0019578933715820312, 0.0025920867919921875, 0.0032262802124023438, 0.0038604736328125, 0.004494667053222656, 0.0051288604736328125, 0.005763053894042969, 0.006397247314453125, 0.007031440734863281, 0.0076656341552734375, 0.008299827575683594, 0.00893402099609375, 0.009568214416503906, 0.010202407836914062, 0.010836601257324219, 0.011470794677734375, 0.012104988098144531, 0.012739181518554688, 0.013373374938964844, 0.014007568359375, 0.014641761779785156, 0.015275955200195312, 0.01591014862060547, 0.016544342041015625, 0.01717853546142578, 0.017812728881835938, 0.018446922302246094, 0.01908111572265625, 0.019715309143066406, 0.020349502563476562, 0.02098369598388672, 0.021617889404296875, 0.02225208282470703, 0.022886276245117188, 0.023520469665527344, 0.0241546630859375]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 3.0, 11.0, 14.0, 26.0, 35.0, 62.0, 100.0, 150.0, 172.0, 146.0, 123.0, 51.0, 53.0, 20.0, 13.0, 9.0, 7.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.477413535118103, -0.4553607404232025, -0.4333079755306244, -0.4112551808357239, -0.38920241594314575, -0.36714962124824524, -0.3450968265533447, -0.3230440616607666, -0.3009912669658661, -0.2789384722709656, -0.25688570737838745, -0.23483291268348694, -0.21278013288974762, -0.1907273530960083, -0.1686745584011078, -0.14662177860736847, -0.12456899881362915, -0.10251621901988983, -0.08046343177556992, -0.05841064453125, -0.03635786473751068, -0.014305084943771362, 0.00774770975112915, 0.02980048954486847, 0.05185326933860779, 0.0739060491323471, 0.09595883637666702, 0.11801162362098694, 0.14006440341472626, 0.16211718320846558, 0.1841699779033661, 0.2062227576971054, 0.22827553749084473, 0.25032833218574524, 0.27238109707832336, 0.2944338917732239, 0.316486656665802, 0.3385394513607025, 0.360592246055603, 0.38264501094818115, 0.40469780564308167, 0.4267506003379822, 0.4488033652305603, 0.4708561599254608, 0.49290895462036133, 0.5149617195129395, 0.5370144844055176, 0.5590673089027405, 0.5811200737953186, 0.6031728386878967, 0.6252256631851196, 0.6472784280776978, 0.6693311929702759, 0.691383957862854, 0.7134367823600769, 0.735489547252655, 0.7575423717498779, 0.779595136642456, 0.801647961139679, 0.8237007260322571, 0.8457534909248352, 0.8678063154220581, 0.8898590803146362, 0.9119118452072144, 0.9339646100997925]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 6.0, 7.0, 8.0, 10.0, 17.0, 19.0, 29.0, 29.0, 44.0, 30.0, 31.0, 44.0, 48.0, 46.0, 45.0, 49.0, 62.0, 52.0, 56.0, 59.0, 45.0, 50.0, 33.0, 34.0, 34.0, 25.0, 23.0, 19.0, 13.0, 11.0, 4.0, 11.0, 2.0, 2.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.374891996383667, -0.3621973395347595, -0.34950268268585205, -0.3368080258369446, -0.3241133689880371, -0.31141871213912964, -0.29872405529022217, -0.2860293984413147, -0.2733347415924072, -0.26064008474349976, -0.24794542789459229, -0.23525077104568481, -0.22255611419677734, -0.20986145734786987, -0.1971667855978012, -0.18447212874889374, -0.17177745699882507, -0.1590828001499176, -0.14638814330101013, -0.13369348645210266, -0.1209988221526146, -0.10830416530370712, -0.09560950100421906, -0.08291484415531158, -0.07022018730640411, -0.05752553045749664, -0.044830869883298874, -0.032136209309101105, -0.019441552460193634, -0.006746895611286163, 0.005947768688201904, 0.018642425537109375, 0.03133705258369446, 0.04403170943260193, 0.0567263700067997, 0.06942103058099747, 0.08211568742990494, 0.09481034427881241, 0.10750500857830048, 0.12019966542720795, 0.13289432227611542, 0.1455889791250229, 0.15828363597393036, 0.17097830772399902, 0.1836729645729065, 0.19636762142181396, 0.20906227827072144, 0.2217569351196289, 0.23445159196853638, 0.24714624881744385, 0.2598409056663513, 0.2725355625152588, 0.28523021936416626, 0.29792487621307373, 0.3106195330619812, 0.32331418991088867, 0.33600884675979614, 0.3487035036087036, 0.3613981604576111, 0.37409281730651855, 0.386787474155426, 0.3994821310043335, 0.41217678785324097, 0.42487144470214844, 0.4375661313533783]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 5.0, 4.0, 8.0, 5.0, 9.0, 18.0, 22.0, 28.0, 32.0, 46.0, 72.0, 92.0, 150.0, 230.0, 318.0, 502.0, 839.0, 1501.0, 2586.0, 4830.0, 9223.0, 18370.0, 38922.0, 87838.0, 220991.0, 365720.0, 165878.0, 67388.0, 30787.0, 14913.0, 7735.0, 3978.0, 2174.0, 1242.0, 721.0, 466.0, 297.0, 182.0, 133.0, 93.0, 53.0, 41.0, 40.0, 26.0, 19.0, 9.0, 9.0, 7.0, 5.0, 2.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1292724609375, -0.12514877319335938, -0.12102508544921875, -0.11690139770507812, -0.1127777099609375, -0.10865402221679688, -0.10453033447265625, -0.10040664672851562, -0.096282958984375, -0.09215927124023438, -0.08803558349609375, -0.08391189575195312, -0.0797882080078125, -0.07566452026367188, -0.07154083251953125, -0.06741714477539062, -0.06329345703125, -0.059169769287109375, -0.05504608154296875, -0.050922393798828125, -0.0467987060546875, -0.042675018310546875, -0.03855133056640625, -0.034427642822265625, -0.030303955078125, -0.026180267333984375, -0.02205657958984375, -0.017932891845703125, -0.0138092041015625, -0.009685516357421875, -0.00556182861328125, -0.001438140869140625, 0.002685546875, 0.006809234619140625, 0.01093292236328125, 0.015056610107421875, 0.0191802978515625, 0.023303985595703125, 0.02742767333984375, 0.031551361083984375, 0.035675048828125, 0.039798736572265625, 0.04392242431640625, 0.048046112060546875, 0.0521697998046875, 0.056293487548828125, 0.06041717529296875, 0.06454086303710938, 0.06866455078125, 0.07278823852539062, 0.07691192626953125, 0.08103561401367188, 0.0851593017578125, 0.08928298950195312, 0.09340667724609375, 0.09753036499023438, 0.101654052734375, 0.10577774047851562, 0.10990142822265625, 0.11402511596679688, 0.1181488037109375, 0.12227249145507812, 0.12639617919921875, 0.13051986694335938, 0.1346435546875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 8.0, 4.0, 9.0, 9.0, 18.0, 17.0, 13.0, 23.0, 13.0, 34.0, 33.0, 26.0, 36.0, 36.0, 46.0, 43.0, 54.0, 64.0, 57.0, 49.0, 42.0, 45.0, 52.0, 38.0, 36.0, 31.0, 29.0, 26.0, 23.0, 13.0, 13.0, 11.0, 11.0, 9.0, 6.0, 8.0, 5.0, 7.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8779296875, -1.8259124755859375, -1.773895263671875, -1.7218780517578125, -1.66986083984375, -1.6178436279296875, -1.565826416015625, -1.5138092041015625, -1.4617919921875, -1.4097747802734375, -1.357757568359375, -1.3057403564453125, -1.25372314453125, -1.2017059326171875, -1.149688720703125, -1.0976715087890625, -1.045654296875, -0.9936370849609375, -0.941619873046875, -0.8896026611328125, -0.83758544921875, -0.7855682373046875, -0.733551025390625, -0.6815338134765625, -0.6295166015625, -0.5774993896484375, -0.525482177734375, -0.4734649658203125, -0.42144775390625, -0.3694305419921875, -0.317413330078125, -0.2653961181640625, -0.21337890625, -0.1613616943359375, -0.109344482421875, -0.0573272705078125, -0.00531005859375, 0.0467071533203125, 0.098724365234375, 0.1507415771484375, 0.2027587890625, 0.2547760009765625, 0.306793212890625, 0.3588104248046875, 0.41082763671875, 0.4628448486328125, 0.514862060546875, 0.5668792724609375, 0.618896484375, 0.6709136962890625, 0.722930908203125, 0.7749481201171875, 0.82696533203125, 0.8789825439453125, 0.930999755859375, 0.9830169677734375, 1.0350341796875, 1.0870513916015625, 1.139068603515625, 1.1910858154296875, 1.24310302734375, 1.2951202392578125, 1.347137451171875, 1.3991546630859375, 1.451171875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 6.0, 4.0, 2.0, 5.0, 7.0, 16.0, 14.0, 24.0, 30.0, 51.0, 45.0, 57.0, 65.0, 80.0, 343.0, 1045766.0, 1505.0, 156.0, 78.0, 53.0, 48.0, 47.0, 44.0, 29.0, 19.0, 20.0, 10.0, 11.0, 8.0, 7.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.91796875, -6.7298583984375, -6.541748046875, -6.3536376953125, -6.16552734375, -5.9774169921875, -5.789306640625, -5.6011962890625, -5.4130859375, -5.2249755859375, -5.036865234375, -4.8487548828125, -4.66064453125, -4.4725341796875, -4.284423828125, -4.0963134765625, -3.908203125, -3.7200927734375, -3.531982421875, -3.3438720703125, -3.15576171875, -2.9676513671875, -2.779541015625, -2.5914306640625, -2.4033203125, -2.2152099609375, -2.027099609375, -1.8389892578125, -1.65087890625, -1.4627685546875, -1.274658203125, -1.0865478515625, -0.8984375, -0.7103271484375, -0.522216796875, -0.3341064453125, -0.14599609375, 0.0421142578125, 0.230224609375, 0.4183349609375, 0.6064453125, 0.7945556640625, 0.982666015625, 1.1707763671875, 1.35888671875, 1.5469970703125, 1.735107421875, 1.9232177734375, 2.111328125, 2.2994384765625, 2.487548828125, 2.6756591796875, 2.86376953125, 3.0518798828125, 3.239990234375, 3.4281005859375, 3.6162109375, 3.8043212890625, 3.992431640625, 4.1805419921875, 4.36865234375, 4.5567626953125, 4.744873046875, 4.9329833984375, 5.12109375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 6.0, 4.0, 2.0, 4.0, 8.0, 18.0, 12.0, 27.0, 31.0, 50.0, 50.0, 50.0, 50.0, 66.0, 67.0, 79.0, 61.0, 58.0, 63.0, 49.0, 49.0, 48.0, 43.0, 27.0, 21.0, 19.0, 10.0, 11.0, 8.0, 8.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.755859375, -2.6807861328125, -2.605712890625, -2.5306396484375, -2.45556640625, -2.3804931640625, -2.305419921875, -2.2303466796875, -2.1552734375, -2.0802001953125, -2.005126953125, -1.9300537109375, -1.85498046875, -1.7799072265625, -1.704833984375, -1.6297607421875, -1.5546875, -1.4796142578125, -1.404541015625, -1.3294677734375, -1.25439453125, -1.1793212890625, -1.104248046875, -1.0291748046875, -0.9541015625, -0.8790283203125, -0.803955078125, -0.7288818359375, -0.65380859375, -0.5787353515625, -0.503662109375, -0.4285888671875, -0.353515625, -0.2784423828125, -0.203369140625, -0.1282958984375, -0.05322265625, 0.0218505859375, 0.096923828125, 0.1719970703125, 0.2470703125, 0.3221435546875, 0.397216796875, 0.4722900390625, 0.54736328125, 0.6224365234375, 0.697509765625, 0.7725830078125, 0.84765625, 0.9227294921875, 0.997802734375, 1.0728759765625, 1.14794921875, 1.2230224609375, 1.298095703125, 1.3731689453125, 1.4482421875, 1.5233154296875, 1.598388671875, 1.6734619140625, 1.74853515625, 1.8236083984375, 1.898681640625, 1.9737548828125, 2.048828125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 3.0, 4.0, 13.0, 6.0, 10.0, 11.0, 16.0, 28.0, 56.0, 119.0, 909.0, 47024.0, 995990.0, 3841.0, 290.0, 99.0, 41.0, 22.0, 18.0, 11.0, 15.0, 12.0, 3.0, 4.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2939453125, -0.2842254638671875, -0.274505615234375, -0.2647857666015625, -0.25506591796875, -0.2453460693359375, -0.235626220703125, -0.2259063720703125, -0.2161865234375, -0.2064666748046875, -0.196746826171875, -0.1870269775390625, -0.17730712890625, -0.1675872802734375, -0.157867431640625, -0.1481475830078125, -0.138427734375, -0.1287078857421875, -0.118988037109375, -0.1092681884765625, -0.09954833984375, -0.0898284912109375, -0.080108642578125, -0.0703887939453125, -0.0606689453125, -0.0509490966796875, -0.041229248046875, -0.0315093994140625, -0.02178955078125, -0.0120697021484375, -0.002349853515625, 0.0073699951171875, 0.01708984375, 0.0268096923828125, 0.036529541015625, 0.0462493896484375, 0.05596923828125, 0.0656890869140625, 0.075408935546875, 0.0851287841796875, 0.0948486328125, 0.1045684814453125, 0.114288330078125, 0.1240081787109375, 0.13372802734375, 0.1434478759765625, 0.153167724609375, 0.1628875732421875, 0.172607421875, 0.1823272705078125, 0.192047119140625, 0.2017669677734375, 0.21148681640625, 0.2212066650390625, 0.230926513671875, 0.2406463623046875, 0.2503662109375, 0.2600860595703125, 0.269805908203125, 0.2795257568359375, 0.28924560546875, 0.2989654541015625, 0.308685302734375, 0.3184051513671875, 0.328125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 2.0, 9.0, 11.0, 11.0, 22.0, 24.0, 53.0, 76.0, 184.0, 223.0, 162.0, 68.0, 49.0, 29.0, 21.0, 7.0, 9.0, 12.0, 7.0, 5.0, 5.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.110004425048828e-05, -2.0592473447322845e-05, -2.008490264415741e-05, -1.9577331840991974e-05, -1.9069761037826538e-05, -1.8562190234661102e-05, -1.8054619431495667e-05, -1.754704862833023e-05, -1.7039477825164795e-05, -1.653190702199936e-05, -1.6024336218833923e-05, -1.5516765415668488e-05, -1.5009194612503052e-05, -1.4501623809337616e-05, -1.399405300617218e-05, -1.3486482203006744e-05, -1.2978911399841309e-05, -1.2471340596675873e-05, -1.1963769793510437e-05, -1.1456198990345001e-05, -1.0948628187179565e-05, -1.044105738401413e-05, -9.933486580848694e-06, -9.425915777683258e-06, -8.918344974517822e-06, -8.410774171352386e-06, -7.90320336818695e-06, -7.395632565021515e-06, -6.888061761856079e-06, -6.380490958690643e-06, -5.8729201555252075e-06, -5.365349352359772e-06, -4.857778549194336e-06, -4.3502077460289e-06, -3.842636942863464e-06, -3.3350661396980286e-06, -2.8274953365325928e-06, -2.319924533367157e-06, -1.8123537302017212e-06, -1.3047829270362854e-06, -7.972121238708496e-07, -2.896413207054138e-07, 2.1792948246002197e-07, 7.255002856254578e-07, 1.2330710887908936e-06, 1.7406418919563293e-06, 2.248212695121765e-06, 2.755783498287201e-06, 3.2633543014526367e-06, 3.7709251046180725e-06, 4.278495907783508e-06, 4.786066710948944e-06, 5.29363751411438e-06, 5.801208317279816e-06, 6.3087791204452515e-06, 6.816349923610687e-06, 7.323920726776123e-06, 7.831491529941559e-06, 8.339062333106995e-06, 8.84663313627243e-06, 9.354203939437866e-06, 9.861774742603302e-06, 1.0369345545768738e-05, 1.0876916348934174e-05, 1.138448715209961e-05]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 7.0, 8.0, 7.0, 6.0, 10.0, 31.0, 43.0, 45.0, 147.0, 408.0, 2067.0, 22442.0, 948740.0, 69620.0, 3908.0, 698.0, 151.0, 80.0, 50.0, 24.0, 16.0, 14.0, 8.0, 4.0, 1.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.177734375, -0.1726055145263672, -0.16747665405273438, -0.16234779357910156, -0.15721893310546875, -0.15209007263183594, -0.14696121215820312, -0.1418323516845703, -0.1367034912109375, -0.1315746307373047, -0.12644577026367188, -0.12131690979003906, -0.11618804931640625, -0.11105918884277344, -0.10593032836914062, -0.10080146789550781, -0.095672607421875, -0.09054374694824219, -0.08541488647460938, -0.08028602600097656, -0.07515716552734375, -0.07002830505371094, -0.06489944458007812, -0.05977058410644531, -0.0546417236328125, -0.04951286315917969, -0.044384002685546875, -0.03925514221191406, -0.03412628173828125, -0.028997421264648438, -0.023868560791015625, -0.018739700317382812, -0.01361083984375, -0.008481979370117188, -0.003353118896484375, 0.0017757415771484375, 0.00690460205078125, 0.012033462524414062, 0.017162322998046875, 0.022291183471679688, 0.0274200439453125, 0.03254890441894531, 0.037677764892578125, 0.04280662536621094, 0.04793548583984375, 0.05306434631347656, 0.058193206787109375, 0.06332206726074219, 0.068450927734375, 0.07357978820800781, 0.07870864868164062, 0.08383750915527344, 0.08896636962890625, 0.09409523010253906, 0.09922409057617188, 0.10435295104980469, 0.1094818115234375, 0.11461067199707031, 0.11973953247070312, 0.12486839294433594, 0.12999725341796875, 0.13512611389160156, 0.14025497436523438, 0.1453838348388672, 0.1505126953125]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 1.0, 4.0, 9.0, 14.0, 17.0, 22.0, 28.0, 41.0, 65.0, 91.0, 110.0, 137.0, 141.0, 91.0, 48.0, 44.0, 30.0, 21.0, 25.0, 11.0, 13.0, 12.0, 5.0, 5.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0243988037109375, -0.023578405380249023, -0.022758007049560547, -0.02193760871887207, -0.021117210388183594, -0.020296812057495117, -0.01947641372680664, -0.018656015396118164, -0.017835617065429688, -0.01701521873474121, -0.016194820404052734, -0.015374422073364258, -0.014554023742675781, -0.013733625411987305, -0.012913227081298828, -0.012092828750610352, -0.011272430419921875, -0.010452032089233398, -0.009631633758544922, -0.008811235427856445, -0.007990837097167969, -0.007170438766479492, -0.006350040435791016, -0.005529642105102539, -0.0047092437744140625, -0.003888845443725586, -0.0030684471130371094, -0.002248048782348633, -0.0014276504516601562, -0.0006072521209716797, 0.00021314620971679688, 0.0010335445404052734, 0.00185394287109375, 0.0026743412017822266, 0.003494739532470703, 0.00431513786315918, 0.005135536193847656, 0.005955934524536133, 0.006776332855224609, 0.007596731185913086, 0.008417129516601562, 0.009237527847290039, 0.010057926177978516, 0.010878324508666992, 0.011698722839355469, 0.012519121170043945, 0.013339519500732422, 0.014159917831420898, 0.014980316162109375, 0.01580071449279785, 0.016621112823486328, 0.017441511154174805, 0.01826190948486328, 0.019082307815551758, 0.019902706146240234, 0.02072310447692871, 0.021543502807617188, 0.022363901138305664, 0.02318429946899414, 0.024004697799682617, 0.024825096130371094, 0.02564549446105957, 0.026465892791748047, 0.027286291122436523, 0.028106689453125]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 13.0, 35.0, 115.0, 333.0, 351.0, 114.0, 38.0, 9.0, 8.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8259516954421997, -0.7229790091514587, -0.6200063228607178, -0.5170336365699768, -0.41406095027923584, -0.3110882639884949, -0.2081155776977539, -0.10514289140701294, -0.0021702051162719727, 0.100802481174469, 0.20377516746520996, 0.3067478537559509, 0.4097205400466919, 0.5126932263374329, 0.6156659126281738, 0.7186385989189148, 0.8216112852096558, 0.9245839715003967, 1.0275566577911377, 1.1305294036865234, 1.2335020303726196, 1.3364746570587158, 1.4394474029541016, 1.5424201488494873, 1.6453927755355835, 1.7483654022216797, 1.8513381481170654, 1.9543108940124512, 2.057283401489258, 2.1602561473846436, 2.2632288932800293, 2.366201639175415, 2.469174385070801, 2.5721471309661865, 2.6751198768615723, 2.778092384338379, 2.8810651302337646, 2.9840378761291504, 3.087010383605957, 3.1899831295013428, 3.2929558753967285, 3.3959286212921143, 3.4989013671875, 3.6018738746643066, 3.7048466205596924, 3.807819366455078, 3.9107918739318848, 4.01376485824585, 4.116737365722656, 4.219709873199463, 4.322682857513428, 4.425655364990234, 4.528628349304199, 4.631600856781006, 4.7345733642578125, 4.837546348571777, 4.940518856048584, 5.043491363525391, 5.1464643478393555, 5.249436855316162, 5.352409362792969, 5.455382347106934, 5.55835485458374, 5.661327838897705, 5.764300346374512]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 8.0, 7.0, 6.0, 11.0, 12.0, 17.0, 15.0, 17.0, 19.0, 30.0, 24.0, 31.0, 43.0, 29.0, 30.0, 38.0, 35.0, 40.0, 43.0, 50.0, 57.0, 40.0, 48.0, 33.0, 42.0, 33.0, 42.0, 26.0, 33.0, 34.0, 30.0, 16.0, 14.0, 15.0, 9.0, 8.0, 10.0, 4.0, 5.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4271254539489746, -2.3518643379211426, -2.2766032218933105, -2.2013418674468994, -2.1260807514190674, -2.0508196353912354, -1.9755585193634033, -1.9002974033355713, -1.8250361680984497, -1.7497750520706177, -1.674513816833496, -1.599252700805664, -1.523991584777832, -1.4487303495407104, -1.3734692335128784, -1.2982079982757568, -1.2229468822479248, -1.1476857662200928, -1.0724245309829712, -0.9971634149551392, -0.9219022393226624, -0.8466410636901855, -0.7713799476623535, -0.6961187720298767, -0.6208575963973999, -0.5455964207649231, -0.4703352749347687, -0.39507412910461426, -0.31981295347213745, -0.24455177783966064, -0.16929063200950623, -0.0940294861793518, -0.018768310546875, 0.05649285018444061, 0.13175401091575623, 0.20701517164707184, 0.28227633237838745, 0.35753750801086426, 0.4327986538410187, 0.5080597996711731, 0.5833209753036499, 0.6585821509361267, 0.7338433265686035, 0.8091044425964355, 0.8843656182289124, 0.9596267938613892, 1.0348879098892212, 1.1101491451263428, 1.1854102611541748, 1.2606713771820068, 1.3359326124191284, 1.4111937284469604, 1.486454963684082, 1.561716079711914, 1.636977195739746, 1.7122383117675781, 1.7874995470046997, 1.8627606630325317, 1.9380218982696533, 2.0132830142974854, 2.0885441303253174, 2.1638054847717285, 2.2390666007995605, 2.3143277168273926, 2.3895888328552246]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 5.0, 3.0, 5.0, 5.0, 14.0, 10.0, 8.0, 13.0, 13.0, 18.0, 24.0, 26.0, 31.0, 31.0, 69.0, 130.0, 366.0, 1186.0, 4414.0, 29050.0, 3083652.0, 1051195.0, 18500.0, 3691.0, 1058.0, 363.0, 123.0, 64.0, 47.0, 37.0, 28.0, 30.0, 14.0, 13.0, 14.0, 13.0, 7.0, 9.0, 5.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.89453125, -1.836944580078125, -1.77935791015625, -1.721771240234375, -1.6641845703125, -1.606597900390625, -1.54901123046875, -1.491424560546875, -1.433837890625, -1.376251220703125, -1.31866455078125, -1.261077880859375, -1.2034912109375, -1.145904541015625, -1.08831787109375, -1.030731201171875, -0.97314453125, -0.915557861328125, -0.85797119140625, -0.800384521484375, -0.7427978515625, -0.685211181640625, -0.62762451171875, -0.570037841796875, -0.512451171875, -0.454864501953125, -0.39727783203125, -0.339691162109375, -0.2821044921875, -0.224517822265625, -0.16693115234375, -0.109344482421875, -0.0517578125, 0.005828857421875, 0.06341552734375, 0.121002197265625, 0.1785888671875, 0.236175537109375, 0.29376220703125, 0.351348876953125, 0.408935546875, 0.466522216796875, 0.52410888671875, 0.581695556640625, 0.6392822265625, 0.696868896484375, 0.75445556640625, 0.812042236328125, 0.86962890625, 0.927215576171875, 0.98480224609375, 1.042388916015625, 1.0999755859375, 1.157562255859375, 1.21514892578125, 1.272735595703125, 1.330322265625, 1.387908935546875, 1.44549560546875, 1.503082275390625, 1.5606689453125, 1.618255615234375, 1.67584228515625, 1.733428955078125, 1.791015625]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 13.0, 15.0, 18.0, 22.0, 23.0, 29.0, 40.0, 31.0, 43.0, 69.0, 74.0, 64.0, 54.0, 61.0, 84.0, 58.0, 54.0, 56.0, 45.0, 30.0, 35.0, 22.0, 16.0, 9.0, 9.0, 7.0, 5.0, 4.0, 2.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2958984375, -0.2823486328125, -0.268798828125, -0.2552490234375, -0.24169921875, -0.2281494140625, -0.214599609375, -0.2010498046875, -0.1875, -0.1739501953125, -0.160400390625, -0.1468505859375, -0.13330078125, -0.1197509765625, -0.106201171875, -0.0926513671875, -0.0791015625, -0.0655517578125, -0.052001953125, -0.0384521484375, -0.02490234375, -0.0113525390625, 0.002197265625, 0.0157470703125, 0.029296875, 0.0428466796875, 0.056396484375, 0.0699462890625, 0.08349609375, 0.0970458984375, 0.110595703125, 0.1241455078125, 0.1376953125, 0.1512451171875, 0.164794921875, 0.1783447265625, 0.19189453125, 0.2054443359375, 0.218994140625, 0.2325439453125, 0.24609375, 0.2596435546875, 0.273193359375, 0.2867431640625, 0.30029296875, 0.3138427734375, 0.327392578125, 0.3409423828125, 0.3544921875, 0.3680419921875, 0.381591796875, 0.3951416015625, 0.40869140625, 0.4222412109375, 0.435791015625, 0.4493408203125, 0.462890625, 0.4764404296875, 0.489990234375, 0.5035400390625, 0.51708984375, 0.5306396484375, 0.544189453125, 0.5577392578125, 0.5712890625]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 7.0, 5.0, 20.0, 40.0, 148.0, 432.0, 10353.0, 4181463.0, 1370.0, 298.0, 91.0, 29.0, 8.0, 4.0, 2.0, 4.0, 7.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.62890625, -5.37640380859375, -5.1239013671875, -4.87139892578125, -4.618896484375, -4.36639404296875, -4.1138916015625, -3.86138916015625, -3.60888671875, -3.35638427734375, -3.1038818359375, -2.85137939453125, -2.598876953125, -2.34637451171875, -2.0938720703125, -1.84136962890625, -1.5888671875, -1.33636474609375, -1.0838623046875, -0.83135986328125, -0.578857421875, -0.32635498046875, -0.0738525390625, 0.17864990234375, 0.43115234375, 0.68365478515625, 0.9361572265625, 1.18865966796875, 1.441162109375, 1.69366455078125, 1.9461669921875, 2.19866943359375, 2.451171875, 2.70367431640625, 2.9561767578125, 3.20867919921875, 3.461181640625, 3.71368408203125, 3.9661865234375, 4.21868896484375, 4.47119140625, 4.72369384765625, 4.9761962890625, 5.22869873046875, 5.481201171875, 5.73370361328125, 5.9862060546875, 6.23870849609375, 6.4912109375, 6.74371337890625, 6.9962158203125, 7.24871826171875, 7.501220703125, 7.75372314453125, 8.0062255859375, 8.25872802734375, 8.51123046875, 8.76373291015625, 9.0162353515625, 9.26873779296875, 9.521240234375, 9.77374267578125, 10.0262451171875, 10.27874755859375, 10.53125]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 4.0, 3.0, 7.0, 4.0, 8.0, 14.0, 12.0, 19.0, 30.0, 46.0, 68.0, 78.0, 149.0, 285.0, 612.0, 1065.0, 811.0, 360.0, 170.0, 89.0, 77.0, 39.0, 34.0, 26.0, 18.0, 13.0, 11.0, 7.0, 4.0, 4.0, 3.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2861328125, -0.2781181335449219, -0.27010345458984375, -0.2620887756347656, -0.2540740966796875, -0.24605941772460938, -0.23804473876953125, -0.23003005981445312, -0.222015380859375, -0.21400070190429688, -0.20598602294921875, -0.19797134399414062, -0.1899566650390625, -0.18194198608398438, -0.17392730712890625, -0.16591262817382812, -0.15789794921875, -0.14988327026367188, -0.14186859130859375, -0.13385391235351562, -0.1258392333984375, -0.11782455444335938, -0.10980987548828125, -0.10179519653320312, -0.093780517578125, -0.08576583862304688, -0.07775115966796875, -0.06973648071289062, -0.0617218017578125, -0.053707122802734375, -0.04569244384765625, -0.037677764892578125, -0.0296630859375, -0.021648406982421875, -0.01363372802734375, -0.005619049072265625, 0.0023956298828125, 0.010410308837890625, 0.01842498779296875, 0.026439666748046875, 0.034454345703125, 0.042469024658203125, 0.05048370361328125, 0.058498382568359375, 0.0665130615234375, 0.07452774047851562, 0.08254241943359375, 0.09055709838867188, 0.09857177734375, 0.10658645629882812, 0.11460113525390625, 0.12261581420898438, 0.1306304931640625, 0.13864517211914062, 0.14665985107421875, 0.15467453002929688, 0.162689208984375, 0.17070388793945312, 0.17871856689453125, 0.18673324584960938, 0.1947479248046875, 0.20276260375976562, 0.21077728271484375, 0.21879196166992188, 0.226806640625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 9.0, 17.0, 35.0, 44.0, 75.0, 125.0, 193.0, 187.0, 122.0, 68.0, 52.0, 26.0, 17.0, 11.0, 7.0, 2.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5024560689926147, -0.4691631495952606, -0.4358702003955841, -0.40257728099823, -0.36928433179855347, -0.33599141240119934, -0.3026984930038452, -0.2694055438041687, -0.23611262440681458, -0.20281969010829926, -0.16952675580978394, -0.1362338364124298, -0.10294090211391449, -0.06964796781539917, -0.036355048418045044, -0.003062114119529724, 0.030230820178985596, 0.06352375447750092, 0.09681668132543564, 0.13010960817337036, 0.16340254247188568, 0.196695476770401, 0.22998839616775513, 0.26328134536743164, 0.29657426476478577, 0.3298671841621399, 0.3631601333618164, 0.39645305275917053, 0.42974597215652466, 0.46303892135620117, 0.4963318407535553, 0.5296247601509094, 0.5629177093505859, 0.5962106585502625, 0.6295035481452942, 0.6627964973449707, 0.6960894465446472, 0.7293823957443237, 0.7626752853393555, 0.795968234539032, 0.8292611837387085, 0.862554132938385, 0.8958470225334167, 0.9291399717330933, 0.9624329209327698, 0.9957258701324463, 1.029018759727478, 1.0623116493225098, 1.095604658126831, 1.1288975477218628, 1.162190556526184, 1.1954834461212158, 1.2287763357162476, 1.2620693445205688, 1.2953622341156006, 1.3286551237106323, 1.361948013305664, 1.3952409029006958, 1.428533911705017, 1.4618268013000488, 1.4951196908950806, 1.5284126996994019, 1.5617055892944336, 1.5949984788894653, 1.6282914876937866]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 8.0, 4.0, 9.0, 16.0, 13.0, 13.0, 11.0, 24.0, 18.0, 21.0, 23.0, 39.0, 40.0, 48.0, 46.0, 49.0, 38.0, 44.0, 64.0, 46.0, 52.0, 38.0, 45.0, 52.0, 33.0, 28.0, 32.0, 43.0, 18.0, 13.0, 19.0, 13.0, 11.0, 9.0, 3.0, 8.0, 2.0, 3.0, 3.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3722960650920868, -0.35986608266830444, -0.3474361002445221, -0.33500614762306213, -0.3225761651992798, -0.31014618277549744, -0.2977162003517151, -0.2852862477302551, -0.2728562653064728, -0.26042628288269043, -0.24799631536006927, -0.23556633293628693, -0.22313636541366577, -0.21070638298988342, -0.19827640056610107, -0.18584643304347992, -0.17341645061969757, -0.16098646819591522, -0.14855650067329407, -0.13612651824951172, -0.12369655072689056, -0.11126656830310822, -0.09883659332990646, -0.08640661835670471, -0.07397664338350296, -0.06154666841030121, -0.04911669343709946, -0.03668671473860741, -0.024256739765405655, -0.011826764792203903, 0.000603213906288147, 0.013033188879489899, 0.02546316385269165, 0.0378931388258934, 0.050323113799095154, 0.0627530962228775, 0.07518306374549866, 0.087613046169281, 0.10004302114248276, 0.11247299611568451, 0.12490297108888626, 0.137332946062088, 0.14976292848587036, 0.16219289600849152, 0.17462287843227386, 0.18705284595489502, 0.19948282837867737, 0.21191281080245972, 0.22434277832508087, 0.23677276074886322, 0.24920272827148438, 0.2616327106952667, 0.2740626931190491, 0.28649264574050903, 0.2989226281642914, 0.31135261058807373, 0.3237825930118561, 0.3362125754356384, 0.3486425578594208, 0.36107251048088074, 0.3735024929046631, 0.38593247532844543, 0.3983624577522278, 0.41079241037368774, 0.4232223927974701]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 6.0, 4.0, 9.0, 8.0, 20.0, 23.0, 28.0, 47.0, 50.0, 75.0, 118.0, 175.0, 274.0, 399.0, 613.0, 966.0, 1692.0, 2866.0, 5055.0, 9299.0, 18621.0, 43428.0, 146776.0, 519884.0, 198565.0, 53478.0, 21740.0, 10668.0, 5629.0, 3165.0, 1802.0, 1067.0, 708.0, 461.0, 275.0, 172.0, 113.0, 84.0, 62.0, 36.0, 23.0, 23.0, 13.0, 9.0, 10.0, 5.0, 3.0, 9.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.18212890625, -0.17552947998046875, -0.1689300537109375, -0.16233062744140625, -0.155731201171875, -0.14913177490234375, -0.1425323486328125, -0.13593292236328125, -0.12933349609375, -0.12273406982421875, -0.1161346435546875, -0.10953521728515625, -0.102935791015625, -0.09633636474609375, -0.0897369384765625, -0.08313751220703125, -0.0765380859375, -0.06993865966796875, -0.0633392333984375, -0.05673980712890625, -0.050140380859375, -0.04354095458984375, -0.0369415283203125, -0.03034210205078125, -0.02374267578125, -0.01714324951171875, -0.0105438232421875, -0.00394439697265625, 0.002655029296875, 0.00925445556640625, 0.0158538818359375, 0.02245330810546875, 0.029052734375, 0.03565216064453125, 0.0422515869140625, 0.04885101318359375, 0.055450439453125, 0.06204986572265625, 0.0686492919921875, 0.07524871826171875, 0.08184814453125, 0.08844757080078125, 0.0950469970703125, 0.10164642333984375, 0.108245849609375, 0.11484527587890625, 0.1214447021484375, 0.12804412841796875, 0.1346435546875, 0.14124298095703125, 0.1478424072265625, 0.15444183349609375, 0.161041259765625, 0.16764068603515625, 0.1742401123046875, 0.18083953857421875, 0.18743896484375, 0.19403839111328125, 0.2006378173828125, 0.20723724365234375, 0.213836669921875, 0.22043609619140625, 0.2270355224609375, 0.23363494873046875, 0.240234375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 4.0, 5.0, 9.0, 6.0, 8.0, 17.0, 23.0, 23.0, 22.0, 33.0, 36.0, 47.0, 54.0, 57.0, 61.0, 60.0, 78.0, 61.0, 59.0, 52.0, 61.0, 48.0, 39.0, 35.0, 35.0, 24.0, 9.0, 11.0, 9.0, 5.0, 7.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26025390625, -0.2511138916015625, -0.241973876953125, -0.2328338623046875, -0.22369384765625, -0.2145538330078125, -0.205413818359375, -0.1962738037109375, -0.1871337890625, -0.1779937744140625, -0.168853759765625, -0.1597137451171875, -0.15057373046875, -0.1414337158203125, -0.132293701171875, -0.1231536865234375, -0.114013671875, -0.1048736572265625, -0.095733642578125, -0.0865936279296875, -0.07745361328125, -0.0683135986328125, -0.059173583984375, -0.0500335693359375, -0.0408935546875, -0.0317535400390625, -0.022613525390625, -0.0134735107421875, -0.00433349609375, 0.0048065185546875, 0.013946533203125, 0.0230865478515625, 0.0322265625, 0.0413665771484375, 0.050506591796875, 0.0596466064453125, 0.06878662109375, 0.0779266357421875, 0.087066650390625, 0.0962066650390625, 0.1053466796875, 0.1144866943359375, 0.123626708984375, 0.1327667236328125, 0.14190673828125, 0.1510467529296875, 0.160186767578125, 0.1693267822265625, 0.178466796875, 0.1876068115234375, 0.196746826171875, 0.2058868408203125, 0.21502685546875, 0.2241668701171875, 0.233306884765625, 0.2424468994140625, 0.2515869140625, 0.2607269287109375, 0.269866943359375, 0.2790069580078125, 0.28814697265625, 0.2972869873046875, 0.306427001953125, 0.3155670166015625, 0.32470703125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 2.0, 8.0, 2.0, 10.0, 23.0, 33.0, 45.0, 74.0, 154.0, 323.0, 810.0, 2030.0, 6321.0, 23856.0, 152287.0, 737888.0, 98991.0, 17819.0, 5017.0, 1637.0, 600.0, 282.0, 134.0, 63.0, 41.0, 26.0, 20.0, 12.0, 11.0, 11.0, 3.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.265625, -0.256591796875, -0.24755859375, -0.238525390625, -0.2294921875, -0.220458984375, -0.21142578125, -0.202392578125, -0.193359375, -0.184326171875, -0.17529296875, -0.166259765625, -0.1572265625, -0.148193359375, -0.13916015625, -0.130126953125, -0.12109375, -0.112060546875, -0.10302734375, -0.093994140625, -0.0849609375, -0.075927734375, -0.06689453125, -0.057861328125, -0.048828125, -0.039794921875, -0.03076171875, -0.021728515625, -0.0126953125, -0.003662109375, 0.00537109375, 0.014404296875, 0.0234375, 0.032470703125, 0.04150390625, 0.050537109375, 0.0595703125, 0.068603515625, 0.07763671875, 0.086669921875, 0.095703125, 0.104736328125, 0.11376953125, 0.122802734375, 0.1318359375, 0.140869140625, 0.14990234375, 0.158935546875, 0.16796875, 0.177001953125, 0.18603515625, 0.195068359375, 0.2041015625, 0.213134765625, 0.22216796875, 0.231201171875, 0.240234375, 0.249267578125, 0.25830078125, 0.267333984375, 0.2763671875, 0.285400390625, 0.29443359375, 0.303466796875, 0.3125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 8.0, 5.0, 8.0, 26.0, 16.0, 31.0, 30.0, 25.0, 44.0, 42.0, 49.0, 48.0, 58.0, 67.0, 70.0, 55.0, 62.0, 43.0, 43.0, 42.0, 36.0, 46.0, 36.0, 26.0, 19.0, 12.0, 12.0, 8.0, 10.0, 9.0, 3.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.50390625, -0.488800048828125, -0.47369384765625, -0.458587646484375, -0.4434814453125, -0.428375244140625, -0.41326904296875, -0.398162841796875, -0.383056640625, -0.367950439453125, -0.35284423828125, -0.337738037109375, -0.3226318359375, -0.307525634765625, -0.29241943359375, -0.277313232421875, -0.26220703125, -0.247100830078125, -0.23199462890625, -0.216888427734375, -0.2017822265625, -0.186676025390625, -0.17156982421875, -0.156463623046875, -0.141357421875, -0.126251220703125, -0.11114501953125, -0.096038818359375, -0.0809326171875, -0.065826416015625, -0.05072021484375, -0.035614013671875, -0.0205078125, -0.005401611328125, 0.00970458984375, 0.024810791015625, 0.0399169921875, 0.055023193359375, 0.07012939453125, 0.085235595703125, 0.100341796875, 0.115447998046875, 0.13055419921875, 0.145660400390625, 0.1607666015625, 0.175872802734375, 0.19097900390625, 0.206085205078125, 0.22119140625, 0.236297607421875, 0.25140380859375, 0.266510009765625, 0.2816162109375, 0.296722412109375, 0.31182861328125, 0.326934814453125, 0.342041015625, 0.357147216796875, 0.37225341796875, 0.387359619140625, 0.4024658203125, 0.417572021484375, 0.43267822265625, 0.447784423828125, 0.462890625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 6.0, 16.0, 17.0, 33.0, 31.0, 42.0, 69.0, 97.0, 158.0, 221.0, 370.0, 616.0, 1136.0, 2112.0, 4125.0, 8627.0, 21913.0, 77474.0, 462809.0, 369217.0, 64244.0, 19250.0, 7884.0, 3692.0, 1825.0, 974.0, 562.0, 347.0, 249.0, 128.0, 84.0, 51.0, 51.0, 26.0, 34.0, 16.0, 9.0, 8.0, 3.0, 6.0, 8.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.046844482421875, -0.045330047607421875, -0.04381561279296875, -0.042301177978515625, -0.0407867431640625, -0.039272308349609375, -0.03775787353515625, -0.036243438720703125, -0.03472900390625, -0.033214569091796875, -0.03170013427734375, -0.030185699462890625, -0.0286712646484375, -0.027156829833984375, -0.02564239501953125, -0.024127960205078125, -0.022613525390625, -0.021099090576171875, -0.01958465576171875, -0.018070220947265625, -0.0165557861328125, -0.015041351318359375, -0.01352691650390625, -0.012012481689453125, -0.010498046875, -0.008983612060546875, -0.00746917724609375, -0.005954742431640625, -0.0044403076171875, -0.002925872802734375, -0.00141143798828125, 0.000102996826171875, 0.001617431640625, 0.003131866455078125, 0.00464630126953125, 0.006160736083984375, 0.0076751708984375, 0.009189605712890625, 0.01070404052734375, 0.012218475341796875, 0.01373291015625, 0.015247344970703125, 0.01676177978515625, 0.018276214599609375, 0.0197906494140625, 0.021305084228515625, 0.02281951904296875, 0.024333953857421875, 0.025848388671875, 0.027362823486328125, 0.02887725830078125, 0.030391693115234375, 0.0319061279296875, 0.033420562744140625, 0.03493499755859375, 0.036449432373046875, 0.0379638671875, 0.039478302001953125, 0.04099273681640625, 0.042507171630859375, 0.0440216064453125, 0.045536041259765625, 0.04705047607421875, 0.048564910888671875, 0.050079345703125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 7.0, 9.0, 20.0, 24.0, 38.0, 70.0, 106.0, 157.0, 174.0, 140.0, 82.0, 66.0, 27.0, 14.0, 16.0, 10.0, 6.0, 8.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.029273986816406e-05, -3.904476761817932e-05, -3.779679536819458e-05, -3.654882311820984e-05, -3.53008508682251e-05, -3.4052878618240356e-05, -3.2804906368255615e-05, -3.1556934118270874e-05, -3.0308961868286133e-05, -2.906098961830139e-05, -2.781301736831665e-05, -2.656504511833191e-05, -2.5317072868347168e-05, -2.4069100618362427e-05, -2.2821128368377686e-05, -2.1573156118392944e-05, -2.0325183868408203e-05, -1.9077211618423462e-05, -1.782923936843872e-05, -1.658126711845398e-05, -1.5333294868469238e-05, -1.4085322618484497e-05, -1.2837350368499756e-05, -1.1589378118515015e-05, -1.0341405868530273e-05, -9.093433618545532e-06, -7.845461368560791e-06, -6.59748911857605e-06, -5.349516868591309e-06, -4.101544618606567e-06, -2.853572368621826e-06, -1.605600118637085e-06, -3.5762786865234375e-07, 8.903443813323975e-07, 2.1383166313171387e-06, 3.38628888130188e-06, 4.634261131286621e-06, 5.882233381271362e-06, 7.1302056312561035e-06, 8.378177881240845e-06, 9.626150131225586e-06, 1.0874122381210327e-05, 1.2122094631195068e-05, 1.337006688117981e-05, 1.461803913116455e-05, 1.5866011381149292e-05, 1.7113983631134033e-05, 1.8361955881118774e-05, 1.9609928131103516e-05, 2.0857900381088257e-05, 2.2105872631072998e-05, 2.335384488105774e-05, 2.460181713104248e-05, 2.584978938102722e-05, 2.7097761631011963e-05, 2.8345733880996704e-05, 2.9593706130981445e-05, 3.0841678380966187e-05, 3.208965063095093e-05, 3.333762288093567e-05, 3.458559513092041e-05, 3.583356738090515e-05, 3.708153963088989e-05, 3.8329511880874634e-05, 3.9577484130859375e-05]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 9.0, 7.0, 18.0, 27.0, 60.0, 127.0, 316.0, 1329.0, 8343.0, 139053.0, 865889.0, 29092.0, 3271.0, 610.0, 203.0, 85.0, 40.0, 29.0, 15.0, 11.0, 3.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1500244140625, -0.14577007293701172, -0.14151573181152344, -0.13726139068603516, -0.13300704956054688, -0.1287527084350586, -0.12449836730957031, -0.12024402618408203, -0.11598968505859375, -0.11173534393310547, -0.10748100280761719, -0.1032266616821289, -0.09897232055664062, -0.09471797943115234, -0.09046363830566406, -0.08620929718017578, -0.0819549560546875, -0.07770061492919922, -0.07344627380371094, -0.06919193267822266, -0.06493759155273438, -0.060683250427246094, -0.05642890930175781, -0.05217456817626953, -0.04792022705078125, -0.04366588592529297, -0.03941154479980469, -0.035157203674316406, -0.030902862548828125, -0.026648521423339844, -0.022394180297851562, -0.01813983917236328, -0.013885498046875, -0.009631156921386719, -0.0053768157958984375, -0.0011224746704101562, 0.003131866455078125, 0.007386207580566406, 0.011640548706054688, 0.01589488983154297, 0.02014923095703125, 0.02440357208251953, 0.028657913208007812, 0.032912254333496094, 0.037166595458984375, 0.041420936584472656, 0.04567527770996094, 0.04992961883544922, 0.0541839599609375, 0.05843830108642578, 0.06269264221191406, 0.06694698333740234, 0.07120132446289062, 0.0754556655883789, 0.07971000671386719, 0.08396434783935547, 0.08821868896484375, 0.09247303009033203, 0.09672737121582031, 0.1009817123413086, 0.10523605346679688, 0.10949039459228516, 0.11374473571777344, 0.11799907684326172, 0.12225341796875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 5.0, 1.0, 3.0, 3.0, 5.0, 5.0, 10.0, 9.0, 9.0, 18.0, 15.0, 10.0, 23.0, 40.0, 24.0, 48.0, 46.0, 55.0, 75.0, 70.0, 73.0, 72.0, 69.0, 44.0, 45.0, 40.0, 29.0, 25.0, 30.0, 16.0, 19.0, 18.0, 13.0, 5.0, 8.0, 3.0, 3.0, 5.0, 3.0, 1.0, 4.0, 0.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.01088714599609375, -0.010561227798461914, -0.010235309600830078, -0.009909391403198242, -0.009583473205566406, -0.00925755500793457, -0.008931636810302734, -0.008605718612670898, -0.008279800415039062, -0.007953882217407227, -0.007627964019775391, -0.007302045822143555, -0.006976127624511719, -0.006650209426879883, -0.006324291229248047, -0.005998373031616211, -0.005672454833984375, -0.005346536636352539, -0.005020618438720703, -0.004694700241088867, -0.004368782043457031, -0.004042863845825195, -0.0037169456481933594, -0.0033910274505615234, -0.0030651092529296875, -0.0027391910552978516, -0.0024132728576660156, -0.0020873546600341797, -0.0017614364624023438, -0.0014355182647705078, -0.0011096000671386719, -0.0007836818695068359, -0.000457763671875, -0.00013184547424316406, 0.00019407272338867188, 0.0005199909210205078, 0.0008459091186523438, 0.0011718273162841797, 0.0014977455139160156, 0.0018236637115478516, 0.0021495819091796875, 0.0024755001068115234, 0.0028014183044433594, 0.0031273365020751953, 0.0034532546997070312, 0.003779172897338867, 0.004105091094970703, 0.004431009292602539, 0.004756927490234375, 0.005082845687866211, 0.005408763885498047, 0.005734682083129883, 0.006060600280761719, 0.006386518478393555, 0.006712436676025391, 0.0070383548736572266, 0.0073642730712890625, 0.0076901912689208984, 0.008016109466552734, 0.00834202766418457, 0.008667945861816406, 0.008993864059448242, 0.009319782257080078, 0.009645700454711914, 0.00997161865234375]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 12.0, 11.0, 14.0, 13.0, 21.0, 24.0, 45.0, 55.0, 72.0, 112.0, 113.0, 129.0, 107.0, 64.0, 41.0, 47.0, 31.0, 21.0, 16.0, 9.0, 8.0, 5.0, 8.0, 2.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3130538761615753, -0.30230289697647095, -0.29155194759368896, -0.2808009684085846, -0.2700500190258026, -0.25929903984069824, -0.24854807555675507, -0.2377971112728119, -0.2270461469888687, -0.21629518270492554, -0.20554421842098236, -0.19479325413703918, -0.18404227495193481, -0.17329132556915283, -0.16254034638404846, -0.15178938210010529, -0.1410384178161621, -0.13028745353221893, -0.11953648924827576, -0.10878551751375198, -0.09803455322980881, -0.08728358894586563, -0.07653261721134186, -0.06578165292739868, -0.055030688643455505, -0.04427972435951233, -0.033528756350278854, -0.02277778834104538, -0.012026824057102203, -0.001275859773159027, 0.009475111961364746, 0.020226076245307922, 0.03097701072692871, 0.04172797501087189, 0.05247894302010536, 0.06322991102933884, 0.07398087531328201, 0.08473183959722519, 0.09548281133174896, 0.10623377561569214, 0.11698473989963531, 0.1277357041835785, 0.13848666846752167, 0.14923763275146484, 0.1599886119365692, 0.1707395613193512, 0.18149054050445557, 0.19224150478839874, 0.20299246907234192, 0.2137434333562851, 0.22449439764022827, 0.23524537682533264, 0.24599632620811462, 0.256747305393219, 0.267498254776001, 0.27824923396110535, 0.2890002131462097, 0.2997511923313141, 0.31050214171409607, 0.32125312089920044, 0.3320040702819824, 0.3427550494670868, 0.35350602865219116, 0.36425697803497314, 0.3750079274177551]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 9.0, 11.0, 10.0, 21.0, 10.0, 20.0, 20.0, 35.0, 21.0, 39.0, 52.0, 51.0, 61.0, 52.0, 47.0, 70.0, 65.0, 67.0, 47.0, 48.0, 46.0, 43.0, 31.0, 29.0, 23.0, 24.0, 9.0, 13.0, 8.0, 8.0, 4.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23378704488277435, -0.2255488783121109, -0.21731069684028625, -0.2090725302696228, -0.20083436369895935, -0.1925961971282959, -0.18435801565647125, -0.1761198490858078, -0.16788166761398315, -0.1596435010433197, -0.15140531957149506, -0.1431671530008316, -0.13492898643016815, -0.1266908049583435, -0.11845263838768005, -0.1102144718170166, -0.10197630524635315, -0.0937381312251091, -0.08549996465444565, -0.0772617906332016, -0.06902362406253815, -0.0607854500412941, -0.05254727602005005, -0.0443091057240963, -0.03607093542814255, -0.027832765132188797, -0.019594592973589897, -0.011356420814990997, -0.0031182505190372467, 0.005119919776916504, 0.013358093798160553, 0.021596264094114304, 0.029834449291229248, 0.038072619587183, 0.04631078988313675, 0.0545489639043808, 0.06278713047504425, 0.0710253044962883, 0.07926347851753235, 0.0875016450881958, 0.09573981910943985, 0.1039779931306839, 0.11221615970134735, 0.1204543337225914, 0.12869250774383545, 0.1369306743144989, 0.14516884088516235, 0.153407022356987, 0.16164518892765045, 0.1698833554983139, 0.17812153697013855, 0.186359703540802, 0.19459787011146545, 0.2028360366821289, 0.21107421815395355, 0.219312384724617, 0.22755056619644165, 0.2357887327671051, 0.24402691423892975, 0.2522650957107544, 0.26050326228141785, 0.2687414288520813, 0.27697959542274475, 0.2852177619934082, 0.29345592856407166]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 2.0, 9.0, 6.0, 13.0, 22.0, 36.0, 37.0, 58.0, 94.0, 140.0, 195.0, 277.0, 422.0, 728.0, 1172.0, 1996.0, 3694.0, 7413.0, 16022.0, 39532.0, 115221.0, 402043.0, 311053.0, 88605.0, 32041.0, 13562.0, 6249.0, 3267.0, 1805.0, 1009.0, 592.0, 428.0, 257.0, 167.0, 103.0, 73.0, 63.0, 43.0, 40.0, 23.0, 9.0, 11.0, 6.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10504150390625, -0.10164070129394531, -0.09823989868164062, -0.09483909606933594, -0.09143829345703125, -0.08803749084472656, -0.08463668823242188, -0.08123588562011719, -0.0778350830078125, -0.07443428039550781, -0.07103347778320312, -0.06763267517089844, -0.06423187255859375, -0.06083106994628906, -0.057430267333984375, -0.05402946472167969, -0.050628662109375, -0.04722785949707031, -0.043827056884765625, -0.04042625427246094, -0.03702545166015625, -0.03362464904785156, -0.030223846435546875, -0.026823043823242188, -0.0234222412109375, -0.020021438598632812, -0.016620635986328125, -0.013219833374023438, -0.00981903076171875, -0.0064182281494140625, -0.003017425537109375, 0.0003833770751953125, 0.0037841796875, 0.0071849822998046875, 0.010585784912109375, 0.013986587524414062, 0.01738739013671875, 0.020788192749023438, 0.024188995361328125, 0.027589797973632812, 0.0309906005859375, 0.03439140319824219, 0.037792205810546875, 0.04119300842285156, 0.04459381103515625, 0.04799461364746094, 0.051395416259765625, 0.05479621887207031, 0.058197021484375, 0.06159782409667969, 0.06499862670898438, 0.06839942932128906, 0.07180023193359375, 0.07520103454589844, 0.07860183715820312, 0.08200263977050781, 0.0854034423828125, 0.08880424499511719, 0.09220504760742188, 0.09560585021972656, 0.09900665283203125, 0.10240745544433594, 0.10580825805664062, 0.10920906066894531, 0.11260986328125]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 6.0, 2.0, 6.0, 7.0, 5.0, 11.0, 17.0, 18.0, 27.0, 14.0, 29.0, 31.0, 36.0, 37.0, 47.0, 47.0, 49.0, 36.0, 50.0, 63.0, 63.0, 61.0, 53.0, 52.0, 27.0, 37.0, 27.0, 27.0, 21.0, 16.0, 14.0, 14.0, 13.0, 7.0, 8.0, 10.0, 2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.62158203125, -0.603240966796875, -0.58489990234375, -0.566558837890625, -0.5482177734375, -0.529876708984375, -0.51153564453125, -0.493194580078125, -0.474853515625, -0.456512451171875, -0.43817138671875, -0.419830322265625, -0.4014892578125, -0.383148193359375, -0.36480712890625, -0.346466064453125, -0.328125, -0.309783935546875, -0.29144287109375, -0.273101806640625, -0.2547607421875, -0.236419677734375, -0.21807861328125, -0.199737548828125, -0.181396484375, -0.163055419921875, -0.14471435546875, -0.126373291015625, -0.1080322265625, -0.089691162109375, -0.07135009765625, -0.053009033203125, -0.03466796875, -0.016326904296875, 0.00201416015625, 0.020355224609375, 0.0386962890625, 0.057037353515625, 0.07537841796875, 0.093719482421875, 0.112060546875, 0.130401611328125, 0.14874267578125, 0.167083740234375, 0.1854248046875, 0.203765869140625, 0.22210693359375, 0.240447998046875, 0.2587890625, 0.277130126953125, 0.29547119140625, 0.313812255859375, 0.3321533203125, 0.350494384765625, 0.36883544921875, 0.387176513671875, 0.405517578125, 0.423858642578125, 0.44219970703125, 0.460540771484375, 0.4788818359375, 0.497222900390625, 0.51556396484375, 0.533905029296875, 0.55224609375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 2.0, 9.0, 10.0, 10.0, 6.0, 20.0, 21.0, 25.0, 31.0, 23.0, 29.0, 37.0, 26.0, 37.0, 43.0, 48.0, 67.0, 374.0, 1043886.0, 3353.0, 78.0, 45.0, 35.0, 42.0, 45.0, 35.0, 29.0, 30.0, 23.0, 16.0, 20.0, 19.0, 15.0, 7.0, 9.0, 7.0, 9.0, 8.0, 5.0, 7.0, 3.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0], "bins": [-2.23828125, -2.171844482421875, -2.10540771484375, -2.038970947265625, -1.9725341796875, -1.906097412109375, -1.83966064453125, -1.773223876953125, -1.706787109375, -1.640350341796875, -1.57391357421875, -1.507476806640625, -1.4410400390625, -1.374603271484375, -1.30816650390625, -1.241729736328125, -1.17529296875, -1.108856201171875, -1.04241943359375, -0.975982666015625, -0.9095458984375, -0.843109130859375, -0.77667236328125, -0.710235595703125, -0.643798828125, -0.577362060546875, -0.51092529296875, -0.444488525390625, -0.3780517578125, -0.311614990234375, -0.24517822265625, -0.178741455078125, -0.1123046875, -0.045867919921875, 0.02056884765625, 0.087005615234375, 0.1534423828125, 0.219879150390625, 0.28631591796875, 0.352752685546875, 0.419189453125, 0.485626220703125, 0.55206298828125, 0.618499755859375, 0.6849365234375, 0.751373291015625, 0.81781005859375, 0.884246826171875, 0.95068359375, 1.017120361328125, 1.08355712890625, 1.149993896484375, 1.2164306640625, 1.282867431640625, 1.34930419921875, 1.415740966796875, 1.482177734375, 1.548614501953125, 1.61505126953125, 1.681488037109375, 1.7479248046875, 1.814361572265625, 1.88079833984375, 1.947235107421875, 2.013671875]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 3.0, 10.0, 11.0, 9.0, 10.0, 21.0, 23.0, 30.0, 28.0, 28.0, 42.0, 28.0, 34.0, 37.0, 51.0, 43.0, 41.0, 56.0, 50.0, 32.0, 42.0, 30.0, 38.0, 42.0, 36.0, 44.0, 22.0, 21.0, 17.0, 14.0, 21.0, 10.0, 11.0, 13.0, 11.0, 4.0, 4.0, 7.0, 8.0, 4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0], "bins": [-0.54345703125, -0.5277862548828125, -0.512115478515625, -0.4964447021484375, -0.48077392578125, -0.4651031494140625, -0.449432373046875, -0.4337615966796875, -0.4180908203125, -0.4024200439453125, -0.386749267578125, -0.3710784912109375, -0.35540771484375, -0.3397369384765625, -0.324066162109375, -0.3083953857421875, -0.292724609375, -0.2770538330078125, -0.261383056640625, -0.2457122802734375, -0.23004150390625, -0.2143707275390625, -0.198699951171875, -0.1830291748046875, -0.1673583984375, -0.1516876220703125, -0.136016845703125, -0.1203460693359375, -0.10467529296875, -0.0890045166015625, -0.073333740234375, -0.0576629638671875, -0.0419921875, -0.0263214111328125, -0.010650634765625, 0.0050201416015625, 0.02069091796875, 0.0363616943359375, 0.052032470703125, 0.0677032470703125, 0.0833740234375, 0.0990447998046875, 0.114715576171875, 0.1303863525390625, 0.14605712890625, 0.1617279052734375, 0.177398681640625, 0.1930694580078125, 0.208740234375, 0.2244110107421875, 0.240081787109375, 0.2557525634765625, 0.27142333984375, 0.2870941162109375, 0.302764892578125, 0.3184356689453125, 0.3341064453125, 0.3497772216796875, 0.365447998046875, 0.3811187744140625, 0.39678955078125, 0.4124603271484375, 0.428131103515625, 0.4438018798828125, 0.45947265625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 7.0, 4.0, 3.0, 8.0, 5.0, 17.0, 16.0, 37.0, 52.0, 149.0, 320.0, 1250.0, 11520.0, 952338.0, 78973.0, 2863.0, 557.0, 179.0, 102.0, 46.0, 37.0, 20.0, 13.0, 8.0, 6.0, 5.0, 6.0, 5.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1253662109375, -0.11932182312011719, -0.11327743530273438, -0.10723304748535156, -0.10118865966796875, -0.09514427185058594, -0.08909988403320312, -0.08305549621582031, -0.0770111083984375, -0.07096672058105469, -0.06492233276367188, -0.05887794494628906, -0.05283355712890625, -0.04678916931152344, -0.040744781494140625, -0.03470039367675781, -0.028656005859375, -0.022611618041992188, -0.016567230224609375, -0.010522842407226562, -0.00447845458984375, 0.0015659332275390625, 0.007610321044921875, 0.013654708862304688, 0.0196990966796875, 0.025743484497070312, 0.031787872314453125, 0.03783226013183594, 0.04387664794921875, 0.04992103576660156, 0.055965423583984375, 0.06200981140136719, 0.06805419921875, 0.07409858703613281, 0.08014297485351562, 0.08618736267089844, 0.09223175048828125, 0.09827613830566406, 0.10432052612304688, 0.11036491394042969, 0.1164093017578125, 0.12245368957519531, 0.12849807739257812, 0.13454246520996094, 0.14058685302734375, 0.14663124084472656, 0.15267562866210938, 0.1587200164794922, 0.164764404296875, 0.1708087921142578, 0.17685317993164062, 0.18289756774902344, 0.18894195556640625, 0.19498634338378906, 0.20103073120117188, 0.2070751190185547, 0.2131195068359375, 0.2191638946533203, 0.22520828247070312, 0.23125267028808594, 0.23729705810546875, 0.24334144592285156, 0.24938583374023438, 0.2554302215576172, 0.261474609375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 9.0, 5.0, 3.0, 3.0, 7.0, 10.0, 7.0, 11.0, 26.0, 31.0, 30.0, 49.0, 66.0, 111.0, 129.0, 137.0, 104.0, 81.0, 48.0, 35.0, 30.0, 18.0, 10.0, 7.0, 8.0, 3.0, 7.0, 4.0, 1.0, 3.0, 4.0, 5.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.0311603546142578e-05, -1.0007061064243317e-05, -9.702518582344055e-06, -9.397976100444794e-06, -9.093433618545532e-06, -8.78889113664627e-06, -8.48434865474701e-06, -8.179806172847748e-06, -7.875263690948486e-06, -7.570721209049225e-06, -7.266178727149963e-06, -6.961636245250702e-06, -6.6570937633514404e-06, -6.352551281452179e-06, -6.0480087995529175e-06, -5.743466317653656e-06, -5.4389238357543945e-06, -5.134381353855133e-06, -4.829838871955872e-06, -4.52529639005661e-06, -4.220753908157349e-06, -3.916211426258087e-06, -3.6116689443588257e-06, -3.307126462459564e-06, -3.0025839805603027e-06, -2.6980414986610413e-06, -2.3934990167617798e-06, -2.0889565348625183e-06, -1.7844140529632568e-06, -1.4798715710639954e-06, -1.1753290891647339e-06, -8.707866072654724e-07, -5.662441253662109e-07, -2.6170164346694946e-07, 4.284083843231201e-08, 3.473833203315735e-07, 6.51925802230835e-07, 9.564682841300964e-07, 1.261010766029358e-06, 1.5655532479286194e-06, 1.8700957298278809e-06, 2.1746382117271423e-06, 2.479180693626404e-06, 2.7837231755256653e-06, 3.0882656574249268e-06, 3.3928081393241882e-06, 3.6973506212234497e-06, 4.001893103122711e-06, 4.306435585021973e-06, 4.610978066921234e-06, 4.915520548820496e-06, 5.220063030719757e-06, 5.5246055126190186e-06, 5.82914799451828e-06, 6.1336904764175415e-06, 6.438232958316803e-06, 6.7427754402160645e-06, 7.047317922115326e-06, 7.351860404014587e-06, 7.656402885913849e-06, 7.96094536781311e-06, 8.265487849712372e-06, 8.570030331611633e-06, 8.874572813510895e-06, 9.179115295410156e-06]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 7.0, 7.0, 6.0, 18.0, 10.0, 24.0, 45.0, 67.0, 107.0, 203.0, 442.0, 921.0, 2390.0, 7765.0, 40146.0, 751812.0, 215915.0, 20373.0, 4933.0, 1802.0, 714.0, 370.0, 207.0, 107.0, 58.0, 36.0, 23.0, 12.0, 10.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.1103515625, -0.10735416412353516, -0.10435676574707031, -0.10135936737060547, -0.09836196899414062, -0.09536457061767578, -0.09236717224121094, -0.0893697738647461, -0.08637237548828125, -0.0833749771118164, -0.08037757873535156, -0.07738018035888672, -0.07438278198242188, -0.07138538360595703, -0.06838798522949219, -0.06539058685302734, -0.0623931884765625, -0.059395790100097656, -0.05639839172363281, -0.05340099334716797, -0.050403594970703125, -0.04740619659423828, -0.04440879821777344, -0.041411399841308594, -0.03841400146484375, -0.035416603088378906, -0.03241920471191406, -0.02942180633544922, -0.026424407958984375, -0.02342700958251953, -0.020429611206054688, -0.017432212829589844, -0.014434814453125, -0.011437416076660156, -0.008440017700195312, -0.005442619323730469, -0.002445220947265625, 0.0005521774291992188, 0.0035495758056640625, 0.006546974182128906, 0.00954437255859375, 0.012541770935058594, 0.015539169311523438, 0.01853656768798828, 0.021533966064453125, 0.02453136444091797, 0.027528762817382812, 0.030526161193847656, 0.0335235595703125, 0.036520957946777344, 0.03951835632324219, 0.04251575469970703, 0.045513153076171875, 0.04851055145263672, 0.05150794982910156, 0.054505348205566406, 0.05750274658203125, 0.060500144958496094, 0.06349754333496094, 0.06649494171142578, 0.06949234008789062, 0.07248973846435547, 0.07548713684082031, 0.07848453521728516, 0.08148193359375]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 7.0, 4.0, 7.0, 5.0, 4.0, 13.0, 19.0, 24.0, 18.0, 32.0, 64.0, 99.0, 104.0, 209.0, 114.0, 92.0, 58.0, 34.0, 27.0, 23.0, 14.0, 5.0, 10.0, 6.0, 5.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.021820068359375, -0.020803451538085938, -0.019786834716796875, -0.018770217895507812, -0.01775360107421875, -0.016736984252929688, -0.015720367431640625, -0.014703750610351562, -0.0136871337890625, -0.012670516967773438, -0.011653900146484375, -0.010637283325195312, -0.00962066650390625, -0.008604049682617188, -0.007587432861328125, -0.0065708160400390625, -0.00555419921875, -0.0045375823974609375, -0.003520965576171875, -0.0025043487548828125, -0.00148773193359375, -0.0004711151123046875, 0.000545501708984375, 0.0015621185302734375, 0.0025787353515625, 0.0035953521728515625, 0.004611968994140625, 0.0056285858154296875, 0.00664520263671875, 0.0076618194580078125, 0.008678436279296875, 0.009695053100585938, 0.010711669921875, 0.011728286743164062, 0.012744903564453125, 0.013761520385742188, 0.01477813720703125, 0.015794754028320312, 0.016811370849609375, 0.017827987670898438, 0.0188446044921875, 0.019861221313476562, 0.020877838134765625, 0.021894454956054688, 0.02291107177734375, 0.023927688598632812, 0.024944305419921875, 0.025960922241210938, 0.0269775390625, 0.027994155883789062, 0.029010772705078125, 0.030027389526367188, 0.03104400634765625, 0.03206062316894531, 0.033077239990234375, 0.03409385681152344, 0.0351104736328125, 0.03612709045410156, 0.037143707275390625, 0.03816032409667969, 0.03917694091796875, 0.04019355773925781, 0.041210174560546875, 0.04222679138183594, 0.043243408203125]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 9.0, 30.0, 63.0, 198.0, 349.0, 213.0, 82.0, 30.0, 18.0, 4.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.687655448913574, -2.624556064605713, -2.5614569187164307, -2.4983575344085693, -2.435258150100708, -2.372159004211426, -2.3090596199035645, -2.245960235595703, -2.182861089706421, -2.1197617053985596, -2.0566625595092773, -1.993563175201416, -1.9304639101028442, -1.8673646450042725, -1.8042652606964111, -1.7411659955978394, -1.678066611289978, -1.6149673461914062, -1.551867961883545, -1.4887686967849731, -1.4256694316864014, -1.36257004737854, -1.2994707822799683, -1.2363715171813965, -1.1732721328735352, -1.1101728677749634, -1.047073483467102, -0.9839742183685303, -0.9208749532699585, -0.8577756285667419, -0.7946763038635254, -0.7315770387649536, -0.6684778928756714, -0.6053785681724548, -0.5422793030738831, -0.4791799783706665, -0.41608068346977234, -0.3529813885688782, -0.2898820638656616, -0.22678276896476746, -0.1636834740638733, -0.10058417171239853, -0.03748486936092377, 0.025614440441131592, 0.08871373534202576, 0.15181303024291992, 0.21491235494613647, 0.27801164984703064, 0.3411109447479248, 0.40421023964881897, 0.46730953454971313, 0.5304088592529297, 0.5935081243515015, 0.656607449054718, 0.7197067737579346, 0.7828060388565063, 0.8459053635597229, 0.9090046882629395, 0.9721039533615112, 1.035203218460083, 1.0983026027679443, 1.1614018678665161, 1.224501132965088, 1.2876005172729492, 1.350699782371521]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 6.0, 4.0, 5.0, 11.0, 11.0, 12.0, 9.0, 20.0, 23.0, 27.0, 24.0, 26.0, 40.0, 38.0, 37.0, 37.0, 35.0, 53.0, 42.0, 48.0, 43.0, 48.0, 43.0, 48.0, 37.0, 32.0, 37.0, 26.0, 35.0, 20.0, 32.0, 24.0, 15.0, 16.0, 15.0, 8.0, 3.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8283340334892273, -0.8035085797309875, -0.7786831855773926, -0.7538577318191528, -0.7290323376655579, -0.7042068839073181, -0.6793814897537231, -0.6545560359954834, -0.6297305822372437, -0.6049051284790039, -0.5800797343254089, -0.5552542805671692, -0.5304288864135742, -0.5056034326553345, -0.4807780086994171, -0.45595258474349976, -0.4311271905899048, -0.4063017666339874, -0.38147634267807007, -0.3566508889198303, -0.33182549476623535, -0.3070000410079956, -0.28217461705207825, -0.2573491930961609, -0.23252376914024353, -0.20769834518432617, -0.1828729212284088, -0.15804748237133026, -0.1332220584154129, -0.10839663445949554, -0.08357119560241699, -0.058745771646499634, -0.033920347690582275, -0.009094920009374619, 0.01573050767183304, 0.040555939078330994, 0.06538136303424835, 0.09020678699016571, 0.11503222584724426, 0.13985764980316162, 0.16468307375907898, 0.18950849771499634, 0.2143339216709137, 0.23915936052799225, 0.2639847993850708, 0.28881019353866577, 0.3136356472969055, 0.3384610712528229, 0.36328649520874023, 0.3881119191646576, 0.41293734312057495, 0.4377627968788147, 0.46258819103240967, 0.4874136447906494, 0.5122390985488892, 0.5370644927024841, 0.5618898868560791, 0.5867153406143188, 0.6115407347679138, 0.6363661885261536, 0.6611915826797485, 0.6860170364379883, 0.710842490196228, 0.735667884349823, 0.7604933381080627]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 5.0, 5.0, 4.0, 9.0, 10.0, 15.0, 20.0, 21.0, 38.0, 38.0, 65.0, 106.0, 173.0, 271.0, 447.0, 826.0, 1448.0, 3037.0, 6493.0, 19750.0, 170285.0, 3270290.0, 668688.0, 34601.0, 9210.0, 3880.0, 1998.0, 1010.0, 605.0, 323.0, 226.0, 140.0, 82.0, 64.0, 35.0, 25.0, 14.0, 9.0, 6.0, 8.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7021484375, -0.67999267578125, -0.6578369140625, -0.63568115234375, -0.613525390625, -0.59136962890625, -0.5692138671875, -0.54705810546875, -0.52490234375, -0.50274658203125, -0.4805908203125, -0.45843505859375, -0.436279296875, -0.41412353515625, -0.3919677734375, -0.36981201171875, -0.34765625, -0.32550048828125, -0.3033447265625, -0.28118896484375, -0.259033203125, -0.23687744140625, -0.2147216796875, -0.19256591796875, -0.17041015625, -0.14825439453125, -0.1260986328125, -0.10394287109375, -0.081787109375, -0.05963134765625, -0.0374755859375, -0.01531982421875, 0.0068359375, 0.02899169921875, 0.0511474609375, 0.07330322265625, 0.095458984375, 0.11761474609375, 0.1397705078125, 0.16192626953125, 0.18408203125, 0.20623779296875, 0.2283935546875, 0.25054931640625, 0.272705078125, 0.29486083984375, 0.3170166015625, 0.33917236328125, 0.361328125, 0.38348388671875, 0.4056396484375, 0.42779541015625, 0.449951171875, 0.47210693359375, 0.4942626953125, 0.51641845703125, 0.53857421875, 0.56072998046875, 0.5828857421875, 0.60504150390625, 0.627197265625, 0.64935302734375, 0.6715087890625, 0.69366455078125, 0.7158203125]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 5.0, 5.0, 11.0, 6.0, 8.0, 13.0, 12.0, 14.0, 19.0, 17.0, 26.0, 31.0, 43.0, 42.0, 62.0, 56.0, 57.0, 65.0, 47.0, 67.0, 52.0, 51.0, 39.0, 33.0, 44.0, 42.0, 25.0, 27.0, 27.0, 14.0, 12.0, 7.0, 7.0, 6.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.302978515625, -0.2938880920410156, -0.28479766845703125, -0.2757072448730469, -0.2666168212890625, -0.2575263977050781, -0.24843597412109375, -0.23934555053710938, -0.230255126953125, -0.22116470336914062, -0.21207427978515625, -0.20298385620117188, -0.1938934326171875, -0.18480300903320312, -0.17571258544921875, -0.16662216186523438, -0.15753173828125, -0.14844131469726562, -0.13935089111328125, -0.13026046752929688, -0.1211700439453125, -0.11207962036132812, -0.10298919677734375, -0.09389877319335938, -0.084808349609375, -0.07571792602539062, -0.06662750244140625, -0.057537078857421875, -0.0484466552734375, -0.039356231689453125, -0.03026580810546875, -0.021175384521484375, -0.0120849609375, -0.002994537353515625, 0.00609588623046875, 0.015186309814453125, 0.0242767333984375, 0.033367156982421875, 0.04245758056640625, 0.051548004150390625, 0.060638427734375, 0.06972885131835938, 0.07881927490234375, 0.08790969848632812, 0.0970001220703125, 0.10609054565429688, 0.11518096923828125, 0.12427139282226562, 0.13336181640625, 0.14245223999023438, 0.15154266357421875, 0.16063308715820312, 0.1697235107421875, 0.17881393432617188, 0.18790435791015625, 0.19699478149414062, 0.206085205078125, 0.21517562866210938, 0.22426605224609375, 0.23335647583007812, 0.2424468994140625, 0.2515373229980469, 0.26062774658203125, 0.2697181701660156, 0.27880859375]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 4.0, 11.0, 9.0, 8.0, 6.0, 11.0, 19.0, 25.0, 29.0, 56.0, 101.0, 187.0, 657.0, 3553.0, 69914.0, 4088250.0, 28278.0, 2256.0, 488.0, 167.0, 75.0, 49.0, 39.0, 29.0, 11.0, 5.0, 9.0, 10.0, 5.0, 2.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4072265625, -1.3576507568359375, -1.308074951171875, -1.2584991455078125, -1.20892333984375, -1.1593475341796875, -1.109771728515625, -1.0601959228515625, -1.0106201171875, -0.9610443115234375, -0.911468505859375, -0.8618927001953125, -0.81231689453125, -0.7627410888671875, -0.713165283203125, -0.6635894775390625, -0.614013671875, -0.5644378662109375, -0.514862060546875, -0.4652862548828125, -0.41571044921875, -0.3661346435546875, -0.316558837890625, -0.2669830322265625, -0.2174072265625, -0.1678314208984375, -0.118255615234375, -0.0686798095703125, -0.01910400390625, 0.0304718017578125, 0.080047607421875, 0.1296234130859375, 0.17919921875, 0.2287750244140625, 0.278350830078125, 0.3279266357421875, 0.37750244140625, 0.4270782470703125, 0.476654052734375, 0.5262298583984375, 0.5758056640625, 0.6253814697265625, 0.674957275390625, 0.7245330810546875, 0.77410888671875, 0.8236846923828125, 0.873260498046875, 0.9228363037109375, 0.972412109375, 1.0219879150390625, 1.071563720703125, 1.1211395263671875, 1.17071533203125, 1.2202911376953125, 1.269866943359375, 1.3194427490234375, 1.3690185546875, 1.4185943603515625, 1.468170166015625, 1.5177459716796875, 1.56732177734375, 1.6168975830078125, 1.666473388671875, 1.7160491943359375, 1.765625]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 3.0, 6.0, 9.0, 7.0, 8.0, 14.0, 22.0, 31.0, 52.0, 49.0, 89.0, 165.0, 328.0, 624.0, 1000.0, 753.0, 386.0, 207.0, 92.0, 54.0, 49.0, 24.0, 16.0, 15.0, 12.0, 8.0, 5.0, 8.0, 10.0, 8.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.1834716796875, -0.17847251892089844, -0.17347335815429688, -0.1684741973876953, -0.16347503662109375, -0.1584758758544922, -0.15347671508789062, -0.14847755432128906, -0.1434783935546875, -0.13847923278808594, -0.13348007202148438, -0.1284809112548828, -0.12348175048828125, -0.11848258972167969, -0.11348342895507812, -0.10848426818847656, -0.103485107421875, -0.09848594665527344, -0.09348678588867188, -0.08848762512207031, -0.08348846435546875, -0.07848930358886719, -0.07349014282226562, -0.06849098205566406, -0.0634918212890625, -0.05849266052246094, -0.053493499755859375, -0.04849433898925781, -0.04349517822265625, -0.03849601745605469, -0.033496856689453125, -0.028497695922851562, -0.02349853515625, -0.018499374389648438, -0.013500213623046875, -0.008501052856445312, -0.00350189208984375, 0.0014972686767578125, 0.006496429443359375, 0.011495590209960938, 0.0164947509765625, 0.021493911743164062, 0.026493072509765625, 0.03149223327636719, 0.03649139404296875, 0.04149055480957031, 0.046489715576171875, 0.05148887634277344, 0.056488037109375, 0.06148719787597656, 0.06648635864257812, 0.07148551940917969, 0.07648468017578125, 0.08148384094238281, 0.08648300170898438, 0.09148216247558594, 0.0964813232421875, 0.10148048400878906, 0.10647964477539062, 0.11147880554199219, 0.11647796630859375, 0.12147712707519531, 0.12647628784179688, 0.13147544860839844, 0.136474609375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 5.0, 8.0, 7.0, 6.0, 17.0, 15.0, 32.0, 51.0, 67.0, 78.0, 109.0, 156.0, 116.0, 102.0, 67.0, 58.0, 42.0, 22.0, 21.0, 9.0, 6.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37770017981529236, -0.3595159947872162, -0.3413317799568176, -0.32314759492874146, -0.3049634099006653, -0.2867791950702667, -0.26859501004219055, -0.250410795211792, -0.23222661018371582, -0.21404241025447845, -0.1958582103252411, -0.17767402529716492, -0.15948982536792755, -0.14130562543869019, -0.12312143296003342, -0.10493724048137665, -0.08675304055213928, -0.06856884062290192, -0.05038464814424515, -0.03220045194029808, -0.014016255736351013, 0.0041679441928863525, 0.02235213667154312, 0.04053632915019989, 0.058720529079437256, 0.07690472900867462, 0.09508892148733139, 0.11327311396598816, 0.13145731389522552, 0.1496415138244629, 0.16782569885253906, 0.18600989878177643, 0.20419412851333618, 0.22237832844257355, 0.2405625283718109, 0.2587467133998871, 0.27693092823028564, 0.2951151132583618, 0.313299298286438, 0.33148348331451416, 0.3496676981449127, 0.3678518831729889, 0.38603609800338745, 0.4042202830314636, 0.4224044680595398, 0.44058868288993835, 0.4587728679180145, 0.4769570827484131, 0.49514126777648926, 0.5133254528045654, 0.5315096378326416, 0.5496938824653625, 0.5678780674934387, 0.5860622525215149, 0.6042464375495911, 0.6224306225776672, 0.6406148672103882, 0.6587990522384644, 0.6769832372665405, 0.6951674818992615, 0.7133516669273376, 0.7315358519554138, 0.74972003698349, 0.7679042220115662, 0.7860884070396423]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 8.0, 4.0, 4.0, 11.0, 13.0, 11.0, 9.0, 20.0, 21.0, 22.0, 38.0, 37.0, 43.0, 35.0, 32.0, 37.0, 50.0, 46.0, 44.0, 37.0, 44.0, 39.0, 34.0, 45.0, 42.0, 53.0, 30.0, 32.0, 27.0, 28.0, 20.0, 20.0, 9.0, 12.0, 14.0, 11.0, 7.0, 2.0, 3.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2518153488636017, -0.24294771254062653, -0.23408006131649017, -0.22521242499351501, -0.21634477376937866, -0.2074771374464035, -0.19860950112342834, -0.189741849899292, -0.18087421357631683, -0.17200657725334167, -0.16313892602920532, -0.15427128970623016, -0.145403653383255, -0.13653600215911865, -0.1276683658361435, -0.11880072206258774, -0.10993307828903198, -0.10106543451547623, -0.09219779074192047, -0.08333015441894531, -0.07446251064538956, -0.0655948668718338, -0.056727226823568344, -0.04785958677530289, -0.03899194300174713, -0.030124301090836525, -0.02125665917992592, -0.012389017269015312, -0.003521375358104706, 0.00534626841545105, 0.014213908463716507, 0.023081548511981964, 0.03194919228553772, 0.040816836059093475, 0.04968447610735893, 0.05855211615562439, 0.06741975992918015, 0.0762874037027359, 0.08515504002571106, 0.09402268379926682, 0.10289032757282257, 0.11175797134637833, 0.12062561511993408, 0.12949325144290924, 0.1383608877658844, 0.14722853899002075, 0.1560961753129959, 0.16496381163597107, 0.17383146286010742, 0.18269909918308258, 0.19156675040721893, 0.2004343867301941, 0.20930203795433044, 0.2181696742773056, 0.22703731060028076, 0.23590496182441711, 0.24477259814739227, 0.25364023447036743, 0.2625078856945038, 0.27137553691864014, 0.2802431583404541, 0.28911080956459045, 0.2979784607887268, 0.30684608221054077, 0.3157137334346771]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 11.0, 6.0, 17.0, 15.0, 37.0, 59.0, 109.0, 189.0, 389.0, 869.0, 2096.0, 6622.0, 27468.0, 383015.0, 583091.0, 32642.0, 7634.0, 2438.0, 976.0, 390.0, 180.0, 113.0, 71.0, 43.0, 27.0, 12.0, 12.0, 8.0, 11.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2381591796875, -0.22684669494628906, -0.21553421020507812, -0.2042217254638672, -0.19290924072265625, -0.1815967559814453, -0.17028427124023438, -0.15897178649902344, -0.1476593017578125, -0.13634681701660156, -0.12503433227539062, -0.11372184753417969, -0.10240936279296875, -0.09109687805175781, -0.07978439331054688, -0.06847190856933594, -0.057159423828125, -0.04584693908691406, -0.034534454345703125, -0.023221969604492188, -0.01190948486328125, -0.0005970001220703125, 0.010715484619140625, 0.022027969360351562, 0.0333404541015625, 0.04465293884277344, 0.055965423583984375, 0.06727790832519531, 0.07859039306640625, 0.08990287780761719, 0.10121536254882812, 0.11252784729003906, 0.12384033203125, 0.13515281677246094, 0.14646530151367188, 0.1577777862548828, 0.16909027099609375, 0.1804027557373047, 0.19171524047851562, 0.20302772521972656, 0.2143402099609375, 0.22565269470214844, 0.23696517944335938, 0.2482776641845703, 0.25959014892578125, 0.2709026336669922, 0.2822151184082031, 0.29352760314941406, 0.304840087890625, 0.31615257263183594, 0.3274650573730469, 0.3387775421142578, 0.35009002685546875, 0.3614025115966797, 0.3727149963378906, 0.38402748107910156, 0.3953399658203125, 0.40665245056152344, 0.4179649353027344, 0.4292774200439453, 0.44058990478515625, 0.4519023895263672, 0.4632148742675781, 0.47452735900878906, 0.48583984375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 2.0, 7.0, 5.0, 16.0, 14.0, 13.0, 39.0, 47.0, 61.0, 54.0, 71.0, 75.0, 78.0, 82.0, 69.0, 79.0, 78.0, 54.0, 39.0, 36.0, 32.0, 18.0, 16.0, 8.0, 6.0, 6.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1494140625, -0.14076614379882812, -0.13211822509765625, -0.12347030639648438, -0.1148223876953125, -0.10617446899414062, -0.09752655029296875, -0.08887863159179688, -0.080230712890625, -0.07158279418945312, -0.06293487548828125, -0.054286956787109375, -0.0456390380859375, -0.036991119384765625, -0.02834320068359375, -0.019695281982421875, -0.01104736328125, -0.002399444580078125, 0.00624847412109375, 0.014896392822265625, 0.0235443115234375, 0.032192230224609375, 0.04084014892578125, 0.049488067626953125, 0.058135986328125, 0.06678390502929688, 0.07543182373046875, 0.08407974243164062, 0.0927276611328125, 0.10137557983398438, 0.11002349853515625, 0.11867141723632812, 0.1273193359375, 0.13596725463867188, 0.14461517333984375, 0.15326309204101562, 0.1619110107421875, 0.17055892944335938, 0.17920684814453125, 0.18785476684570312, 0.196502685546875, 0.20515060424804688, 0.21379852294921875, 0.22244644165039062, 0.2310943603515625, 0.23974227905273438, 0.24839019775390625, 0.2570381164550781, 0.26568603515625, 0.2743339538574219, 0.28298187255859375, 0.2916297912597656, 0.3002777099609375, 0.3089256286621094, 0.31757354736328125, 0.3262214660644531, 0.334869384765625, 0.3435173034667969, 0.35216522216796875, 0.3608131408691406, 0.3694610595703125, 0.3781089782714844, 0.38675689697265625, 0.3954048156738281, 0.404052734375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 3.0, 7.0, 4.0, 4.0, 7.0, 15.0, 15.0, 17.0, 25.0, 53.0, 90.0, 140.0, 305.0, 643.0, 1651.0, 4650.0, 15976.0, 79999.0, 630864.0, 263139.0, 36709.0, 9221.0, 2919.0, 1129.0, 395.0, 230.0, 122.0, 61.0, 51.0, 30.0, 11.0, 11.0, 9.0, 8.0, 6.0, 6.0, 8.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1776123046875, -0.17235374450683594, -0.16709518432617188, -0.1618366241455078, -0.15657806396484375, -0.1513195037841797, -0.14606094360351562, -0.14080238342285156, -0.1355438232421875, -0.13028526306152344, -0.12502670288085938, -0.11976814270019531, -0.11450958251953125, -0.10925102233886719, -0.10399246215820312, -0.09873390197753906, -0.093475341796875, -0.08821678161621094, -0.08295822143554688, -0.07769966125488281, -0.07244110107421875, -0.06718254089355469, -0.061923980712890625, -0.05666542053222656, -0.0514068603515625, -0.04614830017089844, -0.040889739990234375, -0.03563117980957031, -0.03037261962890625, -0.025114059448242188, -0.019855499267578125, -0.014596939086914062, -0.00933837890625, -0.0040798187255859375, 0.001178741455078125, 0.0064373016357421875, 0.01169586181640625, 0.016954421997070312, 0.022212982177734375, 0.027471542358398438, 0.0327301025390625, 0.03798866271972656, 0.043247222900390625, 0.04850578308105469, 0.05376434326171875, 0.05902290344238281, 0.06428146362304688, 0.06954002380371094, 0.074798583984375, 0.08005714416503906, 0.08531570434570312, 0.09057426452636719, 0.09583282470703125, 0.10109138488769531, 0.10634994506835938, 0.11160850524902344, 0.1168670654296875, 0.12212562561035156, 0.12738418579101562, 0.1326427459716797, 0.13790130615234375, 0.1431598663330078, 0.14841842651367188, 0.15367698669433594, 0.158935546875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 5.0, 11.0, 6.0, 6.0, 6.0, 20.0, 16.0, 7.0, 19.0, 14.0, 28.0, 28.0, 36.0, 40.0, 40.0, 28.0, 47.0, 38.0, 43.0, 42.0, 48.0, 48.0, 57.0, 27.0, 48.0, 35.0, 38.0, 42.0, 37.0, 18.0, 25.0, 19.0, 17.0, 15.0, 13.0, 5.0, 8.0, 3.0, 5.0, 5.0, 3.0, 5.0, 4.0, 4.0, 0.0, 1.0, 2.0, 4.0], "bins": [-0.331787109375, -0.322662353515625, -0.31353759765625, -0.304412841796875, -0.2952880859375, -0.286163330078125, -0.27703857421875, -0.267913818359375, -0.2587890625, -0.249664306640625, -0.24053955078125, -0.231414794921875, -0.2222900390625, -0.213165283203125, -0.20404052734375, -0.194915771484375, -0.185791015625, -0.176666259765625, -0.16754150390625, -0.158416748046875, -0.1492919921875, -0.140167236328125, -0.13104248046875, -0.121917724609375, -0.11279296875, -0.103668212890625, -0.09454345703125, -0.085418701171875, -0.0762939453125, -0.067169189453125, -0.05804443359375, -0.048919677734375, -0.039794921875, -0.030670166015625, -0.02154541015625, -0.012420654296875, -0.0032958984375, 0.005828857421875, 0.01495361328125, 0.024078369140625, 0.033203125, 0.042327880859375, 0.05145263671875, 0.060577392578125, 0.0697021484375, 0.078826904296875, 0.08795166015625, 0.097076416015625, 0.106201171875, 0.115325927734375, 0.12445068359375, 0.133575439453125, 0.1427001953125, 0.151824951171875, 0.16094970703125, 0.170074462890625, 0.17919921875, 0.188323974609375, 0.19744873046875, 0.206573486328125, 0.2156982421875, 0.224822998046875, 0.23394775390625, 0.243072509765625, 0.252197265625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 8.0, 10.0, 12.0, 13.0, 37.0, 40.0, 49.0, 103.0, 141.0, 219.0, 388.0, 616.0, 1215.0, 2223.0, 4602.0, 10938.0, 34632.0, 172833.0, 633183.0, 139494.0, 29456.0, 9636.0, 4001.0, 1979.0, 1151.0, 582.0, 364.0, 191.0, 141.0, 91.0, 63.0, 55.0, 30.0, 14.0, 9.0, 11.0, 8.0, 4.0, 5.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0294036865234375, -0.02843785285949707, -0.02747201919555664, -0.02650618553161621, -0.02554035186767578, -0.02457451820373535, -0.023608684539794922, -0.022642850875854492, -0.021677017211914062, -0.020711183547973633, -0.019745349884033203, -0.018779516220092773, -0.017813682556152344, -0.016847848892211914, -0.015882015228271484, -0.014916181564331055, -0.013950347900390625, -0.012984514236450195, -0.012018680572509766, -0.011052846908569336, -0.010087013244628906, -0.009121179580688477, -0.008155345916748047, -0.007189512252807617, -0.0062236785888671875, -0.005257844924926758, -0.004292011260986328, -0.0033261775970458984, -0.0023603439331054688, -0.001394510269165039, -0.0004286766052246094, 0.0005371570587158203, 0.00150299072265625, 0.0024688243865966797, 0.0034346580505371094, 0.004400491714477539, 0.005366325378417969, 0.0063321590423583984, 0.007297992706298828, 0.008263826370239258, 0.009229660034179688, 0.010195493698120117, 0.011161327362060547, 0.012127161026000977, 0.013092994689941406, 0.014058828353881836, 0.015024662017822266, 0.015990495681762695, 0.016956329345703125, 0.017922163009643555, 0.018887996673583984, 0.019853830337524414, 0.020819664001464844, 0.021785497665405273, 0.022751331329345703, 0.023717164993286133, 0.024682998657226562, 0.025648832321166992, 0.026614665985107422, 0.02758049964904785, 0.02854633331298828, 0.02951216697692871, 0.03047800064086914, 0.03144383430480957, 0.03240966796875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 0.0, 4.0, 6.0, 5.0, 4.0, 8.0, 5.0, 10.0, 19.0, 24.0, 36.0, 50.0, 80.0, 96.0, 122.0, 138.0, 119.0, 75.0, 49.0, 47.0, 31.0, 18.0, 11.0, 14.0, 4.0, 7.0, 3.0, 5.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.0265579223632812e-05, -1.968909054994583e-05, -1.911260187625885e-05, -1.853611320257187e-05, -1.7959624528884888e-05, -1.7383135855197906e-05, -1.6806647181510925e-05, -1.6230158507823944e-05, -1.5653669834136963e-05, -1.5077181160449982e-05, -1.4500692486763e-05, -1.392420381307602e-05, -1.3347715139389038e-05, -1.2771226465702057e-05, -1.2194737792015076e-05, -1.1618249118328094e-05, -1.1041760444641113e-05, -1.0465271770954132e-05, -9.888783097267151e-06, -9.31229442358017e-06, -8.735805749893188e-06, -8.159317076206207e-06, -7.582828402519226e-06, -7.006339728832245e-06, -6.429851055145264e-06, -5.8533623814582825e-06, -5.276873707771301e-06, -4.70038503408432e-06, -4.123896360397339e-06, -3.5474076867103577e-06, -2.9709190130233765e-06, -2.3944303393363953e-06, -1.817941665649414e-06, -1.2414529919624329e-06, -6.649643182754517e-07, -8.847564458847046e-08, 4.880130290985107e-07, 1.064501702785492e-06, 1.6409903764724731e-06, 2.2174790501594543e-06, 2.7939677238464355e-06, 3.3704563975334167e-06, 3.946945071220398e-06, 4.523433744907379e-06, 5.09992241859436e-06, 5.6764110922813416e-06, 6.252899765968323e-06, 6.829388439655304e-06, 7.405877113342285e-06, 7.982365787029266e-06, 8.558854460716248e-06, 9.135343134403229e-06, 9.71183180809021e-06, 1.0288320481777191e-05, 1.0864809155464172e-05, 1.1441297829151154e-05, 1.2017786502838135e-05, 1.2594275176525116e-05, 1.3170763850212097e-05, 1.3747252523899078e-05, 1.432374119758606e-05, 1.490022987127304e-05, 1.5476718544960022e-05, 1.6053207218647003e-05, 1.6629695892333984e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 9.0, 13.0, 10.0, 14.0, 24.0, 32.0, 52.0, 100.0, 181.0, 458.0, 1176.0, 4146.0, 19579.0, 153131.0, 746594.0, 103078.0, 14776.0, 3433.0, 1021.0, 370.0, 148.0, 75.0, 36.0, 34.0, 18.0, 15.0, 9.0, 4.0, 8.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042816162109375, -0.041408538818359375, -0.04000091552734375, -0.038593292236328125, -0.0371856689453125, -0.035778045654296875, -0.03437042236328125, -0.032962799072265625, -0.03155517578125, -0.030147552490234375, -0.02873992919921875, -0.027332305908203125, -0.0259246826171875, -0.024517059326171875, -0.02310943603515625, -0.021701812744140625, -0.020294189453125, -0.018886566162109375, -0.01747894287109375, -0.016071319580078125, -0.0146636962890625, -0.013256072998046875, -0.01184844970703125, -0.010440826416015625, -0.009033203125, -0.007625579833984375, -0.00621795654296875, -0.004810333251953125, -0.0034027099609375, -0.001995086669921875, -0.00058746337890625, 0.000820159912109375, 0.002227783203125, 0.003635406494140625, 0.00504302978515625, 0.006450653076171875, 0.0078582763671875, 0.009265899658203125, 0.01067352294921875, 0.012081146240234375, 0.01348876953125, 0.014896392822265625, 0.01630401611328125, 0.017711639404296875, 0.0191192626953125, 0.020526885986328125, 0.02193450927734375, 0.023342132568359375, 0.024749755859375, 0.026157379150390625, 0.02756500244140625, 0.028972625732421875, 0.0303802490234375, 0.031787872314453125, 0.03319549560546875, 0.034603118896484375, 0.0360107421875, 0.037418365478515625, 0.03882598876953125, 0.040233612060546875, 0.0416412353515625, 0.043048858642578125, 0.04445648193359375, 0.045864105224609375, 0.047271728515625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 3.0, 5.0, 9.0, 10.0, 14.0, 14.0, 17.0, 27.0, 36.0, 41.0, 45.0, 48.0, 63.0, 74.0, 94.0, 118.0, 67.0, 60.0, 36.0, 35.0, 39.0, 31.0, 20.0, 28.0, 17.0, 12.0, 5.0, 6.0, 9.0, 7.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006473541259765625, -0.006262838840484619, -0.006052136421203613, -0.005841434001922607, -0.0056307315826416016, -0.005420029163360596, -0.00520932674407959, -0.004998624324798584, -0.004787921905517578, -0.004577219486236572, -0.004366517066955566, -0.0041558146476745605, -0.003945112228393555, -0.003734409809112549, -0.003523707389831543, -0.003313004970550537, -0.0031023025512695312, -0.0028916001319885254, -0.0026808977127075195, -0.0024701952934265137, -0.002259492874145508, -0.002048790454864502, -0.001838088035583496, -0.0016273856163024902, -0.0014166831970214844, -0.0012059807777404785, -0.0009952783584594727, -0.0007845759391784668, -0.0005738735198974609, -0.0003631711006164551, -0.00015246868133544922, 5.823373794555664e-05, 0.0002689361572265625, 0.00047963857650756836, 0.0006903409957885742, 0.0009010434150695801, 0.001111745834350586, 0.0013224482536315918, 0.0015331506729125977, 0.0017438530921936035, 0.0019545555114746094, 0.0021652579307556152, 0.002375960350036621, 0.002586662769317627, 0.002797365188598633, 0.0030080676078796387, 0.0032187700271606445, 0.0034294724464416504, 0.0036401748657226562, 0.003850877285003662, 0.004061579704284668, 0.004272282123565674, 0.00448298454284668, 0.0046936869621276855, 0.004904389381408691, 0.005115091800689697, 0.005325794219970703, 0.005536496639251709, 0.005747199058532715, 0.005957901477813721, 0.0061686038970947266, 0.006379306316375732, 0.006590008735656738, 0.006800711154937744, 0.00701141357421875]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 11.0, 10.0, 32.0, 34.0, 52.0, 62.0, 90.0, 101.0, 148.0, 119.0, 94.0, 71.0, 55.0, 34.0, 23.0, 19.0, 7.0, 10.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28356653451919556, -0.2743428945541382, -0.2651192545890808, -0.25589561462402344, -0.24667198956012726, -0.23744834959506989, -0.2282247245311737, -0.21900108456611633, -0.20977744460105896, -0.2005538046360016, -0.1913301646709442, -0.18210653960704803, -0.17288289964199066, -0.1636592596769333, -0.1544356346130371, -0.14521199464797974, -0.13598835468292236, -0.126764714717865, -0.11754108220338821, -0.10831744968891144, -0.09909380972385406, -0.08987016975879669, -0.08064653724431992, -0.07142290472984314, -0.06219926476478577, -0.05297562852501869, -0.04375199228525162, -0.03452835604548454, -0.025304719805717468, -0.016081083565950394, -0.006857447326183319, 0.002366185188293457, 0.011589854955673218, 0.020813491195440292, 0.030037127435207367, 0.03926076367497444, 0.048484399914741516, 0.05770803615450859, 0.06693167239427567, 0.07615530490875244, 0.08537894487380981, 0.09460258483886719, 0.10382621735334396, 0.11304984986782074, 0.12227348983287811, 0.13149712979793549, 0.14072075486183167, 0.14994439482688904, 0.1591680347919464, 0.16839167475700378, 0.17761531472206116, 0.18683893978595734, 0.1960625797510147, 0.20528621971607208, 0.21450984477996826, 0.22373348474502563, 0.232957124710083, 0.24218076467514038, 0.25140440464019775, 0.2606280446052551, 0.2698516845703125, 0.2790752947330475, 0.28829893469810486, 0.29752257466316223, 0.3067462146282196]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 4.0, 10.0, 13.0, 18.0, 22.0, 30.0, 45.0, 69.0, 76.0, 68.0, 81.0, 80.0, 77.0, 71.0, 85.0, 74.0, 59.0, 35.0, 32.0, 23.0, 14.0, 11.0, 8.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13032345473766327, -0.12155041843652725, -0.11277738213539124, -0.10400435328483582, -0.0952313095331192, -0.08645828068256378, -0.07768524438142776, -0.06891220808029175, -0.06013917177915573, -0.051366135478019714, -0.0425930991768837, -0.03382006660103798, -0.025047030299901962, -0.016273993998765945, -0.007500961422920227, 0.0012720748782157898, 0.010045111179351807, 0.018818147480487823, 0.02759118191897869, 0.03636421635746956, 0.045137252658605576, 0.05391028895974159, 0.06268332153558731, 0.07145635783672333, 0.08022939413785934, 0.08900243043899536, 0.09777546674013138, 0.1065485030412674, 0.11532153189182281, 0.12409457564353943, 0.13286760449409485, 0.14164063334465027, 0.1504136621952057, 0.1591866910457611, 0.16795973479747772, 0.17673276364803314, 0.18550580739974976, 0.19427883625030518, 0.2030518651008606, 0.2118249088525772, 0.22059795260429382, 0.22937098145484924, 0.23814402520656586, 0.24691705405712128, 0.2556900978088379, 0.2644631266593933, 0.27323615550994873, 0.28200918436050415, 0.29078221321105957, 0.299555242061615, 0.3083282709121704, 0.3171013295650482, 0.32587435841560364, 0.33464738726615906, 0.3434204161167145, 0.3521934747695923, 0.3609665036201477, 0.3697395324707031, 0.37851256132125854, 0.38728561997413635, 0.3960586488246918, 0.4048316776752472, 0.4136047065258026, 0.4223777651786804, 0.43115079402923584]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 10.0, 19.0, 25.0, 47.0, 57.0, 102.0, 190.0, 284.0, 506.0, 929.0, 1525.0, 3015.0, 5802.0, 12667.0, 32302.0, 122543.0, 657589.0, 147304.0, 36200.0, 13835.0, 6325.0, 3309.0, 1687.0, 927.0, 541.0, 308.0, 200.0, 116.0, 60.0, 52.0, 24.0, 20.0, 5.0, 7.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.335205078125, -0.3252143859863281, -0.31522369384765625, -0.3052330017089844, -0.2952423095703125, -0.2852516174316406, -0.27526092529296875, -0.2652702331542969, -0.255279541015625, -0.24528884887695312, -0.23529815673828125, -0.22530746459960938, -0.2153167724609375, -0.20532608032226562, -0.19533538818359375, -0.18534469604492188, -0.17535400390625, -0.16536331176757812, -0.15537261962890625, -0.14538192749023438, -0.1353912353515625, -0.12540054321289062, -0.11540985107421875, -0.10541915893554688, -0.095428466796875, -0.08543777465820312, -0.07544708251953125, -0.06545639038085938, -0.0554656982421875, -0.045475006103515625, -0.03548431396484375, -0.025493621826171875, -0.0155029296875, -0.005512237548828125, 0.00447845458984375, 0.014469146728515625, 0.0244598388671875, 0.034450531005859375, 0.04444122314453125, 0.054431915283203125, 0.064422607421875, 0.07441329956054688, 0.08440399169921875, 0.09439468383789062, 0.1043853759765625, 0.11437606811523438, 0.12436676025390625, 0.13435745239257812, 0.14434814453125, 0.15433883666992188, 0.16432952880859375, 0.17432022094726562, 0.1843109130859375, 0.19430160522460938, 0.20429229736328125, 0.21428298950195312, 0.224273681640625, 0.23426437377929688, 0.24425506591796875, 0.2542457580566406, 0.2642364501953125, 0.2742271423339844, 0.28421783447265625, 0.2942085266113281, 0.30419921875]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 8.0, 9.0, 20.0, 11.0, 31.0, 36.0, 55.0, 64.0, 62.0, 77.0, 93.0, 74.0, 76.0, 84.0, 63.0, 73.0, 52.0, 35.0, 26.0, 20.0, 9.0, 9.0, 7.0, 6.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28125, -0.2651519775390625, -0.249053955078125, -0.2329559326171875, -0.21685791015625, -0.2007598876953125, -0.184661865234375, -0.1685638427734375, -0.1524658203125, -0.1363677978515625, -0.120269775390625, -0.1041717529296875, -0.08807373046875, -0.0719757080078125, -0.055877685546875, -0.0397796630859375, -0.023681640625, -0.0075836181640625, 0.008514404296875, 0.0246124267578125, 0.04071044921875, 0.0568084716796875, 0.072906494140625, 0.0890045166015625, 0.1051025390625, 0.1212005615234375, 0.137298583984375, 0.1533966064453125, 0.16949462890625, 0.1855926513671875, 0.201690673828125, 0.2177886962890625, 0.23388671875, 0.2499847412109375, 0.266082763671875, 0.2821807861328125, 0.29827880859375, 0.3143768310546875, 0.330474853515625, 0.3465728759765625, 0.3626708984375, 0.3787689208984375, 0.394866943359375, 0.4109649658203125, 0.42706298828125, 0.4431610107421875, 0.459259033203125, 0.4753570556640625, 0.491455078125, 0.5075531005859375, 0.523651123046875, 0.5397491455078125, 0.55584716796875, 0.5719451904296875, 0.588043212890625, 0.6041412353515625, 0.6202392578125, 0.6363372802734375, 0.652435302734375, 0.6685333251953125, 0.68463134765625, 0.7007293701171875, 0.716827392578125, 0.7329254150390625, 0.7490234375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 6.0, 3.0, 5.0, 8.0, 14.0, 11.0, 14.0, 13.0, 25.0, 26.0, 42.0, 40.0, 58.0, 75.0, 74.0, 188.0, 409.0, 1666.0, 20922.0, 948494.0, 71593.0, 3587.0, 546.0, 220.0, 140.0, 79.0, 71.0, 51.0, 35.0, 27.0, 26.0, 23.0, 21.0, 10.0, 9.0, 10.0, 5.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.0751953125, -1.044189453125, -1.01318359375, -0.982177734375, -0.951171875, -0.920166015625, -0.88916015625, -0.858154296875, -0.8271484375, -0.796142578125, -0.76513671875, -0.734130859375, -0.703125, -0.672119140625, -0.64111328125, -0.610107421875, -0.5791015625, -0.548095703125, -0.51708984375, -0.486083984375, -0.455078125, -0.424072265625, -0.39306640625, -0.362060546875, -0.3310546875, -0.300048828125, -0.26904296875, -0.238037109375, -0.20703125, -0.176025390625, -0.14501953125, -0.114013671875, -0.0830078125, -0.052001953125, -0.02099609375, 0.010009765625, 0.041015625, 0.072021484375, 0.10302734375, 0.134033203125, 0.1650390625, 0.196044921875, 0.22705078125, 0.258056640625, 0.2890625, 0.320068359375, 0.35107421875, 0.382080078125, 0.4130859375, 0.444091796875, 0.47509765625, 0.506103515625, 0.537109375, 0.568115234375, 0.59912109375, 0.630126953125, 0.6611328125, 0.692138671875, 0.72314453125, 0.754150390625, 0.78515625, 0.816162109375, 0.84716796875, 0.878173828125, 0.9091796875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 8.0, 11.0, 6.0, 6.0, 7.0, 14.0, 14.0, 20.0, 17.0, 27.0, 33.0, 38.0, 44.0, 37.0, 50.0, 45.0, 56.0, 46.0, 59.0, 44.0, 47.0, 49.0, 49.0, 41.0, 47.0, 30.0, 34.0, 23.0, 20.0, 23.0, 11.0, 12.0, 10.0, 9.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33447265625, -0.3241767883300781, -0.31388092041015625, -0.3035850524902344, -0.2932891845703125, -0.2829933166503906, -0.27269744873046875, -0.2624015808105469, -0.252105712890625, -0.24180984497070312, -0.23151397705078125, -0.22121810913085938, -0.2109222412109375, -0.20062637329101562, -0.19033050537109375, -0.18003463745117188, -0.16973876953125, -0.15944290161132812, -0.14914703369140625, -0.13885116577148438, -0.1285552978515625, -0.11825942993164062, -0.10796356201171875, -0.09766769409179688, -0.087371826171875, -0.07707595825195312, -0.06678009033203125, -0.056484222412109375, -0.0461883544921875, -0.035892486572265625, -0.02559661865234375, -0.015300750732421875, -0.0050048828125, 0.005290985107421875, 0.01558685302734375, 0.025882720947265625, 0.0361785888671875, 0.046474456787109375, 0.05677032470703125, 0.06706619262695312, 0.077362060546875, 0.08765792846679688, 0.09795379638671875, 0.10824966430664062, 0.1185455322265625, 0.12884140014648438, 0.13913726806640625, 0.14943313598632812, 0.15972900390625, 0.17002487182617188, 0.18032073974609375, 0.19061660766601562, 0.2009124755859375, 0.21120834350585938, 0.22150421142578125, 0.23180007934570312, 0.242095947265625, 0.2523918151855469, 0.26268768310546875, 0.2729835510253906, 0.2832794189453125, 0.2935752868652344, 0.30387115478515625, 0.3141670227050781, 0.324462890625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 5.0, 6.0, 6.0, 2.0, 7.0, 9.0, 9.0, 7.0, 18.0, 19.0, 52.0, 97.0, 250.0, 886.0, 3959.0, 39459.0, 954423.0, 43568.0, 4198.0, 995.0, 292.0, 117.0, 55.0, 43.0, 22.0, 14.0, 10.0, 8.0, 8.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.18310546875, -0.17729568481445312, -0.17148590087890625, -0.16567611694335938, -0.1598663330078125, -0.15405654907226562, -0.14824676513671875, -0.14243698120117188, -0.136627197265625, -0.13081741333007812, -0.12500762939453125, -0.11919784545898438, -0.1133880615234375, -0.10757827758789062, -0.10176849365234375, -0.09595870971679688, -0.09014892578125, -0.08433914184570312, -0.07852935791015625, -0.07271957397460938, -0.0669097900390625, -0.061100006103515625, -0.05529022216796875, -0.049480438232421875, -0.043670654296875, -0.037860870361328125, -0.03205108642578125, -0.026241302490234375, -0.0204315185546875, -0.014621734619140625, -0.00881195068359375, -0.003002166748046875, 0.0028076171875, 0.008617401123046875, 0.01442718505859375, 0.020236968994140625, 0.0260467529296875, 0.031856536865234375, 0.03766632080078125, 0.043476104736328125, 0.049285888671875, 0.055095672607421875, 0.06090545654296875, 0.06671524047851562, 0.0725250244140625, 0.07833480834960938, 0.08414459228515625, 0.08995437622070312, 0.09576416015625, 0.10157394409179688, 0.10738372802734375, 0.11319351196289062, 0.1190032958984375, 0.12481307983398438, 0.13062286376953125, 0.13643264770507812, 0.142242431640625, 0.14805221557617188, 0.15386199951171875, 0.15967178344726562, 0.1654815673828125, 0.17129135131835938, 0.17710113525390625, 0.18291091918945312, 0.188720703125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 2.0, 4.0, 4.0, 4.0, 14.0, 10.0, 16.0, 33.0, 36.0, 83.0, 153.0, 212.0, 160.0, 83.0, 53.0, 39.0, 25.0, 15.0, 8.0, 11.0, 8.0, 2.0, 7.0, 3.0, 8.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7940998077392578e-05, -1.7449259757995605e-05, -1.6957521438598633e-05, -1.646578311920166e-05, -1.5974044799804688e-05, -1.5482306480407715e-05, -1.4990568161010742e-05, -1.449882984161377e-05, -1.4007091522216797e-05, -1.3515353202819824e-05, -1.3023614883422852e-05, -1.2531876564025879e-05, -1.2040138244628906e-05, -1.1548399925231934e-05, -1.1056661605834961e-05, -1.0564923286437988e-05, -1.0073184967041016e-05, -9.581446647644043e-06, -9.08970832824707e-06, -8.597970008850098e-06, -8.106231689453125e-06, -7.614493370056152e-06, -7.12275505065918e-06, -6.631016731262207e-06, -6.139278411865234e-06, -5.647540092468262e-06, -5.155801773071289e-06, -4.664063453674316e-06, -4.172325134277344e-06, -3.680586814880371e-06, -3.1888484954833984e-06, -2.6971101760864258e-06, -2.205371856689453e-06, -1.7136335372924805e-06, -1.2218952178955078e-06, -7.301568984985352e-07, -2.384185791015625e-07, 2.5331974029541016e-07, 7.450580596923828e-07, 1.2367963790893555e-06, 1.7285346984863281e-06, 2.2202730178833008e-06, 2.7120113372802734e-06, 3.203749656677246e-06, 3.6954879760742188e-06, 4.187226295471191e-06, 4.678964614868164e-06, 5.170702934265137e-06, 5.662441253662109e-06, 6.154179573059082e-06, 6.645917892456055e-06, 7.137656211853027e-06, 7.62939453125e-06, 8.121132850646973e-06, 8.612871170043945e-06, 9.104609489440918e-06, 9.59634780883789e-06, 1.0088086128234863e-05, 1.0579824447631836e-05, 1.1071562767028809e-05, 1.1563301086425781e-05, 1.2055039405822754e-05, 1.2546777725219727e-05, 1.30385160446167e-05, 1.3530254364013672e-05]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 10.0, 10.0, 14.0, 15.0, 24.0, 37.0, 62.0, 100.0, 211.0, 465.0, 1269.0, 3856.0, 17912.0, 304661.0, 686248.0, 26189.0, 4837.0, 1509.0, 557.0, 234.0, 109.0, 67.0, 52.0, 31.0, 21.0, 10.0, 8.0, 5.0, 6.0, 0.0, 4.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.150390625, -0.1461048126220703, -0.14181900024414062, -0.13753318786621094, -0.13324737548828125, -0.12896156311035156, -0.12467575073242188, -0.12038993835449219, -0.1161041259765625, -0.11181831359863281, -0.10753250122070312, -0.10324668884277344, -0.09896087646484375, -0.09467506408691406, -0.09038925170898438, -0.08610343933105469, -0.081817626953125, -0.07753181457519531, -0.07324600219726562, -0.06896018981933594, -0.06467437744140625, -0.06038856506347656, -0.056102752685546875, -0.05181694030761719, -0.0475311279296875, -0.04324531555175781, -0.038959503173828125, -0.03467369079589844, -0.03038787841796875, -0.026102066040039062, -0.021816253662109375, -0.017530441284179688, -0.01324462890625, -0.008958816528320312, -0.004673004150390625, -0.0003871917724609375, 0.00389862060546875, 0.008184432983398438, 0.012470245361328125, 0.016756057739257812, 0.0210418701171875, 0.025327682495117188, 0.029613494873046875, 0.03389930725097656, 0.03818511962890625, 0.04247093200683594, 0.046756744384765625, 0.05104255676269531, 0.055328369140625, 0.05961418151855469, 0.06389999389648438, 0.06818580627441406, 0.07247161865234375, 0.07675743103027344, 0.08104324340820312, 0.08532905578613281, 0.0896148681640625, 0.09390068054199219, 0.09818649291992188, 0.10247230529785156, 0.10675811767578125, 0.11104393005371094, 0.11532974243164062, 0.11961555480957031, 0.1239013671875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 4.0, 8.0, 12.0, 14.0, 13.0, 18.0, 32.0, 39.0, 54.0, 79.0, 117.0, 153.0, 127.0, 76.0, 80.0, 48.0, 37.0, 29.0, 18.0, 12.0, 6.0, 3.0, 5.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.03936767578125, -0.038074493408203125, -0.03678131103515625, -0.035488128662109375, -0.0341949462890625, -0.032901763916015625, -0.03160858154296875, -0.030315399169921875, -0.029022216796875, -0.027729034423828125, -0.02643585205078125, -0.025142669677734375, -0.0238494873046875, -0.022556304931640625, -0.02126312255859375, -0.019969940185546875, -0.0186767578125, -0.017383575439453125, -0.01609039306640625, -0.014797210693359375, -0.0135040283203125, -0.012210845947265625, -0.01091766357421875, -0.009624481201171875, -0.008331298828125, -0.007038116455078125, -0.00574493408203125, -0.004451751708984375, -0.0031585693359375, -0.001865386962890625, -0.00057220458984375, 0.000720977783203125, 0.00201416015625, 0.003307342529296875, 0.00460052490234375, 0.005893707275390625, 0.0071868896484375, 0.008480072021484375, 0.00977325439453125, 0.011066436767578125, 0.012359619140625, 0.013652801513671875, 0.01494598388671875, 0.016239166259765625, 0.0175323486328125, 0.018825531005859375, 0.02011871337890625, 0.021411895751953125, 0.022705078125, 0.023998260498046875, 0.02529144287109375, 0.026584625244140625, 0.0278778076171875, 0.029170989990234375, 0.03046417236328125, 0.031757354736328125, 0.033050537109375, 0.034343719482421875, 0.03563690185546875, 0.036930084228515625, 0.0382232666015625, 0.039516448974609375, 0.04080963134765625, 0.042102813720703125, 0.04339599609375]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 8.0, 9.0, 23.0, 37.0, 47.0, 140.0, 180.0, 204.0, 153.0, 91.0, 51.0, 22.0, 18.0, 7.0, 9.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5272629857063293, -0.4985676407814026, -0.46987229585647583, -0.44117698073387146, -0.4124816358089447, -0.38378629088401794, -0.3550909757614136, -0.3263956308364868, -0.29770028591156006, -0.2690049409866333, -0.24030961096286774, -0.21161428093910217, -0.18291893601417542, -0.15422359108924866, -0.1255282610654831, -0.09683293104171753, -0.06813758611679077, -0.03944224864244461, -0.01074691116809845, 0.01794842630624771, 0.04664376378059387, 0.07533910870552063, 0.1040344387292862, 0.13272976875305176, 0.16142511367797852, 0.19012045860290527, 0.21881578862667084, 0.2475111186504364, 0.27620646357536316, 0.3049018085002899, 0.3335971236228943, 0.36229246854782104, 0.390987753868103, 0.4196830987930298, 0.44837844371795654, 0.4770737588405609, 0.5057691335678101, 0.5344644784927368, 0.5631597638130188, 0.5918551087379456, 0.6205504536628723, 0.6492457985877991, 0.6779411435127258, 0.7066364884376526, 0.7353317737579346, 0.7640271186828613, 0.7927224636077881, 0.8214178085327148, 0.8501131534576416, 0.8788084983825684, 0.9075038433074951, 0.9361991882324219, 0.9648945331573486, 0.9935898780822754, 1.0222852230072021, 1.050980567932129, 1.0796759128570557, 1.1083712577819824, 1.1370666027069092, 1.165761947631836, 1.1944572925567627, 1.2231526374816895, 1.2518479824066162, 1.280543327331543, 1.3092385530471802]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 7.0, 7.0, 7.0, 9.0, 18.0, 12.0, 22.0, 12.0, 24.0, 30.0, 24.0, 33.0, 35.0, 22.0, 40.0, 38.0, 51.0, 42.0, 53.0, 44.0, 42.0, 54.0, 43.0, 41.0, 37.0, 36.0, 35.0, 32.0, 25.0, 26.0, 16.0, 22.0, 12.0, 13.0, 9.0, 7.0, 10.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37177786231040955, -0.35603827238082886, -0.3402986526489258, -0.3245590627193451, -0.3088194727897644, -0.29307985305786133, -0.27734026312828064, -0.26160067319869995, -0.24586106836795807, -0.2301214635372162, -0.2143818736076355, -0.19864226877689362, -0.18290266394615173, -0.16716307401657104, -0.15142346918582916, -0.13568386435508728, -0.11994427442550659, -0.1042046770453453, -0.08846507966518402, -0.07272547483444214, -0.05698587745428085, -0.04124628007411957, -0.025506675243377686, -0.0097670778632164, 0.005972519516944885, 0.02171211875975132, 0.037451718002557755, 0.05319131910800934, 0.06893091648817062, 0.08467051386833191, 0.10041011869907379, 0.11614971607923508, 0.13188934326171875, 0.14762894809246063, 0.16336853802204132, 0.1791081428527832, 0.1948477327823639, 0.21058733761310577, 0.22632694244384766, 0.24206653237342834, 0.25780612230300903, 0.2735457122325897, 0.2892853319644928, 0.3050249218940735, 0.3207645118236542, 0.33650410175323486, 0.35224372148513794, 0.36798331141471863, 0.3837229311466217, 0.3994625210762024, 0.41520214080810547, 0.43094173073768616, 0.44668132066726685, 0.4624209403991699, 0.4781605303287506, 0.4939001202583313, 0.5096397399902344, 0.5253793597221375, 0.5411189198493958, 0.5568585395812988, 0.5725981593132019, 0.5883377194404602, 0.6040773391723633, 0.6198169589042664, 0.6355565190315247]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 5.0, 5.0, 10.0, 8.0, 8.0, 17.0, 23.0, 31.0, 29.0, 42.0, 69.0, 72.0, 118.0, 177.0, 283.0, 408.0, 656.0, 1187.0, 2088.0, 4385.0, 10444.0, 42519.0, 825234.0, 3049629.0, 222437.0, 20239.0, 7002.0, 3046.0, 1606.0, 884.0, 554.0, 309.0, 223.0, 160.0, 96.0, 57.0, 68.0, 42.0, 29.0, 22.0, 11.0, 15.0, 7.0, 4.0, 5.0, 10.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.423583984375, -0.40959930419921875, -0.3956146240234375, -0.38162994384765625, -0.367645263671875, -0.35366058349609375, -0.3396759033203125, -0.32569122314453125, -0.31170654296875, -0.29772186279296875, -0.2837371826171875, -0.26975250244140625, -0.255767822265625, -0.24178314208984375, -0.2277984619140625, -0.21381378173828125, -0.1998291015625, -0.18584442138671875, -0.1718597412109375, -0.15787506103515625, -0.143890380859375, -0.12990570068359375, -0.1159210205078125, -0.10193634033203125, -0.08795166015625, -0.07396697998046875, -0.0599822998046875, -0.04599761962890625, -0.032012939453125, -0.01802825927734375, -0.0040435791015625, 0.00994110107421875, 0.02392578125, 0.03791046142578125, 0.0518951416015625, 0.06587982177734375, 0.079864501953125, 0.09384918212890625, 0.1078338623046875, 0.12181854248046875, 0.13580322265625, 0.14978790283203125, 0.1637725830078125, 0.17775726318359375, 0.191741943359375, 0.20572662353515625, 0.2197113037109375, 0.23369598388671875, 0.2476806640625, 0.26166534423828125, 0.2756500244140625, 0.28963470458984375, 0.303619384765625, 0.31760406494140625, 0.3315887451171875, 0.34557342529296875, 0.35955810546875, 0.37354278564453125, 0.3875274658203125, 0.40151214599609375, 0.415496826171875, 0.42948150634765625, 0.4434661865234375, 0.45745086669921875, 0.471435546875]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 6.0, 5.0, 10.0, 1.0, 8.0, 6.0, 7.0, 13.0, 8.0, 13.0, 17.0, 16.0, 21.0, 14.0, 32.0, 27.0, 33.0, 30.0, 28.0, 34.0, 38.0, 30.0, 46.0, 33.0, 47.0, 43.0, 43.0, 46.0, 35.0, 32.0, 25.0, 29.0, 28.0, 34.0, 22.0, 15.0, 15.0, 25.0, 20.0, 15.0, 10.0, 7.0, 10.0, 5.0, 2.0, 5.0, 6.0, 2.0, 8.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.184814453125, -0.17955780029296875, -0.1743011474609375, -0.16904449462890625, -0.163787841796875, -0.15853118896484375, -0.1532745361328125, -0.14801788330078125, -0.14276123046875, -0.13750457763671875, -0.1322479248046875, -0.12699127197265625, -0.121734619140625, -0.11647796630859375, -0.1112213134765625, -0.10596466064453125, -0.1007080078125, -0.09545135498046875, -0.0901947021484375, -0.08493804931640625, -0.079681396484375, -0.07442474365234375, -0.0691680908203125, -0.06391143798828125, -0.05865478515625, -0.05339813232421875, -0.0481414794921875, -0.04288482666015625, -0.037628173828125, -0.03237152099609375, -0.0271148681640625, -0.02185821533203125, -0.0166015625, -0.01134490966796875, -0.0060882568359375, -0.00083160400390625, 0.004425048828125, 0.00968170166015625, 0.0149383544921875, 0.02019500732421875, 0.02545166015625, 0.03070831298828125, 0.0359649658203125, 0.04122161865234375, 0.046478271484375, 0.05173492431640625, 0.0569915771484375, 0.06224822998046875, 0.0675048828125, 0.07276153564453125, 0.0780181884765625, 0.08327484130859375, 0.088531494140625, 0.09378814697265625, 0.0990447998046875, 0.10430145263671875, 0.10955810546875, 0.11481475830078125, 0.1200714111328125, 0.12532806396484375, 0.130584716796875, 0.13584136962890625, 0.1410980224609375, 0.14635467529296875, 0.151611328125]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 3.0, 3.0, 6.0, 5.0, 10.0, 7.0, 11.0, 11.0, 15.0, 15.0, 37.0, 39.0, 46.0, 77.0, 122.0, 206.0, 748.0, 5431.0, 1522983.0, 2657565.0, 5659.0, 726.0, 191.0, 91.0, 65.0, 68.0, 31.0, 29.0, 13.0, 15.0, 18.0, 5.0, 9.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.62890625, -1.58489990234375, -1.5408935546875, -1.49688720703125, -1.452880859375, -1.40887451171875, -1.3648681640625, -1.32086181640625, -1.27685546875, -1.23284912109375, -1.1888427734375, -1.14483642578125, -1.100830078125, -1.05682373046875, -1.0128173828125, -0.96881103515625, -0.9248046875, -0.88079833984375, -0.8367919921875, -0.79278564453125, -0.748779296875, -0.70477294921875, -0.6607666015625, -0.61676025390625, -0.57275390625, -0.52874755859375, -0.4847412109375, -0.44073486328125, -0.396728515625, -0.35272216796875, -0.3087158203125, -0.26470947265625, -0.220703125, -0.17669677734375, -0.1326904296875, -0.08868408203125, -0.044677734375, -0.00067138671875, 0.0433349609375, 0.08734130859375, 0.13134765625, 0.17535400390625, 0.2193603515625, 0.26336669921875, 0.307373046875, 0.35137939453125, 0.3953857421875, 0.43939208984375, 0.4833984375, 0.52740478515625, 0.5714111328125, 0.61541748046875, 0.659423828125, 0.70343017578125, 0.7474365234375, 0.79144287109375, 0.83544921875, 0.87945556640625, 0.9234619140625, 0.96746826171875, 1.011474609375, 1.05548095703125, 1.0994873046875, 1.14349365234375, 1.1875]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 2.0, 4.0, 5.0, 11.0, 22.0, 27.0, 31.0, 40.0, 64.0, 126.0, 296.0, 724.0, 1213.0, 808.0, 332.0, 137.0, 70.0, 45.0, 31.0, 23.0, 10.0, 9.0, 16.0, 10.0, 6.0, 4.0, 2.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10369873046875, -0.0993051528930664, -0.09491157531738281, -0.09051799774169922, -0.08612442016601562, -0.08173084259033203, -0.07733726501464844, -0.07294368743896484, -0.06855010986328125, -0.06415653228759766, -0.05976295471191406, -0.05536937713623047, -0.050975799560546875, -0.04658222198486328, -0.04218864440917969, -0.037795066833496094, -0.0334014892578125, -0.029007911682128906, -0.024614334106445312, -0.02022075653076172, -0.015827178955078125, -0.011433601379394531, -0.0070400238037109375, -0.0026464462280273438, 0.00174713134765625, 0.006140708923339844, 0.010534286499023438, 0.014927864074707031, 0.019321441650390625, 0.02371501922607422, 0.028108596801757812, 0.032502174377441406, 0.036895751953125, 0.041289329528808594, 0.04568290710449219, 0.05007648468017578, 0.054470062255859375, 0.05886363983154297, 0.06325721740722656, 0.06765079498291016, 0.07204437255859375, 0.07643795013427734, 0.08083152770996094, 0.08522510528564453, 0.08961868286132812, 0.09401226043701172, 0.09840583801269531, 0.1027994155883789, 0.1071929931640625, 0.1115865707397461, 0.11598014831542969, 0.12037372589111328, 0.12476730346679688, 0.12916088104248047, 0.13355445861816406, 0.13794803619384766, 0.14234161376953125, 0.14673519134521484, 0.15112876892089844, 0.15552234649658203, 0.15991592407226562, 0.16430950164794922, 0.1687030792236328, 0.1730966567993164, 0.177490234375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 9.0, 6.0, 10.0, 12.0, 31.0, 39.0, 52.0, 82.0, 104.0, 139.0, 110.0, 116.0, 70.0, 59.0, 37.0, 32.0, 27.0, 23.0, 12.0, 9.0, 7.0, 4.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2836915850639343, -0.2709067463874817, -0.25812193751335144, -0.24533711373806, -0.23255228996276855, -0.21976745128631592, -0.20698264241218567, -0.19419780373573303, -0.18141299486160278, -0.16862817108631134, -0.1558433473110199, -0.14305852353572845, -0.130273699760437, -0.11748886853456497, -0.10470404475927353, -0.09191922098398209, -0.07913438975811005, -0.0663495659828186, -0.05356474220752716, -0.04077991470694542, -0.027995090931653976, -0.015210263431072235, -0.0024254396557807922, 0.01035938411951065, 0.023144207894802094, 0.035929031670093536, 0.04871385544538498, 0.06149868294596672, 0.07428351044654846, 0.0870683342218399, 0.09985315799713135, 0.11263798177242279, 0.12542280554771423, 0.13820762932300568, 0.15099245309829712, 0.16377727687358856, 0.17656210064888, 0.18934693932533264, 0.2021317481994629, 0.21491658687591553, 0.22770139575004578, 0.24048621952533722, 0.25327104330062866, 0.2660558819770813, 0.27884069085121155, 0.2916255295276642, 0.30441033840179443, 0.31719517707824707, 0.3299800157546997, 0.34276485443115234, 0.3555496633052826, 0.36833450198173523, 0.3811193108558655, 0.3939041495323181, 0.40668895840644836, 0.419473797082901, 0.43225860595703125, 0.4450434446334839, 0.45782825350761414, 0.4706130921840668, 0.483397901058197, 0.49618273973464966, 0.5089675784111023, 0.5217523574829102, 0.5345371961593628]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 5.0, 10.0, 3.0, 5.0, 13.0, 6.0, 13.0, 18.0, 24.0, 15.0, 29.0, 31.0, 34.0, 33.0, 30.0, 36.0, 44.0, 44.0, 41.0, 48.0, 42.0, 53.0, 41.0, 39.0, 39.0, 42.0, 43.0, 36.0, 36.0, 27.0, 22.0, 18.0, 16.0, 16.0, 7.0, 9.0, 8.0, 8.0, 3.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2305736392736435, -0.22390788793563843, -0.21724213659763336, -0.2105763852596283, -0.20391061902046204, -0.19724488258361816, -0.1905791163444519, -0.18391336500644684, -0.17724761366844177, -0.1705818623304367, -0.16391611099243164, -0.15725035965442657, -0.1505846083164215, -0.14391884207725525, -0.13725309073925018, -0.13058733940124512, -0.12392158806324005, -0.11725583672523499, -0.11059008538722992, -0.10392432659864426, -0.09725857526063919, -0.09059282392263412, -0.08392706513404846, -0.0772613137960434, -0.07059556245803833, -0.06392981112003326, -0.0572640560567379, -0.050598300993442535, -0.04393254965543747, -0.037266798317432404, -0.03060104325413704, -0.023935288190841675, -0.017269551753997803, -0.010603798553347588, -0.0039380453526973724, 0.0027277078479528427, 0.009393461048603058, 0.016059212386608124, 0.022724967449903488, 0.029390722513198853, 0.03605647385120392, 0.042722225189208984, 0.04938798025250435, 0.05605373531579971, 0.06271948665380478, 0.06938523799180984, 0.07605099678039551, 0.08271674811840057, 0.08938249945640564, 0.0960482507944107, 0.10271400213241577, 0.10937976092100143, 0.1160455122590065, 0.12271126359701157, 0.12937702238559723, 0.1360427737236023, 0.14270852506160736, 0.14937427639961243, 0.1560400277376175, 0.16270577907562256, 0.16937154531478882, 0.1760372817516327, 0.18270304799079895, 0.18936879932880402, 0.19603455066680908]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 7.0, 5.0, 12.0, 19.0, 25.0, 36.0, 59.0, 69.0, 133.0, 181.0, 259.0, 441.0, 831.0, 1404.0, 2723.0, 5952.0, 14071.0, 41521.0, 170920.0, 560404.0, 179648.0, 42631.0, 14581.0, 6222.0, 2941.0, 1449.0, 789.0, 484.0, 252.0, 183.0, 84.0, 70.0, 40.0, 36.0, 20.0, 14.0, 13.0, 9.0, 2.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.091552734375, -0.0891122817993164, -0.08667182922363281, -0.08423137664794922, -0.08179092407226562, -0.07935047149658203, -0.07691001892089844, -0.07446956634521484, -0.07202911376953125, -0.06958866119384766, -0.06714820861816406, -0.06470775604248047, -0.062267303466796875, -0.05982685089111328, -0.05738639831542969, -0.054945945739746094, -0.0525054931640625, -0.050065040588378906, -0.04762458801269531, -0.04518413543701172, -0.042743682861328125, -0.04030323028564453, -0.03786277770996094, -0.035422325134277344, -0.03298187255859375, -0.030541419982910156, -0.028100967407226562, -0.02566051483154297, -0.023220062255859375, -0.02077960968017578, -0.018339157104492188, -0.015898704528808594, -0.013458251953125, -0.011017799377441406, -0.008577346801757812, -0.006136894226074219, -0.003696441650390625, -0.0012559890747070312, 0.0011844635009765625, 0.0036249160766601562, 0.00606536865234375, 0.008505821228027344, 0.010946273803710938, 0.013386726379394531, 0.015827178955078125, 0.01826763153076172, 0.020708084106445312, 0.023148536682128906, 0.0255889892578125, 0.028029441833496094, 0.030469894409179688, 0.03291034698486328, 0.035350799560546875, 0.03779125213623047, 0.04023170471191406, 0.042672157287597656, 0.04511260986328125, 0.047553062438964844, 0.04999351501464844, 0.05243396759033203, 0.054874420166015625, 0.05731487274169922, 0.05975532531738281, 0.062195777893066406, 0.06463623046875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 3.0, 5.0, 7.0, 13.0, 14.0, 16.0, 18.0, 37.0, 35.0, 36.0, 37.0, 56.0, 42.0, 69.0, 57.0, 64.0, 66.0, 76.0, 50.0, 38.0, 60.0, 50.0, 32.0, 25.0, 31.0, 19.0, 11.0, 4.0, 6.0, 8.0, 4.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.184814453125, -0.178985595703125, -0.17315673828125, -0.167327880859375, -0.1614990234375, -0.155670166015625, -0.14984130859375, -0.144012451171875, -0.13818359375, -0.132354736328125, -0.12652587890625, -0.120697021484375, -0.1148681640625, -0.109039306640625, -0.10321044921875, -0.097381591796875, -0.091552734375, -0.085723876953125, -0.07989501953125, -0.074066162109375, -0.0682373046875, -0.062408447265625, -0.05657958984375, -0.050750732421875, -0.044921875, -0.039093017578125, -0.03326416015625, -0.027435302734375, -0.0216064453125, -0.015777587890625, -0.00994873046875, -0.004119873046875, 0.001708984375, 0.007537841796875, 0.01336669921875, 0.019195556640625, 0.0250244140625, 0.030853271484375, 0.03668212890625, 0.042510986328125, 0.04833984375, 0.054168701171875, 0.05999755859375, 0.065826416015625, 0.0716552734375, 0.077484130859375, 0.08331298828125, 0.089141845703125, 0.094970703125, 0.100799560546875, 0.10662841796875, 0.112457275390625, 0.1182861328125, 0.124114990234375, 0.12994384765625, 0.135772705078125, 0.1416015625, 0.147430419921875, 0.15325927734375, 0.159088134765625, 0.1649169921875, 0.170745849609375, 0.17657470703125, 0.182403564453125, 0.188232421875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 3.0, 5.0, 4.0, 4.0, 5.0, 14.0, 20.0, 29.0, 54.0, 79.0, 163.0, 381.0, 1024.0, 3487.0, 15701.0, 115726.0, 735406.0, 151688.0, 18646.0, 4093.0, 1178.0, 443.0, 170.0, 71.0, 50.0, 36.0, 24.0, 13.0, 7.0, 5.0, 6.0, 7.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12310791015625, -0.11943912506103516, -0.11577033996582031, -0.11210155487060547, -0.10843276977539062, -0.10476398468017578, -0.10109519958496094, -0.0974264144897461, -0.09375762939453125, -0.0900888442993164, -0.08642005920410156, -0.08275127410888672, -0.07908248901367188, -0.07541370391845703, -0.07174491882324219, -0.06807613372802734, -0.0644073486328125, -0.060738563537597656, -0.05706977844238281, -0.05340099334716797, -0.049732208251953125, -0.04606342315673828, -0.04239463806152344, -0.038725852966308594, -0.03505706787109375, -0.031388282775878906, -0.027719497680664062, -0.02405071258544922, -0.020381927490234375, -0.01671314239501953, -0.013044357299804688, -0.009375572204589844, -0.005706787109375, -0.0020380020141601562, 0.0016307830810546875, 0.005299568176269531, 0.008968353271484375, 0.012637138366699219, 0.016305923461914062, 0.019974708557128906, 0.02364349365234375, 0.027312278747558594, 0.030981063842773438, 0.03464984893798828, 0.038318634033203125, 0.04198741912841797, 0.04565620422363281, 0.049324989318847656, 0.0529937744140625, 0.056662559509277344, 0.06033134460449219, 0.06400012969970703, 0.06766891479492188, 0.07133769989013672, 0.07500648498535156, 0.0786752700805664, 0.08234405517578125, 0.0860128402709961, 0.08968162536621094, 0.09335041046142578, 0.09701919555664062, 0.10068798065185547, 0.10435676574707031, 0.10802555084228516, 0.1116943359375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 9.0, 8.0, 11.0, 8.0, 13.0, 14.0, 24.0, 17.0, 27.0, 26.0, 35.0, 35.0, 42.0, 38.0, 45.0, 36.0, 49.0, 52.0, 49.0, 41.0, 44.0, 47.0, 36.0, 42.0, 35.0, 30.0, 35.0, 21.0, 20.0, 16.0, 14.0, 18.0, 11.0, 12.0, 6.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.269775390625, -0.2617378234863281, -0.25370025634765625, -0.24566268920898438, -0.2376251220703125, -0.22958755493164062, -0.22154998779296875, -0.21351242065429688, -0.205474853515625, -0.19743728637695312, -0.18939971923828125, -0.18136215209960938, -0.1733245849609375, -0.16528701782226562, -0.15724945068359375, -0.14921188354492188, -0.14117431640625, -0.13313674926757812, -0.12509918212890625, -0.11706161499023438, -0.1090240478515625, -0.10098648071289062, -0.09294891357421875, -0.08491134643554688, -0.076873779296875, -0.06883621215820312, -0.06079864501953125, -0.052761077880859375, -0.0447235107421875, -0.036685943603515625, -0.02864837646484375, -0.020610809326171875, -0.0125732421875, -0.004535675048828125, 0.00350189208984375, 0.011539459228515625, 0.0195770263671875, 0.027614593505859375, 0.03565216064453125, 0.043689727783203125, 0.051727294921875, 0.059764862060546875, 0.06780242919921875, 0.07583999633789062, 0.0838775634765625, 0.09191513061523438, 0.09995269775390625, 0.10799026489257812, 0.11602783203125, 0.12406539916992188, 0.13210296630859375, 0.14014053344726562, 0.1481781005859375, 0.15621566772460938, 0.16425323486328125, 0.17229080200195312, 0.180328369140625, 0.18836593627929688, 0.19640350341796875, 0.20444107055664062, 0.2124786376953125, 0.22051620483398438, 0.22855377197265625, 0.23659133911132812, 0.24462890625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 0.0, 6.0, 4.0, 4.0, 7.0, 5.0, 19.0, 11.0, 25.0, 23.0, 53.0, 100.0, 190.0, 387.0, 924.0, 2851.0, 10806.0, 67567.0, 760950.0, 178755.0, 19040.0, 4429.0, 1358.0, 530.0, 227.0, 124.0, 74.0, 30.0, 27.0, 11.0, 3.0, 9.0, 5.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0287628173828125, -0.02749466896057129, -0.026226520538330078, -0.024958372116088867, -0.023690223693847656, -0.022422075271606445, -0.021153926849365234, -0.019885778427124023, -0.018617630004882812, -0.0173494815826416, -0.01608133316040039, -0.01481318473815918, -0.013545036315917969, -0.012276887893676758, -0.011008739471435547, -0.009740591049194336, -0.008472442626953125, -0.007204294204711914, -0.005936145782470703, -0.004667997360229492, -0.0033998489379882812, -0.0021317005157470703, -0.0008635520935058594, 0.00040459632873535156, 0.0016727447509765625, 0.0029408931732177734, 0.004209041595458984, 0.005477190017700195, 0.006745338439941406, 0.008013486862182617, 0.009281635284423828, 0.010549783706665039, 0.01181793212890625, 0.013086080551147461, 0.014354228973388672, 0.015622377395629883, 0.016890525817871094, 0.018158674240112305, 0.019426822662353516, 0.020694971084594727, 0.021963119506835938, 0.02323126792907715, 0.02449941635131836, 0.02576756477355957, 0.02703571319580078, 0.028303861618041992, 0.029572010040283203, 0.030840158462524414, 0.032108306884765625, 0.033376455307006836, 0.03464460372924805, 0.03591275215148926, 0.03718090057373047, 0.03844904899597168, 0.03971719741821289, 0.0409853458404541, 0.04225349426269531, 0.04352164268493652, 0.044789791107177734, 0.046057939529418945, 0.047326087951660156, 0.04859423637390137, 0.04986238479614258, 0.05113053321838379, 0.052398681640625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 7.0, 12.0, 9.0, 15.0, 16.0, 27.0, 37.0, 69.0, 74.0, 101.0, 112.0, 151.0, 101.0, 77.0, 55.0, 28.0, 23.0, 22.0, 18.0, 16.0, 9.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3232231140136719e-05, -1.2774020433425903e-05, -1.2315809726715088e-05, -1.1857599020004272e-05, -1.1399388313293457e-05, -1.0941177606582642e-05, -1.0482966899871826e-05, -1.002475619316101e-05, -9.566545486450195e-06, -9.10833477973938e-06, -8.650124073028564e-06, -8.191913366317749e-06, -7.733702659606934e-06, -7.275491952896118e-06, -6.817281246185303e-06, -6.359070539474487e-06, -5.900859832763672e-06, -5.4426491260528564e-06, -4.984438419342041e-06, -4.526227712631226e-06, -4.06801700592041e-06, -3.6098062992095947e-06, -3.1515955924987793e-06, -2.693384885787964e-06, -2.2351741790771484e-06, -1.776963472366333e-06, -1.3187527656555176e-06, -8.605420589447021e-07, -4.023313522338867e-07, 5.587935447692871e-08, 5.140900611877441e-07, 9.723007678985596e-07, 1.430511474609375e-06, 1.8887221813201904e-06, 2.346932888031006e-06, 2.8051435947418213e-06, 3.2633543014526367e-06, 3.721565008163452e-06, 4.179775714874268e-06, 4.637986421585083e-06, 5.0961971282958984e-06, 5.554407835006714e-06, 6.012618541717529e-06, 6.470829248428345e-06, 6.92903995513916e-06, 7.387250661849976e-06, 7.845461368560791e-06, 8.303672075271606e-06, 8.761882781982422e-06, 9.220093488693237e-06, 9.678304195404053e-06, 1.0136514902114868e-05, 1.0594725608825684e-05, 1.1052936315536499e-05, 1.1511147022247314e-05, 1.196935772895813e-05, 1.2427568435668945e-05, 1.288577914237976e-05, 1.3343989849090576e-05, 1.3802200555801392e-05, 1.4260411262512207e-05, 1.4718621969223022e-05, 1.5176832675933838e-05, 1.5635043382644653e-05, 1.609325408935547e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 2.0, 5.0, 4.0, 3.0, 6.0, 8.0, 18.0, 15.0, 21.0, 30.0, 25.0, 45.0, 87.0, 161.0, 279.0, 549.0, 1352.0, 3207.0, 8798.0, 31547.0, 218522.0, 659542.0, 95574.0, 18530.0, 5979.0, 2251.0, 931.0, 426.0, 251.0, 131.0, 80.0, 53.0, 30.0, 23.0, 12.0, 11.0, 6.0, 9.0, 8.0, 8.0, 5.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03094482421875, -0.029987096786499023, -0.029029369354248047, -0.02807164192199707, -0.027113914489746094, -0.026156187057495117, -0.02519845962524414, -0.024240732192993164, -0.023283004760742188, -0.02232527732849121, -0.021367549896240234, -0.020409822463989258, -0.01945209503173828, -0.018494367599487305, -0.017536640167236328, -0.01657891273498535, -0.015621185302734375, -0.014663457870483398, -0.013705730438232422, -0.012748003005981445, -0.011790275573730469, -0.010832548141479492, -0.009874820709228516, -0.008917093276977539, -0.007959365844726562, -0.007001638412475586, -0.006043910980224609, -0.005086183547973633, -0.004128456115722656, -0.0031707286834716797, -0.002213001251220703, -0.0012552738189697266, -0.00029754638671875, 0.0006601810455322266, 0.0016179084777832031, 0.0025756359100341797, 0.0035333633422851562, 0.004491090774536133, 0.005448818206787109, 0.006406545639038086, 0.0073642730712890625, 0.008322000503540039, 0.009279727935791016, 0.010237455368041992, 0.011195182800292969, 0.012152910232543945, 0.013110637664794922, 0.014068365097045898, 0.015026092529296875, 0.01598381996154785, 0.016941547393798828, 0.017899274826049805, 0.01885700225830078, 0.019814729690551758, 0.020772457122802734, 0.02173018455505371, 0.022687911987304688, 0.023645639419555664, 0.02460336685180664, 0.025561094284057617, 0.026518821716308594, 0.02747654914855957, 0.028434276580810547, 0.029392004013061523, 0.0303497314453125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 7.0, 6.0, 8.0, 7.0, 15.0, 16.0, 17.0, 30.0, 39.0, 49.0, 43.0, 58.0, 95.0, 64.0, 93.0, 65.0, 89.0, 60.0, 54.0, 41.0, 24.0, 27.0, 22.0, 14.0, 10.0, 2.0, 5.0, 7.0, 4.0, 4.0, 7.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004848480224609375, -0.0046749114990234375, -0.0045013427734375, -0.0043277740478515625, -0.004154205322265625, -0.0039806365966796875, -0.00380706787109375, -0.0036334991455078125, -0.003459930419921875, -0.0032863616943359375, -0.00311279296875, -0.0029392242431640625, -0.002765655517578125, -0.0025920867919921875, -0.00241851806640625, -0.0022449493408203125, -0.002071380615234375, -0.0018978118896484375, -0.0017242431640625, -0.0015506744384765625, -0.001377105712890625, -0.0012035369873046875, -0.00102996826171875, -0.0008563995361328125, -0.000682830810546875, -0.0005092620849609375, -0.000335693359375, -0.0001621246337890625, 1.1444091796875e-05, 0.0001850128173828125, 0.00035858154296875, 0.0005321502685546875, 0.000705718994140625, 0.0008792877197265625, 0.0010528564453125, 0.0012264251708984375, 0.001399993896484375, 0.0015735626220703125, 0.00174713134765625, 0.0019207000732421875, 0.002094268798828125, 0.0022678375244140625, 0.00244140625, 0.0026149749755859375, 0.002788543701171875, 0.0029621124267578125, 0.00313568115234375, 0.0033092498779296875, 0.003482818603515625, 0.0036563873291015625, 0.0038299560546875, 0.0040035247802734375, 0.004177093505859375, 0.0043506622314453125, 0.00452423095703125, 0.0046977996826171875, 0.004871368408203125, 0.0050449371337890625, 0.005218505859375, 0.0053920745849609375, 0.005565643310546875, 0.0057392120361328125, 0.00591278076171875, 0.0060863494873046875, 0.006259918212890625]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 7.0, 11.0, 16.0, 45.0, 58.0, 144.0, 171.0, 209.0, 129.0, 73.0, 55.0, 35.0, 18.0, 8.0, 8.0, 4.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42667779326438904, -0.4148869514465332, -0.40309613943099976, -0.3913052976131439, -0.3795144557952881, -0.36772364377975464, -0.3559328019618988, -0.34414196014404297, -0.3323511481285095, -0.3205603063106537, -0.30876949429512024, -0.2969786524772644, -0.28518784046173096, -0.2733969986438751, -0.2616061568260193, -0.24981532990932465, -0.23802450299263, -0.22623367607593536, -0.21444284915924072, -0.2026520073413849, -0.19086118042469025, -0.1790703535079956, -0.16727951169013977, -0.15548868477344513, -0.1436978578567505, -0.13190703094005585, -0.12011619657278061, -0.10832536220550537, -0.09653453528881073, -0.08474370837211609, -0.07295287400484085, -0.06116203963756561, -0.04937121272087097, -0.03758038207888603, -0.025789551436901093, -0.013998720794916153, -0.0022078901529312134, 0.009582940489053726, 0.021373771131038666, 0.033164605498313904, 0.044955432415008545, 0.056746263056993484, 0.06853709369897842, 0.08032792806625366, 0.0921187549829483, 0.10390958189964294, 0.11570041626691818, 0.12749125063419342, 0.13928207755088806, 0.1510729044675827, 0.16286373138427734, 0.17465457320213318, 0.18644540011882782, 0.19823622703552246, 0.2100270688533783, 0.22181789577007294, 0.23360872268676758, 0.24539954960346222, 0.25719037652015686, 0.2689812183380127, 0.28077203035354614, 0.292562872171402, 0.3043537139892578, 0.31614452600479126, 0.3279353678226471]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 4.0, 9.0, 2.0, 5.0, 8.0, 14.0, 11.0, 20.0, 19.0, 30.0, 34.0, 51.0, 42.0, 47.0, 55.0, 53.0, 55.0, 71.0, 59.0, 52.0, 60.0, 56.0, 46.0, 51.0, 35.0, 27.0, 26.0, 15.0, 14.0, 4.0, 7.0, 7.0, 7.0, 8.0, 4.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15987694263458252, -0.15445472300052643, -0.14903250336647034, -0.14361026883125305, -0.13818804919719696, -0.13276582956314087, -0.12734359502792358, -0.12192137539386749, -0.1164991557598114, -0.11107693612575531, -0.10565470904111862, -0.10023248195648193, -0.09481026232242584, -0.08938804268836975, -0.08396581560373306, -0.07854358851909637, -0.07312136888504028, -0.06769914925098419, -0.062276922166347504, -0.056854698807001114, -0.051432475447654724, -0.046010252088308334, -0.040588028728961945, -0.035165805369615555, -0.029743582010269165, -0.024321358650922775, -0.018899135291576385, -0.013476911932229996, -0.008054688572883606, -0.002632465213537216, 0.0027897581458091736, 0.008211981505155563, 0.01363418996334076, 0.01905641332268715, 0.02447863668203354, 0.02990086004137993, 0.03532308340072632, 0.04074530676007271, 0.0461675301194191, 0.05158975347876549, 0.05701197683811188, 0.06243420019745827, 0.06785642355680466, 0.07327865064144135, 0.07870087027549744, 0.08412308990955353, 0.08954531699419022, 0.0949675440788269, 0.100389763712883, 0.10581198334693909, 0.11123421043157578, 0.11665643751621246, 0.12207865715026855, 0.12750087678432465, 0.13292309641838074, 0.13834533095359802, 0.1437675505876541, 0.1491897702217102, 0.1546120047569275, 0.16003422439098358, 0.16545644402503967, 0.17087866365909576, 0.17630088329315186, 0.18172311782836914, 0.18714533746242523]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 7.0, 2.0, 8.0, 3.0, 9.0, 16.0, 19.0, 47.0, 56.0, 98.0, 120.0, 180.0, 252.0, 368.0, 561.0, 863.0, 1337.0, 2078.0, 3264.0, 5380.0, 9599.0, 18808.0, 43497.0, 138106.0, 501233.0, 212344.0, 58422.0, 23396.0, 11487.0, 6459.0, 3699.0, 2334.0, 1545.0, 970.0, 631.0, 425.0, 300.0, 194.0, 131.0, 101.0, 56.0, 53.0, 28.0, 26.0, 20.0, 9.0, 2.0, 7.0, 3.0, 6.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.1549072265625, -0.15030288696289062, -0.14569854736328125, -0.14109420776367188, -0.1364898681640625, -0.13188552856445312, -0.12728118896484375, -0.12267684936523438, -0.118072509765625, -0.11346817016601562, -0.10886383056640625, -0.10425949096679688, -0.0996551513671875, -0.09505081176757812, -0.09044647216796875, -0.08584213256835938, -0.08123779296875, -0.07663345336914062, -0.07202911376953125, -0.06742477416992188, -0.0628204345703125, -0.058216094970703125, -0.05361175537109375, -0.049007415771484375, -0.044403076171875, -0.039798736572265625, -0.03519439697265625, -0.030590057373046875, -0.0259857177734375, -0.021381378173828125, -0.01677703857421875, -0.012172698974609375, -0.007568359375, -0.002964019775390625, 0.00164031982421875, 0.006244659423828125, 0.0108489990234375, 0.015453338623046875, 0.02005767822265625, 0.024662017822265625, 0.029266357421875, 0.033870697021484375, 0.03847503662109375, 0.043079376220703125, 0.0476837158203125, 0.052288055419921875, 0.05689239501953125, 0.061496734619140625, 0.06610107421875, 0.07070541381835938, 0.07530975341796875, 0.07991409301757812, 0.0845184326171875, 0.08912277221679688, 0.09372711181640625, 0.09833145141601562, 0.102935791015625, 0.10754013061523438, 0.11214447021484375, 0.11674880981445312, 0.1213531494140625, 0.12595748901367188, 0.13056182861328125, 0.13516616821289062, 0.1397705078125]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 8.0, 13.0, 30.0, 40.0, 55.0, 67.0, 85.0, 103.0, 117.0, 115.0, 94.0, 86.0, 78.0, 40.0, 42.0, 12.0, 13.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.381591796875, -0.3613548278808594, -0.34111785888671875, -0.3208808898925781, -0.3006439208984375, -0.2804069519042969, -0.26016998291015625, -0.23993301391601562, -0.219696044921875, -0.19945907592773438, -0.17922210693359375, -0.15898513793945312, -0.1387481689453125, -0.11851119995117188, -0.09827423095703125, -0.07803726196289062, -0.05780029296875, -0.037563323974609375, -0.01732635498046875, 0.002910614013671875, 0.0231475830078125, 0.043384552001953125, 0.06362152099609375, 0.08385848999023438, 0.104095458984375, 0.12433242797851562, 0.14456939697265625, 0.16480636596679688, 0.1850433349609375, 0.20528030395507812, 0.22551727294921875, 0.24575424194335938, 0.2659912109375, 0.2862281799316406, 0.30646514892578125, 0.3267021179199219, 0.3469390869140625, 0.3671760559082031, 0.38741302490234375, 0.4076499938964844, 0.427886962890625, 0.4481239318847656, 0.46836090087890625, 0.4885978698730469, 0.5088348388671875, 0.5290718078613281, 0.5493087768554688, 0.5695457458496094, 0.58978271484375, 0.6100196838378906, 0.6302566528320312, 0.6504936218261719, 0.6707305908203125, 0.6909675598144531, 0.7112045288085938, 0.7314414978027344, 0.751678466796875, 0.7719154357910156, 0.7921524047851562, 0.8123893737792969, 0.8326263427734375, 0.8528633117675781, 0.8731002807617188, 0.8933372497558594, 0.91357421875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 7.0, 7.0, 17.0, 11.0, 19.0, 18.0, 26.0, 38.0, 46.0, 64.0, 85.0, 95.0, 131.0, 207.0, 379.0, 973.0, 4717.0, 42419.0, 906391.0, 83161.0, 7188.0, 1283.0, 423.0, 236.0, 129.0, 109.0, 85.0, 63.0, 40.0, 44.0, 28.0, 27.0, 19.0, 11.0, 14.0, 8.0, 12.0, 5.0, 4.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.458251953125, -0.4441986083984375, -0.430145263671875, -0.4160919189453125, -0.40203857421875, -0.3879852294921875, -0.373931884765625, -0.3598785400390625, -0.3458251953125, -0.3317718505859375, -0.317718505859375, -0.3036651611328125, -0.28961181640625, -0.2755584716796875, -0.261505126953125, -0.2474517822265625, -0.2333984375, -0.2193450927734375, -0.205291748046875, -0.1912384033203125, -0.17718505859375, -0.1631317138671875, -0.149078369140625, -0.1350250244140625, -0.1209716796875, -0.1069183349609375, -0.092864990234375, -0.0788116455078125, -0.06475830078125, -0.0507049560546875, -0.036651611328125, -0.0225982666015625, -0.008544921875, 0.0055084228515625, 0.019561767578125, 0.0336151123046875, 0.04766845703125, 0.0617218017578125, 0.075775146484375, 0.0898284912109375, 0.1038818359375, 0.1179351806640625, 0.131988525390625, 0.1460418701171875, 0.16009521484375, 0.1741485595703125, 0.188201904296875, 0.2022552490234375, 0.21630859375, 0.2303619384765625, 0.244415283203125, 0.2584686279296875, 0.27252197265625, 0.2865753173828125, 0.300628662109375, 0.3146820068359375, 0.3287353515625, 0.3427886962890625, 0.356842041015625, 0.3708953857421875, 0.38494873046875, 0.3990020751953125, 0.413055419921875, 0.4271087646484375, 0.441162109375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 4.0, 5.0, 10.0, 5.0, 12.0, 14.0, 16.0, 17.0, 26.0, 27.0, 33.0, 24.0, 42.0, 32.0, 43.0, 51.0, 48.0, 45.0, 51.0, 59.0, 51.0, 41.0, 50.0, 32.0, 41.0, 35.0, 29.0, 31.0, 18.0, 19.0, 18.0, 18.0, 13.0, 6.0, 10.0, 5.0, 6.0, 4.0, 5.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.27978515625, -0.2710380554199219, -0.26229095458984375, -0.2535438537597656, -0.2447967529296875, -0.23604965209960938, -0.22730255126953125, -0.21855545043945312, -0.209808349609375, -0.20106124877929688, -0.19231414794921875, -0.18356704711914062, -0.1748199462890625, -0.16607284545898438, -0.15732574462890625, -0.14857864379882812, -0.13983154296875, -0.13108444213867188, -0.12233734130859375, -0.11359024047851562, -0.1048431396484375, -0.09609603881835938, -0.08734893798828125, -0.07860183715820312, -0.069854736328125, -0.061107635498046875, -0.05236053466796875, -0.043613433837890625, -0.0348663330078125, -0.026119232177734375, -0.01737213134765625, -0.008625030517578125, 0.0001220703125, 0.008869171142578125, 0.01761627197265625, 0.026363372802734375, 0.0351104736328125, 0.043857574462890625, 0.05260467529296875, 0.061351776123046875, 0.070098876953125, 0.07884597778320312, 0.08759307861328125, 0.09634017944335938, 0.1050872802734375, 0.11383438110351562, 0.12258148193359375, 0.13132858276367188, 0.14007568359375, 0.14882278442382812, 0.15756988525390625, 0.16631698608398438, 0.1750640869140625, 0.18381118774414062, 0.19255828857421875, 0.20130538940429688, 0.210052490234375, 0.21879959106445312, 0.22754669189453125, 0.23629379272460938, 0.2450408935546875, 0.2537879943847656, 0.26253509521484375, 0.2712821960449219, 0.280029296875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 6.0, 15.0, 13.0, 16.0, 19.0, 42.0, 56.0, 110.0, 229.0, 523.0, 1566.0, 5718.0, 40438.0, 872883.0, 112799.0, 10338.0, 2406.0, 743.0, 265.0, 155.0, 85.0, 39.0, 33.0, 18.0, 9.0, 4.0, 5.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.1707763671875, -0.16598892211914062, -0.16120147705078125, -0.15641403198242188, -0.1516265869140625, -0.14683914184570312, -0.14205169677734375, -0.13726425170898438, -0.132476806640625, -0.12768936157226562, -0.12290191650390625, -0.11811447143554688, -0.1133270263671875, -0.10853958129882812, -0.10375213623046875, -0.09896469116210938, -0.09417724609375, -0.08938980102539062, -0.08460235595703125, -0.07981491088867188, -0.0750274658203125, -0.07024002075195312, -0.06545257568359375, -0.060665130615234375, -0.055877685546875, -0.051090240478515625, -0.04630279541015625, -0.041515350341796875, -0.0367279052734375, -0.031940460205078125, -0.02715301513671875, -0.022365570068359375, -0.017578125, -0.012790679931640625, -0.00800323486328125, -0.003215789794921875, 0.0015716552734375, 0.006359100341796875, 0.01114654541015625, 0.015933990478515625, 0.020721435546875, 0.025508880615234375, 0.03029632568359375, 0.035083770751953125, 0.0398712158203125, 0.044658660888671875, 0.04944610595703125, 0.054233551025390625, 0.05902099609375, 0.06380844116210938, 0.06859588623046875, 0.07338333129882812, 0.0781707763671875, 0.08295822143554688, 0.08774566650390625, 0.09253311157226562, 0.097320556640625, 0.10210800170898438, 0.10689544677734375, 0.11168289184570312, 0.1164703369140625, 0.12125778198242188, 0.12604522705078125, 0.13083267211914062, 0.1356201171875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 2.0, 3.0, 14.0, 10.0, 19.0, 31.0, 28.0, 48.0, 74.0, 88.0, 167.0, 170.0, 97.0, 64.0, 59.0, 25.0, 23.0, 25.0, 11.0, 10.0, 5.0, 7.0, 5.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5616416931152344e-05, -1.5128403902053833e-05, -1.4640390872955322e-05, -1.4152377843856812e-05, -1.36643648147583e-05, -1.317635178565979e-05, -1.268833875656128e-05, -1.2200325727462769e-05, -1.1712312698364258e-05, -1.1224299669265747e-05, -1.0736286640167236e-05, -1.0248273611068726e-05, -9.760260581970215e-06, -9.272247552871704e-06, -8.784234523773193e-06, -8.296221494674683e-06, -7.808208465576172e-06, -7.320195436477661e-06, -6.83218240737915e-06, -6.34416937828064e-06, -5.856156349182129e-06, -5.368143320083618e-06, -4.880130290985107e-06, -4.392117261886597e-06, -3.904104232788086e-06, -3.416091203689575e-06, -2.9280781745910645e-06, -2.4400651454925537e-06, -1.952052116394043e-06, -1.4640390872955322e-06, -9.760260581970215e-07, -4.880130290985107e-07, 0.0, 4.880130290985107e-07, 9.760260581970215e-07, 1.4640390872955322e-06, 1.952052116394043e-06, 2.4400651454925537e-06, 2.9280781745910645e-06, 3.416091203689575e-06, 3.904104232788086e-06, 4.392117261886597e-06, 4.880130290985107e-06, 5.368143320083618e-06, 5.856156349182129e-06, 6.34416937828064e-06, 6.83218240737915e-06, 7.320195436477661e-06, 7.808208465576172e-06, 8.296221494674683e-06, 8.784234523773193e-06, 9.272247552871704e-06, 9.760260581970215e-06, 1.0248273611068726e-05, 1.0736286640167236e-05, 1.1224299669265747e-05, 1.1712312698364258e-05, 1.2200325727462769e-05, 1.268833875656128e-05, 1.317635178565979e-05, 1.36643648147583e-05, 1.4152377843856812e-05, 1.4640390872955322e-05, 1.5128403902053833e-05, 1.5616416931152344e-05]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 6.0, 2.0, 8.0, 4.0, 7.0, 10.0, 17.0, 23.0, 30.0, 25.0, 54.0, 90.0, 150.0, 351.0, 1019.0, 3974.0, 26115.0, 905590.0, 100095.0, 8219.0, 1714.0, 549.0, 203.0, 88.0, 60.0, 38.0, 27.0, 17.0, 14.0, 14.0, 8.0, 5.0, 8.0, 8.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1922607421875, -0.18556594848632812, -0.17887115478515625, -0.17217636108398438, -0.1654815673828125, -0.15878677368164062, -0.15209197998046875, -0.14539718627929688, -0.138702392578125, -0.13200759887695312, -0.12531280517578125, -0.11861801147460938, -0.1119232177734375, -0.10522842407226562, -0.09853363037109375, -0.09183883666992188, -0.08514404296875, -0.07844924926757812, -0.07175445556640625, -0.06505966186523438, -0.0583648681640625, -0.051670074462890625, -0.04497528076171875, -0.038280487060546875, -0.031585693359375, -0.024890899658203125, -0.01819610595703125, -0.011501312255859375, -0.0048065185546875, 0.001888275146484375, 0.00858306884765625, 0.015277862548828125, 0.02197265625, 0.028667449951171875, 0.03536224365234375, 0.042057037353515625, 0.0487518310546875, 0.055446624755859375, 0.06214141845703125, 0.06883621215820312, 0.075531005859375, 0.08222579956054688, 0.08892059326171875, 0.09561538696289062, 0.1023101806640625, 0.10900497436523438, 0.11569976806640625, 0.12239456176757812, 0.12908935546875, 0.13578414916992188, 0.14247894287109375, 0.14917373657226562, 0.1558685302734375, 0.16256332397460938, 0.16925811767578125, 0.17595291137695312, 0.182647705078125, 0.18934249877929688, 0.19603729248046875, 0.20273208618164062, 0.2094268798828125, 0.21612167358398438, 0.22281646728515625, 0.22951126098632812, 0.2362060546875]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 2.0, 2.0, 4.0, 3.0, 5.0, 7.0, 6.0, 9.0, 9.0, 14.0, 12.0, 34.0, 48.0, 80.0, 123.0, 166.0, 156.0, 98.0, 60.0, 38.0, 28.0, 21.0, 17.0, 14.0, 7.0, 8.0, 7.0, 4.0, 6.0, 4.0, 0.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048309326171875, -0.046781063079833984, -0.04525279998779297, -0.04372453689575195, -0.04219627380371094, -0.04066801071166992, -0.039139747619628906, -0.03761148452758789, -0.036083221435546875, -0.03455495834350586, -0.033026695251464844, -0.03149843215942383, -0.029970169067382812, -0.028441905975341797, -0.02691364288330078, -0.025385379791259766, -0.02385711669921875, -0.022328853607177734, -0.02080059051513672, -0.019272327423095703, -0.017744064331054688, -0.016215801239013672, -0.014687538146972656, -0.01315927505493164, -0.011631011962890625, -0.01010274887084961, -0.008574485778808594, -0.007046222686767578, -0.0055179595947265625, -0.003989696502685547, -0.0024614334106445312, -0.0009331703186035156, 0.0005950927734375, 0.0021233558654785156, 0.0036516189575195312, 0.005179882049560547, 0.0067081451416015625, 0.008236408233642578, 0.009764671325683594, 0.01129293441772461, 0.012821197509765625, 0.01434946060180664, 0.015877723693847656, 0.017405986785888672, 0.018934249877929688, 0.020462512969970703, 0.02199077606201172, 0.023519039154052734, 0.02504730224609375, 0.026575565338134766, 0.02810382843017578, 0.029632091522216797, 0.031160354614257812, 0.03268861770629883, 0.034216880798339844, 0.03574514389038086, 0.037273406982421875, 0.03880167007446289, 0.040329933166503906, 0.04185819625854492, 0.04338645935058594, 0.04491472244262695, 0.04644298553466797, 0.047971248626708984, 0.04949951171875]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 6.0, 8.0, 18.0, 53.0, 95.0, 233.0, 290.0, 167.0, 77.0, 31.0, 15.0, 9.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5648092031478882, -1.530989170074463, -1.497169017791748, -1.4633489847183228, -1.429528832435608, -1.3957087993621826, -1.3618886470794678, -1.3280686140060425, -1.2942485809326172, -1.260428547859192, -1.226608395576477, -1.1927883625030518, -1.158968210220337, -1.1251481771469116, -1.0913281440734863, -1.0575079917907715, -1.0236878395080566, -0.9898677468299866, -0.9560476541519165, -0.9222276210784912, -0.8884075284004211, -0.8545874357223511, -0.820767343044281, -0.7869472503662109, -0.7531272172927856, -0.7193071246147156, -0.6854870319366455, -0.6516669988632202, -0.6178469061851501, -0.5840268135070801, -0.55020672082901, -0.5163866281509399, -0.48256659507751465, -0.4487465023994446, -0.4149264395236969, -0.38110634684562683, -0.34728628396987915, -0.3134661912918091, -0.279646098613739, -0.24582602083683014, -0.21200594305992126, -0.1781858652830124, -0.14436578750610352, -0.11054569482803345, -0.07672561705112457, -0.0429055392742157, -0.00908544659614563, 0.024734631180763245, 0.05855470895767212, 0.092374786734581, 0.12619486451148987, 0.16001495718955994, 0.1938350349664688, 0.22765511274337769, 0.26147520542144775, 0.2952952980995178, 0.3291153609752655, 0.36293545365333557, 0.39675551652908325, 0.4305756092071533, 0.4643957018852234, 0.49821576476097107, 0.5320358276367188, 0.5658559203147888, 0.5996760129928589]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 6.0, 8.0, 13.0, 24.0, 22.0, 43.0, 54.0, 44.0, 44.0, 74.0, 67.0, 67.0, 70.0, 63.0, 74.0, 58.0, 55.0, 51.0, 37.0, 29.0, 25.0, 18.0, 22.0, 11.0, 8.0, 6.0, 6.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.49517568945884705, -0.47226420044898987, -0.4493526816368103, -0.4264411926269531, -0.40352967381477356, -0.3806181848049164, -0.3577066659927368, -0.33479517698287964, -0.31188368797302246, -0.2889721989631653, -0.2660606801509857, -0.24314919114112854, -0.22023767232894897, -0.1973261833190918, -0.17441467940807343, -0.15150317549705505, -0.1285916566848755, -0.10568015277385712, -0.08276864886283875, -0.05985715240240097, -0.0369456484913826, -0.014034144580364227, 0.008877351880073547, 0.03178885579109192, 0.05470035970211029, 0.07761186361312866, 0.10052336752414703, 0.12343486398458481, 0.14634636044502258, 0.16925787925720215, 0.19216936826705933, 0.2150808721780777, 0.23799240589141846, 0.26090389490127563, 0.2838154137134552, 0.3067269027233124, 0.32963842153549194, 0.3525499105453491, 0.3754613995552063, 0.39837291836738586, 0.42128443717956543, 0.4441959261894226, 0.4671074450016022, 0.49001893401145935, 0.5129304528236389, 0.5358419418334961, 0.5587534308433533, 0.5816649198532104, 0.6045764684677124, 0.6274879574775696, 0.6503994464874268, 0.6733109951019287, 0.6962224841117859, 0.7191339731216431, 0.7420454621315002, 0.7649569511413574, 0.7878684401512146, 0.8107799291610718, 0.833691418170929, 0.8566029667854309, 0.8795144557952881, 0.9024259448051453, 0.9253374338150024, 0.9482489824295044, 0.9711604714393616]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 11.0, 7.0, 10.0, 14.0, 23.0, 25.0, 37.0, 45.0, 88.0, 129.0, 172.0, 248.0, 367.0, 560.0, 911.0, 1515.0, 2492.0, 4735.0, 9707.0, 30600.0, 250841.0, 2427804.0, 1311144.0, 115765.0, 20135.0, 7778.0, 3837.0, 1991.0, 1164.0, 712.0, 478.0, 314.0, 185.0, 128.0, 91.0, 59.0, 45.0, 27.0, 25.0, 16.0, 7.0, 10.0, 6.0, 11.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.2822265625, -0.2736320495605469, -0.26503753662109375, -0.2564430236816406, -0.2478485107421875, -0.23925399780273438, -0.23065948486328125, -0.22206497192382812, -0.213470458984375, -0.20487594604492188, -0.19628143310546875, -0.18768692016601562, -0.1790924072265625, -0.17049789428710938, -0.16190338134765625, -0.15330886840820312, -0.14471435546875, -0.13611984252929688, -0.12752532958984375, -0.11893081665039062, -0.1103363037109375, -0.10174179077148438, -0.09314727783203125, -0.08455276489257812, -0.075958251953125, -0.06736373901367188, -0.05876922607421875, -0.050174713134765625, -0.0415802001953125, -0.032985687255859375, -0.02439117431640625, -0.015796661376953125, -0.0072021484375, 0.001392364501953125, 0.00998687744140625, 0.018581390380859375, 0.0271759033203125, 0.035770416259765625, 0.04436492919921875, 0.052959442138671875, 0.061553955078125, 0.07014846801757812, 0.07874298095703125, 0.08733749389648438, 0.0959320068359375, 0.10452651977539062, 0.11312103271484375, 0.12171554565429688, 0.13031005859375, 0.13890457153320312, 0.14749908447265625, 0.15609359741210938, 0.1646881103515625, 0.17328262329101562, 0.18187713623046875, 0.19047164916992188, 0.199066162109375, 0.20766067504882812, 0.21625518798828125, 0.22484970092773438, 0.2334442138671875, 0.24203872680664062, 0.25063323974609375, 0.2592277526855469, 0.267822265625]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 6.0, 4.0, 5.0, 15.0, 8.0, 22.0, 14.0, 18.0, 36.0, 44.0, 49.0, 45.0, 44.0, 53.0, 56.0, 47.0, 62.0, 65.0, 47.0, 49.0, 51.0, 35.0, 39.0, 40.0, 26.0, 26.0, 23.0, 18.0, 15.0, 11.0, 10.0, 6.0, 9.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.2568359375, -0.2503662109375, -0.243896484375, -0.2374267578125, -0.23095703125, -0.2244873046875, -0.218017578125, -0.2115478515625, -0.205078125, -0.1986083984375, -0.192138671875, -0.1856689453125, -0.17919921875, -0.1727294921875, -0.166259765625, -0.1597900390625, -0.1533203125, -0.1468505859375, -0.140380859375, -0.1339111328125, -0.12744140625, -0.1209716796875, -0.114501953125, -0.1080322265625, -0.1015625, -0.0950927734375, -0.088623046875, -0.0821533203125, -0.07568359375, -0.0692138671875, -0.062744140625, -0.0562744140625, -0.0498046875, -0.0433349609375, -0.036865234375, -0.0303955078125, -0.02392578125, -0.0174560546875, -0.010986328125, -0.0045166015625, 0.001953125, 0.0084228515625, 0.014892578125, 0.0213623046875, 0.02783203125, 0.0343017578125, 0.040771484375, 0.0472412109375, 0.0537109375, 0.0601806640625, 0.066650390625, 0.0731201171875, 0.07958984375, 0.0860595703125, 0.092529296875, 0.0989990234375, 0.10546875, 0.1119384765625, 0.118408203125, 0.1248779296875, 0.13134765625, 0.1378173828125, 0.144287109375, 0.1507568359375, 0.1572265625]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 5.0, 3.0, 12.0, 13.0, 13.0, 16.0, 23.0, 28.0, 46.0, 62.0, 127.0, 305.0, 961.0, 5287.0, 94076.0, 4050887.0, 37992.0, 3259.0, 674.0, 225.0, 85.0, 62.0, 35.0, 20.0, 15.0, 7.0, 11.0, 9.0, 7.0, 6.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74169921875, -0.7187957763671875, -0.695892333984375, -0.6729888916015625, -0.65008544921875, -0.6271820068359375, -0.604278564453125, -0.5813751220703125, -0.5584716796875, -0.5355682373046875, -0.512664794921875, -0.4897613525390625, -0.46685791015625, -0.4439544677734375, -0.421051025390625, -0.3981475830078125, -0.375244140625, -0.3523406982421875, -0.329437255859375, -0.3065338134765625, -0.28363037109375, -0.2607269287109375, -0.237823486328125, -0.2149200439453125, -0.1920166015625, -0.1691131591796875, -0.146209716796875, -0.1233062744140625, -0.10040283203125, -0.0774993896484375, -0.054595947265625, -0.0316925048828125, -0.0087890625, 0.0141143798828125, 0.037017822265625, 0.0599212646484375, 0.08282470703125, 0.1057281494140625, 0.128631591796875, 0.1515350341796875, 0.1744384765625, 0.1973419189453125, 0.220245361328125, 0.2431488037109375, 0.26605224609375, 0.2889556884765625, 0.311859130859375, 0.3347625732421875, 0.357666015625, 0.3805694580078125, 0.403472900390625, 0.4263763427734375, 0.44927978515625, 0.4721832275390625, 0.495086669921875, 0.5179901123046875, 0.5408935546875, 0.5637969970703125, 0.586700439453125, 0.6096038818359375, 0.63250732421875, 0.6554107666015625, 0.678314208984375, 0.7012176513671875, 0.72412109375]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 5.0, 6.0, 8.0, 7.0, 14.0, 11.0, 17.0, 25.0, 47.0, 61.0, 99.0, 186.0, 338.0, 566.0, 898.0, 687.0, 468.0, 209.0, 142.0, 70.0, 42.0, 32.0, 33.0, 20.0, 12.0, 19.0, 11.0, 12.0, 5.0, 1.0, 9.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08184814453125, -0.07934188842773438, -0.07683563232421875, -0.07432937622070312, -0.0718231201171875, -0.06931686401367188, -0.06681060791015625, -0.06430435180664062, -0.061798095703125, -0.059291839599609375, -0.05678558349609375, -0.054279327392578125, -0.0517730712890625, -0.049266815185546875, -0.04676055908203125, -0.044254302978515625, -0.041748046875, -0.039241790771484375, -0.03673553466796875, -0.034229278564453125, -0.0317230224609375, -0.029216766357421875, -0.02671051025390625, -0.024204254150390625, -0.021697998046875, -0.019191741943359375, -0.01668548583984375, -0.014179229736328125, -0.0116729736328125, -0.009166717529296875, -0.00666046142578125, -0.004154205322265625, -0.00164794921875, 0.000858306884765625, 0.00336456298828125, 0.005870819091796875, 0.0083770751953125, 0.010883331298828125, 0.01338958740234375, 0.015895843505859375, 0.018402099609375, 0.020908355712890625, 0.02341461181640625, 0.025920867919921875, 0.0284271240234375, 0.030933380126953125, 0.03343963623046875, 0.035945892333984375, 0.0384521484375, 0.040958404541015625, 0.04346466064453125, 0.045970916748046875, 0.0484771728515625, 0.050983428955078125, 0.05348968505859375, 0.055995941162109375, 0.058502197265625, 0.061008453369140625, 0.06351470947265625, 0.06602096557617188, 0.0685272216796875, 0.07103347778320312, 0.07353973388671875, 0.07604598999023438, 0.07855224609375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 8.0, 5.0, 8.0, 16.0, 16.0, 15.0, 28.0, 50.0, 93.0, 134.0, 174.0, 158.0, 97.0, 75.0, 49.0, 28.0, 18.0, 9.0, 9.0, 9.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45745858550071716, -0.4438287913799286, -0.43019899725914, -0.41656923294067383, -0.40293943881988525, -0.3893096446990967, -0.3756798505783081, -0.36205005645751953, -0.34842029213905334, -0.33479049801826477, -0.3211607038974762, -0.30753093957901, -0.29390114545822144, -0.28027135133743286, -0.2666415572166443, -0.2530117630958557, -0.23938198387622833, -0.22575218975543976, -0.21212241053581238, -0.1984926164150238, -0.18486283719539642, -0.17123304307460785, -0.15760326385498047, -0.1439734697341919, -0.13034367561340332, -0.11671388894319534, -0.10308410227298737, -0.08945430815219879, -0.07582452893257141, -0.06219473481178284, -0.04856494814157486, -0.03493516147136688, -0.021305382251739502, -0.00767559465020895, 0.005954192951321602, 0.01958398148417473, 0.033213768154382706, 0.04684355854988098, 0.06047334522008896, 0.07410313189029694, 0.08773291856050491, 0.10136270523071289, 0.11499249190092087, 0.12862227857112885, 0.14225207269191742, 0.1558818519115448, 0.16951164603233337, 0.18314144015312195, 0.19677121937274933, 0.2104010134935379, 0.22403079271316528, 0.23766058683395386, 0.25129038095474243, 0.264920175075531, 0.2785499393939972, 0.29217973351478577, 0.30580952763557434, 0.3194393217563629, 0.3330691158771515, 0.3466988801956177, 0.36032867431640625, 0.3739584684371948, 0.3875882625579834, 0.401218056678772, 0.41484782099723816]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 9.0, 13.0, 9.0, 20.0, 16.0, 20.0, 18.0, 23.0, 33.0, 46.0, 35.0, 46.0, 59.0, 57.0, 39.0, 37.0, 47.0, 40.0, 44.0, 49.0, 54.0, 42.0, 35.0, 36.0, 29.0, 32.0, 26.0, 18.0, 18.0, 16.0, 9.0, 10.0, 4.0, 5.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.21785898506641388, -0.21156637370586395, -0.20527376234531403, -0.1989811509847641, -0.19268853962421417, -0.18639592826366425, -0.18010330200195312, -0.1738106906414032, -0.16751807928085327, -0.16122546792030334, -0.15493285655975342, -0.1486402451992035, -0.14234763383865356, -0.13605502247810364, -0.1297624111175537, -0.12346979230642319, -0.11717718839645386, -0.11088457703590393, -0.104591965675354, -0.09829935431480408, -0.09200674295425415, -0.08571413159370422, -0.0794215127825737, -0.07312890142202377, -0.06683629006147385, -0.06054367870092392, -0.05425106734037399, -0.04795845225453377, -0.04166584089398384, -0.035373229533433914, -0.02908061444759369, -0.022788003087043762, -0.01649537682533264, -0.01020276453346014, -0.003910152241587639, 0.002382460981607437, 0.008675072342157364, 0.01496768370270729, 0.021260298788547516, 0.027552910149097443, 0.03384552150964737, 0.040138132870197296, 0.04643074423074722, 0.05272335931658745, 0.059015970677137375, 0.0653085857629776, 0.07160119712352753, 0.07789380848407745, 0.08418641984462738, 0.09047903120517731, 0.09677164256572723, 0.10306425392627716, 0.10935686528682709, 0.11564947664737701, 0.12194209545850754, 0.12823471426963806, 0.134527325630188, 0.14081993699073792, 0.14711254835128784, 0.15340515971183777, 0.1596977710723877, 0.16599038243293762, 0.17228299379348755, 0.17857560515403748, 0.1848682165145874]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 6.0, 1.0, 3.0, 4.0, 4.0, 4.0, 5.0, 3.0, 7.0, 9.0, 28.0, 21.0, 38.0, 57.0, 64.0, 111.0, 196.0, 266.0, 501.0, 868.0, 1529.0, 2752.0, 5301.0, 12075.0, 41414.0, 328998.0, 560613.0, 64244.0, 15599.0, 6316.0, 3206.0, 1718.0, 1012.0, 612.0, 328.0, 211.0, 139.0, 92.0, 74.0, 35.0, 25.0, 19.0, 7.0, 8.0, 5.0, 4.0, 8.0, 7.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.08587646484375, -0.08328437805175781, -0.08069229125976562, -0.07810020446777344, -0.07550811767578125, -0.07291603088378906, -0.07032394409179688, -0.06773185729980469, -0.0651397705078125, -0.06254768371582031, -0.059955596923828125, -0.05736351013183594, -0.05477142333984375, -0.05217933654785156, -0.049587249755859375, -0.04699516296386719, -0.044403076171875, -0.04181098937988281, -0.039218902587890625, -0.03662681579589844, -0.03403472900390625, -0.03144264221191406, -0.028850555419921875, -0.026258468627929688, -0.0236663818359375, -0.021074295043945312, -0.018482208251953125, -0.015890121459960938, -0.01329803466796875, -0.010705947875976562, -0.008113861083984375, -0.0055217742919921875, -0.0029296875, -0.0003376007080078125, 0.002254486083984375, 0.0048465728759765625, 0.00743865966796875, 0.010030746459960938, 0.012622833251953125, 0.015214920043945312, 0.0178070068359375, 0.020399093627929688, 0.022991180419921875, 0.025583267211914062, 0.02817535400390625, 0.030767440795898438, 0.033359527587890625, 0.03595161437988281, 0.038543701171875, 0.04113578796386719, 0.043727874755859375, 0.04631996154785156, 0.04891204833984375, 0.05150413513183594, 0.054096221923828125, 0.05668830871582031, 0.0592803955078125, 0.06187248229980469, 0.06446456909179688, 0.06705665588378906, 0.06964874267578125, 0.07224082946777344, 0.07483291625976562, 0.07742500305175781, 0.08001708984375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 6.0, 4.0, 8.0, 11.0, 21.0, 17.0, 24.0, 30.0, 37.0, 44.0, 54.0, 58.0, 69.0, 62.0, 64.0, 66.0, 61.0, 64.0, 60.0, 62.0, 42.0, 38.0, 25.0, 28.0, 19.0, 12.0, 9.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1717529296875, -0.16596031188964844, -0.16016769409179688, -0.1543750762939453, -0.14858245849609375, -0.1427898406982422, -0.13699722290039062, -0.13120460510253906, -0.1254119873046875, -0.11961936950683594, -0.11382675170898438, -0.10803413391113281, -0.10224151611328125, -0.09644889831542969, -0.09065628051757812, -0.08486366271972656, -0.079071044921875, -0.07327842712402344, -0.06748580932617188, -0.06169319152832031, -0.05590057373046875, -0.05010795593261719, -0.044315338134765625, -0.03852272033691406, -0.0327301025390625, -0.026937484741210938, -0.021144866943359375, -0.015352249145507812, -0.00955963134765625, -0.0037670135498046875, 0.002025604248046875, 0.007818222045898438, 0.01361083984375, 0.019403457641601562, 0.025196075439453125, 0.030988693237304688, 0.03678131103515625, 0.04257392883300781, 0.048366546630859375, 0.05415916442871094, 0.0599517822265625, 0.06574440002441406, 0.07153701782226562, 0.07732963562011719, 0.08312225341796875, 0.08891487121582031, 0.09470748901367188, 0.10050010681152344, 0.106292724609375, 0.11208534240722656, 0.11787796020507812, 0.12367057800292969, 0.12946319580078125, 0.1352558135986328, 0.14104843139648438, 0.14684104919433594, 0.1526336669921875, 0.15842628479003906, 0.16421890258789062, 0.1700115203857422, 0.17580413818359375, 0.1815967559814453, 0.18738937377929688, 0.19318199157714844, 0.198974609375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 2.0, 5.0, 7.0, 15.0, 10.0, 26.0, 40.0, 56.0, 107.0, 233.0, 532.0, 1370.0, 4996.0, 25992.0, 579441.0, 408577.0, 20509.0, 4315.0, 1354.0, 478.0, 219.0, 94.0, 44.0, 32.0, 29.0, 16.0, 13.0, 4.0, 4.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.127685546875, -0.123809814453125, -0.11993408203125, -0.116058349609375, -0.1121826171875, -0.108306884765625, -0.10443115234375, -0.100555419921875, -0.0966796875, -0.092803955078125, -0.08892822265625, -0.085052490234375, -0.0811767578125, -0.077301025390625, -0.07342529296875, -0.069549560546875, -0.065673828125, -0.061798095703125, -0.05792236328125, -0.054046630859375, -0.0501708984375, -0.046295166015625, -0.04241943359375, -0.038543701171875, -0.03466796875, -0.030792236328125, -0.02691650390625, -0.023040771484375, -0.0191650390625, -0.015289306640625, -0.01141357421875, -0.007537841796875, -0.003662109375, 0.000213623046875, 0.00408935546875, 0.007965087890625, 0.0118408203125, 0.015716552734375, 0.01959228515625, 0.023468017578125, 0.02734375, 0.031219482421875, 0.03509521484375, 0.038970947265625, 0.0428466796875, 0.046722412109375, 0.05059814453125, 0.054473876953125, 0.058349609375, 0.062225341796875, 0.06610107421875, 0.069976806640625, 0.0738525390625, 0.077728271484375, 0.08160400390625, 0.085479736328125, 0.08935546875, 0.093231201171875, 0.09710693359375, 0.100982666015625, 0.1048583984375, 0.108734130859375, 0.11260986328125, 0.116485595703125, 0.120361328125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 3.0, 9.0, 5.0, 10.0, 14.0, 11.0, 17.0, 17.0, 20.0, 25.0, 31.0, 24.0, 32.0, 34.0, 30.0, 45.0, 40.0, 54.0, 43.0, 52.0, 36.0, 41.0, 40.0, 38.0, 40.0, 34.0, 32.0, 32.0, 29.0, 20.0, 24.0, 21.0, 18.0, 17.0, 11.0, 16.0, 8.0, 8.0, 4.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.274658203125, -0.26700592041015625, -0.2593536376953125, -0.25170135498046875, -0.244049072265625, -0.23639678955078125, -0.2287445068359375, -0.22109222412109375, -0.21343994140625, -0.20578765869140625, -0.1981353759765625, -0.19048309326171875, -0.182830810546875, -0.17517852783203125, -0.1675262451171875, -0.15987396240234375, -0.1522216796875, -0.14456939697265625, -0.1369171142578125, -0.12926483154296875, -0.121612548828125, -0.11396026611328125, -0.1063079833984375, -0.09865570068359375, -0.09100341796875, -0.08335113525390625, -0.0756988525390625, -0.06804656982421875, -0.060394287109375, -0.05274200439453125, -0.0450897216796875, -0.03743743896484375, -0.02978515625, -0.02213287353515625, -0.0144805908203125, -0.00682830810546875, 0.000823974609375, 0.00847625732421875, 0.0161285400390625, 0.02378082275390625, 0.03143310546875, 0.03908538818359375, 0.0467376708984375, 0.05438995361328125, 0.062042236328125, 0.06969451904296875, 0.0773468017578125, 0.08499908447265625, 0.0926513671875, 0.10030364990234375, 0.1079559326171875, 0.11560821533203125, 0.123260498046875, 0.13091278076171875, 0.1385650634765625, 0.14621734619140625, 0.15386962890625, 0.16152191162109375, 0.1691741943359375, 0.17682647705078125, 0.184478759765625, 0.19213104248046875, 0.1997833251953125, 0.20743560791015625, 0.215087890625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 6.0, 12.0, 15.0, 16.0, 26.0, 36.0, 54.0, 128.0, 256.0, 606.0, 1897.0, 8058.0, 63085.0, 756528.0, 195760.0, 17067.0, 3280.0, 983.0, 327.0, 178.0, 76.0, 61.0, 34.0, 22.0, 6.0, 15.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0298309326171875, -0.028826475143432617, -0.027822017669677734, -0.02681756019592285, -0.02581310272216797, -0.024808645248413086, -0.023804187774658203, -0.02279973030090332, -0.021795272827148438, -0.020790815353393555, -0.019786357879638672, -0.01878190040588379, -0.017777442932128906, -0.016772985458374023, -0.01576852798461914, -0.014764070510864258, -0.013759613037109375, -0.012755155563354492, -0.01175069808959961, -0.010746240615844727, -0.009741783142089844, -0.008737325668334961, -0.007732868194580078, -0.006728410720825195, -0.0057239532470703125, -0.00471949577331543, -0.003715038299560547, -0.002710580825805664, -0.0017061233520507812, -0.0007016658782958984, 0.0003027915954589844, 0.0013072490692138672, 0.00231170654296875, 0.003316164016723633, 0.004320621490478516, 0.0053250789642333984, 0.006329536437988281, 0.007333993911743164, 0.008338451385498047, 0.00934290885925293, 0.010347366333007812, 0.011351823806762695, 0.012356281280517578, 0.013360738754272461, 0.014365196228027344, 0.015369653701782227, 0.01637411117553711, 0.017378568649291992, 0.018383026123046875, 0.019387483596801758, 0.02039194107055664, 0.021396398544311523, 0.022400856018066406, 0.02340531349182129, 0.024409770965576172, 0.025414228439331055, 0.026418685913085938, 0.02742314338684082, 0.028427600860595703, 0.029432058334350586, 0.03043651580810547, 0.03144097328186035, 0.032445430755615234, 0.03344988822937012, 0.034454345703125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 6.0, 6.0, 11.0, 13.0, 34.0, 48.0, 68.0, 96.0, 154.0, 133.0, 117.0, 87.0, 87.0, 58.0, 29.0, 21.0, 14.0, 10.0, 9.0, 2.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8835067749023438e-05, -1.840386539697647e-05, -1.7972663044929504e-05, -1.7541460692882538e-05, -1.711025834083557e-05, -1.6679055988788605e-05, -1.6247853636741638e-05, -1.581665128469467e-05, -1.5385448932647705e-05, -1.4954246580600739e-05, -1.4523044228553772e-05, -1.4091841876506805e-05, -1.3660639524459839e-05, -1.3229437172412872e-05, -1.2798234820365906e-05, -1.236703246831894e-05, -1.1935830116271973e-05, -1.1504627764225006e-05, -1.107342541217804e-05, -1.0642223060131073e-05, -1.0211020708084106e-05, -9.77981835603714e-06, -9.348616003990173e-06, -8.917413651943207e-06, -8.48621129989624e-06, -8.055008947849274e-06, -7.623806595802307e-06, -7.1926042437553406e-06, -6.761401891708374e-06, -6.3301995396614075e-06, -5.898997187614441e-06, -5.467794835567474e-06, -5.036592483520508e-06, -4.605390131473541e-06, -4.174187779426575e-06, -3.742985427379608e-06, -3.3117830753326416e-06, -2.880580723285675e-06, -2.4493783712387085e-06, -2.018176019191742e-06, -1.5869736671447754e-06, -1.1557713150978088e-06, -7.245689630508423e-07, -2.9336661100387573e-07, 1.3783574104309082e-07, 5.690380930900574e-07, 1.000240445137024e-06, 1.4314427971839905e-06, 1.862645149230957e-06, 2.2938475012779236e-06, 2.72504985332489e-06, 3.1562522053718567e-06, 3.5874545574188232e-06, 4.01865690946579e-06, 4.449859261512756e-06, 4.881061613559723e-06, 5.3122639656066895e-06, 5.743466317653656e-06, 6.1746686697006226e-06, 6.605871021747589e-06, 7.037073373794556e-06, 7.468275725841522e-06, 7.899478077888489e-06, 8.330680429935455e-06, 8.761882781982422e-06]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 5.0, 6.0, 20.0, 25.0, 43.0, 77.0, 130.0, 265.0, 830.0, 3275.0, 22470.0, 565842.0, 433139.0, 18371.0, 2686.0, 713.0, 285.0, 142.0, 90.0, 55.0, 29.0, 23.0, 16.0, 8.0, 5.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.05169677734375, -0.050464630126953125, -0.04923248291015625, -0.048000335693359375, -0.0467681884765625, -0.045536041259765625, -0.04430389404296875, -0.043071746826171875, -0.041839599609375, -0.040607452392578125, -0.03937530517578125, -0.038143157958984375, -0.0369110107421875, -0.035678863525390625, -0.03444671630859375, -0.033214569091796875, -0.031982421875, -0.030750274658203125, -0.02951812744140625, -0.028285980224609375, -0.0270538330078125, -0.025821685791015625, -0.02458953857421875, -0.023357391357421875, -0.022125244140625, -0.020893096923828125, -0.01966094970703125, -0.018428802490234375, -0.0171966552734375, -0.015964508056640625, -0.01473236083984375, -0.013500213623046875, -0.01226806640625, -0.011035919189453125, -0.00980377197265625, -0.008571624755859375, -0.0073394775390625, -0.006107330322265625, -0.00487518310546875, -0.003643035888671875, -0.002410888671875, -0.001178741455078125, 5.340576171875e-05, 0.001285552978515625, 0.0025177001953125, 0.003749847412109375, 0.00498199462890625, 0.006214141845703125, 0.0074462890625, 0.008678436279296875, 0.00991058349609375, 0.011142730712890625, 0.0123748779296875, 0.013607025146484375, 0.01483917236328125, 0.016071319580078125, 0.017303466796875, 0.018535614013671875, 0.01976776123046875, 0.020999908447265625, 0.0222320556640625, 0.023464202880859375, 0.02469635009765625, 0.025928497314453125, 0.02716064453125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 4.0, 15.0, 12.0, 23.0, 30.0, 46.0, 63.0, 109.0, 151.0, 143.0, 122.0, 97.0, 66.0, 36.0, 27.0, 26.0, 16.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.005329132080078125, -0.005089461803436279, -0.004849791526794434, -0.004610121250152588, -0.004370450973510742, -0.0041307806968688965, -0.0038911104202270508, -0.003651440143585205, -0.0034117698669433594, -0.0031720995903015137, -0.002932429313659668, -0.0026927590370178223, -0.0024530887603759766, -0.002213418483734131, -0.001973748207092285, -0.0017340779304504395, -0.0014944076538085938, -0.001254737377166748, -0.0010150671005249023, -0.0007753968238830566, -0.0005357265472412109, -0.00029605627059936523, -5.638599395751953e-05, 0.00018328428268432617, 0.0004229545593261719, 0.0006626248359680176, 0.0009022951126098633, 0.001141965389251709, 0.0013816356658935547, 0.0016213059425354004, 0.001860976219177246, 0.002100646495819092, 0.0023403167724609375, 0.002579987049102783, 0.002819657325744629, 0.0030593276023864746, 0.0032989978790283203, 0.003538668155670166, 0.0037783384323120117, 0.004018008708953857, 0.004257678985595703, 0.004497349262237549, 0.0047370195388793945, 0.00497668981552124, 0.005216360092163086, 0.005456030368804932, 0.005695700645446777, 0.005935370922088623, 0.006175041198730469, 0.0064147114753723145, 0.00665438175201416, 0.006894052028656006, 0.0071337223052978516, 0.007373392581939697, 0.007613062858581543, 0.007852733135223389, 0.008092403411865234, 0.00833207368850708, 0.008571743965148926, 0.008811414241790771, 0.009051084518432617, 0.009290754795074463, 0.009530425071716309, 0.009770095348358154, 0.010009765625]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 6.0, 11.0, 18.0, 27.0, 58.0, 147.0, 282.0, 248.0, 123.0, 40.0, 29.0, 9.0, 8.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61208176612854, -0.5970747470855713, -0.5820677280426025, -0.5670607686042786, -0.5520537495613098, -0.5370467305183411, -0.5220397114753723, -0.5070327520370483, -0.4920257329940796, -0.47701871395111084, -0.4620117247104645, -0.4470047056674957, -0.43199771642684937, -0.4169906973838806, -0.40198370814323425, -0.3869766891002655, -0.37196969985961914, -0.3569626808166504, -0.34195569157600403, -0.3269486725330353, -0.3119416832923889, -0.29693466424942017, -0.2819276750087738, -0.26692065596580505, -0.2519136369228363, -0.23690663278102875, -0.2218996286392212, -0.20689262449741364, -0.19188562035560608, -0.17687860131263733, -0.16187161207199097, -0.14686459302902222, -0.13185760378837585, -0.1168505996465683, -0.10184359550476074, -0.08683659136295319, -0.07182958722114563, -0.05682257562875748, -0.04181557148694992, -0.026808567345142365, -0.011801563203334808, 0.0032054418697953224, 0.018212446942925453, 0.03321945294737816, 0.048226457089185715, 0.06323346495628357, 0.07824046909809113, 0.09324747323989868, 0.10825447738170624, 0.1232614815235138, 0.13826848566532135, 0.1532754898071289, 0.16828249394893646, 0.18328949809074402, 0.19829651713371277, 0.21330350637435913, 0.22831052541732788, 0.24331752955913544, 0.258324533700943, 0.27333155274391174, 0.2883385419845581, 0.30334556102752686, 0.3183525502681732, 0.33335956931114197, 0.34836655855178833]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 5.0, 6.0, 11.0, 11.0, 18.0, 18.0, 14.0, 29.0, 24.0, 43.0, 40.0, 43.0, 59.0, 63.0, 39.0, 58.0, 44.0, 45.0, 67.0, 52.0, 41.0, 43.0, 35.0, 38.0, 38.0, 29.0, 22.0, 15.0, 13.0, 16.0, 8.0, 1.0, 4.0, 7.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.16176283359527588, -0.15728718042373657, -0.15281152725219727, -0.14833585917949677, -0.14386020600795746, -0.13938455283641815, -0.13490888476371765, -0.13043323159217834, -0.12595757842063904, -0.12148192524909973, -0.11700626462697983, -0.11253060400485992, -0.10805495083332062, -0.10357929766178131, -0.09910363703966141, -0.0946279764175415, -0.0901523232460022, -0.08567667007446289, -0.08120100945234299, -0.07672534883022308, -0.07224969565868378, -0.06777404248714447, -0.06329838186502457, -0.05882272496819496, -0.054347068071365356, -0.04987141117453575, -0.045395754277706146, -0.04092009738087654, -0.036444440484046936, -0.03196878358721733, -0.027493126690387726, -0.02301746979355812, -0.018541812896728516, -0.01406615599989891, -0.009590499103069305, -0.0051148422062397, -0.0006391853094100952, 0.00383647158741951, 0.008312128484249115, 0.01278778538107872, 0.017263442277908325, 0.02173909917473793, 0.026214756071567535, 0.03069041296839714, 0.035166069865226746, 0.03964172676205635, 0.044117383658885956, 0.04859304055571556, 0.053068697452545166, 0.05754435434937477, 0.062020011246204376, 0.06649567186832428, 0.07097132503986359, 0.0754469782114029, 0.0799226388335228, 0.0843982994556427, 0.088873952627182, 0.09334960579872131, 0.09782526642084122, 0.10230092704296112, 0.10677658021450043, 0.11125223338603973, 0.11572789400815964, 0.12020355463027954, 0.12467920780181885]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 5.0, 12.0, 20.0, 49.0, 133.0, 355.0, 1129.0, 4424.0, 28807.0, 852978.0, 147007.0, 10483.0, 2203.0, 629.0, 178.0, 63.0, 28.0, 11.0, 5.0, 6.0, 5.0, 1.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34619140625, -0.33371734619140625, -0.3212432861328125, -0.30876922607421875, -0.296295166015625, -0.28382110595703125, -0.2713470458984375, -0.25887298583984375, -0.24639892578125, -0.23392486572265625, -0.2214508056640625, -0.20897674560546875, -0.196502685546875, -0.18402862548828125, -0.1715545654296875, -0.15908050537109375, -0.1466064453125, -0.13413238525390625, -0.1216583251953125, -0.10918426513671875, -0.096710205078125, -0.08423614501953125, -0.0717620849609375, -0.05928802490234375, -0.04681396484375, -0.03433990478515625, -0.0218658447265625, -0.00939178466796875, 0.003082275390625, 0.01555633544921875, 0.0280303955078125, 0.04050445556640625, 0.052978515625, 0.06545257568359375, 0.0779266357421875, 0.09040069580078125, 0.102874755859375, 0.11534881591796875, 0.1278228759765625, 0.14029693603515625, 0.15277099609375, 0.16524505615234375, 0.1777191162109375, 0.19019317626953125, 0.202667236328125, 0.21514129638671875, 0.2276153564453125, 0.24008941650390625, 0.2525634765625, 0.26503753662109375, 0.2775115966796875, 0.28998565673828125, 0.302459716796875, 0.31493377685546875, 0.3274078369140625, 0.33988189697265625, 0.35235595703125, 0.36483001708984375, 0.3773040771484375, 0.38977813720703125, 0.402252197265625, 0.41472625732421875, 0.4272003173828125, 0.43967437744140625, 0.4521484375]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 6.0, 7.0, 10.0, 12.0, 16.0, 13.0, 25.0, 28.0, 42.0, 49.0, 50.0, 52.0, 49.0, 51.0, 48.0, 67.0, 50.0, 58.0, 56.0, 51.0, 39.0, 39.0, 35.0, 33.0, 25.0, 26.0, 16.0, 12.0, 8.0, 10.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.34716796875, -0.3376007080078125, -0.328033447265625, -0.3184661865234375, -0.30889892578125, -0.2993316650390625, -0.289764404296875, -0.2801971435546875, -0.2706298828125, -0.2610626220703125, -0.251495361328125, -0.2419281005859375, -0.23236083984375, -0.2227935791015625, -0.213226318359375, -0.2036590576171875, -0.194091796875, -0.1845245361328125, -0.174957275390625, -0.1653900146484375, -0.15582275390625, -0.1462554931640625, -0.136688232421875, -0.1271209716796875, -0.1175537109375, -0.1079864501953125, -0.098419189453125, -0.0888519287109375, -0.07928466796875, -0.0697174072265625, -0.060150146484375, -0.0505828857421875, -0.041015625, -0.0314483642578125, -0.021881103515625, -0.0123138427734375, -0.00274658203125, 0.0068206787109375, 0.016387939453125, 0.0259552001953125, 0.0355224609375, 0.0450897216796875, 0.054656982421875, 0.0642242431640625, 0.07379150390625, 0.0833587646484375, 0.092926025390625, 0.1024932861328125, 0.112060546875, 0.1216278076171875, 0.131195068359375, 0.1407623291015625, 0.15032958984375, 0.1598968505859375, 0.169464111328125, 0.1790313720703125, 0.1885986328125, 0.1981658935546875, 0.207733154296875, 0.2173004150390625, 0.22686767578125, 0.2364349365234375, 0.246002197265625, 0.2555694580078125, 0.26513671875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 10.0, 7.0, 13.0, 15.0, 23.0, 35.0, 41.0, 71.0, 141.0, 252.0, 664.0, 2605.0, 19770.0, 857151.0, 157851.0, 7577.0, 1364.0, 440.0, 212.0, 103.0, 73.0, 34.0, 29.0, 17.0, 12.0, 10.0, 10.0, 5.0, 7.0, 3.0, 5.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.380615234375, -0.36864471435546875, -0.3566741943359375, -0.34470367431640625, -0.332733154296875, -0.32076263427734375, -0.3087921142578125, -0.29682159423828125, -0.28485107421875, -0.27288055419921875, -0.2609100341796875, -0.24893951416015625, -0.236968994140625, -0.22499847412109375, -0.2130279541015625, -0.20105743408203125, -0.1890869140625, -0.17711639404296875, -0.1651458740234375, -0.15317535400390625, -0.141204833984375, -0.12923431396484375, -0.1172637939453125, -0.10529327392578125, -0.09332275390625, -0.08135223388671875, -0.0693817138671875, -0.05741119384765625, -0.045440673828125, -0.03347015380859375, -0.0214996337890625, -0.00952911376953125, 0.00244140625, 0.01441192626953125, 0.0263824462890625, 0.03835296630859375, 0.050323486328125, 0.06229400634765625, 0.0742645263671875, 0.08623504638671875, 0.09820556640625, 0.11017608642578125, 0.1221466064453125, 0.13411712646484375, 0.146087646484375, 0.15805816650390625, 0.1700286865234375, 0.18199920654296875, 0.1939697265625, 0.20594024658203125, 0.2179107666015625, 0.22988128662109375, 0.241851806640625, 0.25382232666015625, 0.2657928466796875, 0.27776336669921875, 0.28973388671875, 0.30170440673828125, 0.3136749267578125, 0.32564544677734375, 0.337615966796875, 0.34958648681640625, 0.3615570068359375, 0.37352752685546875, 0.385498046875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 5.0, 6.0, 7.0, 13.0, 6.0, 15.0, 12.0, 17.0, 18.0, 16.0, 24.0, 21.0, 19.0, 34.0, 28.0, 45.0, 40.0, 47.0, 41.0, 52.0, 44.0, 37.0, 43.0, 52.0, 54.0, 32.0, 30.0, 43.0, 23.0, 30.0, 26.0, 22.0, 22.0, 17.0, 17.0, 8.0, 12.0, 8.0, 4.0, 3.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.283203125, -0.2745780944824219, -0.26595306396484375, -0.2573280334472656, -0.2487030029296875, -0.24007797241210938, -0.23145294189453125, -0.22282791137695312, -0.214202880859375, -0.20557785034179688, -0.19695281982421875, -0.18832778930664062, -0.1797027587890625, -0.17107772827148438, -0.16245269775390625, -0.15382766723632812, -0.14520263671875, -0.13657760620117188, -0.12795257568359375, -0.11932754516601562, -0.1107025146484375, -0.10207748413085938, -0.09345245361328125, -0.08482742309570312, -0.076202392578125, -0.06757736206054688, -0.05895233154296875, -0.050327301025390625, -0.0417022705078125, -0.033077239990234375, -0.02445220947265625, -0.015827178955078125, -0.0072021484375, 0.001422882080078125, 0.01004791259765625, 0.018672943115234375, 0.0272979736328125, 0.035923004150390625, 0.04454803466796875, 0.053173065185546875, 0.061798095703125, 0.07042312622070312, 0.07904815673828125, 0.08767318725585938, 0.0962982177734375, 0.10492324829101562, 0.11354827880859375, 0.12217330932617188, 0.13079833984375, 0.13942337036132812, 0.14804840087890625, 0.15667343139648438, 0.1652984619140625, 0.17392349243164062, 0.18254852294921875, 0.19117355346679688, 0.199798583984375, 0.20842361450195312, 0.21704864501953125, 0.22567367553710938, 0.2342987060546875, 0.24292373657226562, 0.25154876708984375, 0.2601737976074219, 0.268798828125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 5.0, 0.0, 6.0, 5.0, 8.0, 17.0, 24.0, 44.0, 70.0, 156.0, 389.0, 1668.0, 13327.0, 864536.0, 161288.0, 5514.0, 910.0, 277.0, 121.0, 56.0, 43.0, 20.0, 25.0, 13.0, 7.0, 7.0, 3.0, 5.0, 4.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1549072265625, -0.1503276824951172, -0.14574813842773438, -0.14116859436035156, -0.13658905029296875, -0.13200950622558594, -0.12742996215820312, -0.12285041809082031, -0.1182708740234375, -0.11369132995605469, -0.10911178588867188, -0.10453224182128906, -0.09995269775390625, -0.09537315368652344, -0.09079360961914062, -0.08621406555175781, -0.081634521484375, -0.07705497741699219, -0.07247543334960938, -0.06789588928222656, -0.06331634521484375, -0.05873680114746094, -0.054157257080078125, -0.04957771301269531, -0.0449981689453125, -0.04041862487792969, -0.035839080810546875, -0.03125953674316406, -0.02667999267578125, -0.022100448608398438, -0.017520904541015625, -0.012941360473632812, -0.00836181640625, -0.0037822723388671875, 0.000797271728515625, 0.0053768157958984375, 0.00995635986328125, 0.014535903930664062, 0.019115447998046875, 0.023694992065429688, 0.0282745361328125, 0.03285408020019531, 0.037433624267578125, 0.04201316833496094, 0.04659271240234375, 0.05117225646972656, 0.055751800537109375, 0.06033134460449219, 0.064910888671875, 0.06949043273925781, 0.07406997680664062, 0.07864952087402344, 0.08322906494140625, 0.08780860900878906, 0.09238815307617188, 0.09696769714355469, 0.1015472412109375, 0.10612678527832031, 0.11070632934570312, 0.11528587341308594, 0.11986541748046875, 0.12444496154785156, 0.12902450561523438, 0.1336040496826172, 0.13818359375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 14.0, 8.0, 9.0, 29.0, 39.0, 86.0, 182.0, 240.0, 171.0, 94.0, 45.0, 37.0, 11.0, 9.0, 9.0, 6.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6450881958007812e-05, -1.5875324606895447e-05, -1.529976725578308e-05, -1.4724209904670715e-05, -1.414865255355835e-05, -1.3573095202445984e-05, -1.2997537851333618e-05, -1.2421980500221252e-05, -1.1846423149108887e-05, -1.1270865797996521e-05, -1.0695308446884155e-05, -1.011975109577179e-05, -9.544193744659424e-06, -8.968636393547058e-06, -8.393079042434692e-06, -7.817521691322327e-06, -7.241964340209961e-06, -6.666406989097595e-06, -6.0908496379852295e-06, -5.515292286872864e-06, -4.939734935760498e-06, -4.364177584648132e-06, -3.7886202335357666e-06, -3.213062882423401e-06, -2.637505531311035e-06, -2.0619481801986694e-06, -1.4863908290863037e-06, -9.10833477973938e-07, -3.3527612686157227e-07, 2.4028122425079346e-07, 8.158385753631592e-07, 1.391395926475525e-06, 1.9669532775878906e-06, 2.5425106287002563e-06, 3.118067979812622e-06, 3.693625330924988e-06, 4.2691826820373535e-06, 4.844740033149719e-06, 5.420297384262085e-06, 5.995854735374451e-06, 6.571412086486816e-06, 7.146969437599182e-06, 7.722526788711548e-06, 8.298084139823914e-06, 8.87364149093628e-06, 9.449198842048645e-06, 1.002475619316101e-05, 1.0600313544273376e-05, 1.1175870895385742e-05, 1.1751428246498108e-05, 1.2326985597610474e-05, 1.290254294872284e-05, 1.3478100299835205e-05, 1.405365765094757e-05, 1.4629215002059937e-05, 1.5204772353172302e-05, 1.5780329704284668e-05, 1.6355887055397034e-05, 1.69314444065094e-05, 1.7507001757621765e-05, 1.808255910873413e-05, 1.8658116459846497e-05, 1.9233673810958862e-05, 1.9809231162071228e-05, 2.0384788513183594e-05]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 11.0, 12.0, 12.0, 28.0, 43.0, 79.0, 188.0, 493.0, 1999.0, 18207.0, 984630.0, 38874.0, 2808.0, 678.0, 257.0, 100.0, 53.0, 26.0, 17.0, 10.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.186279296875, -0.18056488037109375, -0.1748504638671875, -0.16913604736328125, -0.163421630859375, -0.15770721435546875, -0.1519927978515625, -0.14627838134765625, -0.14056396484375, -0.13484954833984375, -0.1291351318359375, -0.12342071533203125, -0.117706298828125, -0.11199188232421875, -0.1062774658203125, -0.10056304931640625, -0.0948486328125, -0.08913421630859375, -0.0834197998046875, -0.07770538330078125, -0.071990966796875, -0.06627655029296875, -0.0605621337890625, -0.05484771728515625, -0.04913330078125, -0.04341888427734375, -0.0377044677734375, -0.03199005126953125, -0.026275634765625, -0.02056121826171875, -0.0148468017578125, -0.00913238525390625, -0.00341796875, 0.00229644775390625, 0.0080108642578125, 0.01372528076171875, 0.019439697265625, 0.02515411376953125, 0.0308685302734375, 0.03658294677734375, 0.04229736328125, 0.04801177978515625, 0.0537261962890625, 0.05944061279296875, 0.065155029296875, 0.07086944580078125, 0.0765838623046875, 0.08229827880859375, 0.0880126953125, 0.09372711181640625, 0.0994415283203125, 0.10515594482421875, 0.110870361328125, 0.11658477783203125, 0.1222991943359375, 0.12801361083984375, 0.13372802734375, 0.13944244384765625, 0.1451568603515625, 0.15087127685546875, 0.156585693359375, 0.16230010986328125, 0.1680145263671875, 0.17372894287109375, 0.179443359375]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 7.0, 25.0, 15.0, 28.0, 32.0, 72.0, 75.0, 127.0, 145.0, 150.0, 97.0, 74.0, 40.0, 35.0, 15.0, 15.0, 11.0, 10.0, 10.0, 0.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.033843994140625, -0.03273963928222656, -0.031635284423828125, -0.030530929565429688, -0.02942657470703125, -0.028322219848632812, -0.027217864990234375, -0.026113510131835938, -0.0250091552734375, -0.023904800415039062, -0.022800445556640625, -0.021696090698242188, -0.02059173583984375, -0.019487380981445312, -0.018383026123046875, -0.017278671264648438, -0.01617431640625, -0.015069961547851562, -0.013965606689453125, -0.012861251831054688, -0.01175689697265625, -0.010652542114257812, -0.009548187255859375, -0.008443832397460938, -0.0073394775390625, -0.0062351226806640625, -0.005130767822265625, -0.0040264129638671875, -0.00292205810546875, -0.0018177032470703125, -0.000713348388671875, 0.0003910064697265625, 0.001495361328125, 0.0025997161865234375, 0.003704071044921875, 0.0048084259033203125, 0.00591278076171875, 0.0070171356201171875, 0.008121490478515625, 0.009225845336914062, 0.0103302001953125, 0.011434555053710938, 0.012538909912109375, 0.013643264770507812, 0.01474761962890625, 0.015851974487304688, 0.016956329345703125, 0.018060684204101562, 0.0191650390625, 0.020269393920898438, 0.021373748779296875, 0.022478103637695312, 0.02358245849609375, 0.024686813354492188, 0.025791168212890625, 0.026895523071289062, 0.0279998779296875, 0.029104232788085938, 0.030208587646484375, 0.03131294250488281, 0.03241729736328125, 0.03352165222167969, 0.034626007080078125, 0.03573036193847656, 0.036834716796875]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 13.0, 26.0, 48.0, 185.0, 362.0, 263.0, 58.0, 31.0, 15.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.0096774101257324, -1.9699279069900513, -1.9301785230636597, -1.8904290199279785, -1.850679636001587, -1.8109301328659058, -1.7711807489395142, -1.731431245803833, -1.6916818618774414, -1.6519323587417603, -1.6121829748153687, -1.5724334716796875, -1.532684087753296, -1.4929345846176147, -1.4531852006912231, -1.413435697555542, -1.3736863136291504, -1.3339368104934692, -1.2941874265670776, -1.2544379234313965, -1.2146885395050049, -1.1749390363693237, -1.1351896524429321, -1.095440149307251, -1.0556906461715698, -1.0159411430358887, -0.9761917591094971, -0.9364423155784607, -0.8966928720474243, -0.8569434285163879, -0.8171939849853516, -0.7774444818496704, -0.7376950979232788, -0.6979456543922424, -0.658196210861206, -0.6184467673301697, -0.5786973237991333, -0.5389478802680969, -0.49919840693473816, -0.4594489634037018, -0.4196995198726654, -0.37995007634162903, -0.34020063281059265, -0.3004511594772339, -0.2607017159461975, -0.22095228731632233, -0.18120282888412476, -0.14145338535308838, -0.101703941822052, -0.06195449456572533, -0.02220504730939865, 0.017544403672218323, 0.0572938472032547, 0.09704329073429108, 0.13679274916648865, 0.17654219269752502, 0.2162916362285614, 0.2560410797595978, 0.29579052329063416, 0.3355399966239929, 0.3752894401550293, 0.4150388836860657, 0.45478832721710205, 0.4945377707481384, 0.5342872142791748]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 6.0, 3.0, 3.0, 5.0, 9.0, 7.0, 11.0, 16.0, 23.0, 14.0, 16.0, 27.0, 35.0, 45.0, 43.0, 53.0, 43.0, 37.0, 54.0, 53.0, 46.0, 50.0, 47.0, 46.0, 45.0, 44.0, 46.0, 30.0, 26.0, 26.0, 20.0, 17.0, 19.0, 6.0, 8.0, 9.0, 11.0, 3.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.589144229888916, -0.5728532075881958, -0.5565621852874756, -0.5402711629867554, -0.5239801406860352, -0.5076891183853149, -0.49139806628227234, -0.4751070439815521, -0.4588159918785095, -0.4425249695777893, -0.4262339472770691, -0.4099429249763489, -0.3936518728733063, -0.37736085057258606, -0.36106982827186584, -0.34477880597114563, -0.3284877836704254, -0.3121967613697052, -0.295905739068985, -0.2796146869659424, -0.26332366466522217, -0.24703264236450195, -0.23074162006378174, -0.21445059776306152, -0.19815956056118011, -0.1818685382604599, -0.1655775010585785, -0.14928647875785828, -0.13299545645713806, -0.11670441925525665, -0.10041339695453644, -0.08412236720323563, -0.0678313672542572, -0.05154033750295639, -0.03524931147694588, -0.018958285450935364, -0.002667255699634552, 0.01362377405166626, 0.029914796352386475, 0.046205826103687286, 0.0624968558549881, 0.07878788560628891, 0.09507891535758972, 0.11136993765830994, 0.12766095995903015, 0.14395199716091156, 0.16024301946163177, 0.17653405666351318, 0.1928250789642334, 0.2091161012649536, 0.22540713846683502, 0.24169816076755524, 0.25798919796943665, 0.27428022027015686, 0.2905712425708771, 0.3068622648715973, 0.3231533169746399, 0.3394443392753601, 0.3557353615760803, 0.37202638387680054, 0.38831743597984314, 0.40460845828056335, 0.42089948058128357, 0.4371905028820038, 0.453481525182724]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 2.0, 8.0, 13.0, 11.0, 16.0, 18.0, 30.0, 40.0, 65.0, 95.0, 149.0, 294.0, 591.0, 1317.0, 3285.0, 12638.0, 258103.0, 3715774.0, 183419.0, 12653.0, 3276.0, 1239.0, 538.0, 280.0, 139.0, 91.0, 54.0, 44.0, 27.0, 20.0, 12.0, 11.0, 6.0, 6.0, 8.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3994140625, -0.3867225646972656, -0.37403106689453125, -0.3613395690917969, -0.3486480712890625, -0.3359565734863281, -0.32326507568359375, -0.3105735778808594, -0.297882080078125, -0.2851905822753906, -0.27249908447265625, -0.2598075866699219, -0.2471160888671875, -0.23442459106445312, -0.22173309326171875, -0.20904159545898438, -0.19635009765625, -0.18365859985351562, -0.17096710205078125, -0.15827560424804688, -0.1455841064453125, -0.13289260864257812, -0.12020111083984375, -0.10750961303710938, -0.094818115234375, -0.08212661743164062, -0.06943511962890625, -0.056743621826171875, -0.0440521240234375, -0.031360626220703125, -0.01866912841796875, -0.005977630615234375, 0.0067138671875, 0.019405364990234375, 0.03209686279296875, 0.044788360595703125, 0.0574798583984375, 0.07017135620117188, 0.08286285400390625, 0.09555435180664062, 0.108245849609375, 0.12093734741210938, 0.13362884521484375, 0.14632034301757812, 0.1590118408203125, 0.17170333862304688, 0.18439483642578125, 0.19708633422851562, 0.20977783203125, 0.22246932983398438, 0.23516082763671875, 0.24785232543945312, 0.2605438232421875, 0.2732353210449219, 0.28592681884765625, 0.2986183166503906, 0.311309814453125, 0.3240013122558594, 0.33669281005859375, 0.3493843078613281, 0.3620758056640625, 0.3747673034667969, 0.38745880126953125, 0.4001502990722656, 0.412841796875]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 8.0, 6.0, 9.0, 10.0, 15.0, 19.0, 27.0, 44.0, 59.0, 50.0, 61.0, 60.0, 77.0, 76.0, 62.0, 67.0, 56.0, 50.0, 43.0, 36.0, 38.0, 34.0, 23.0, 21.0, 20.0, 12.0, 8.0, 5.0, 2.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2509765625, -0.2445354461669922, -0.23809432983398438, -0.23165321350097656, -0.22521209716796875, -0.21877098083496094, -0.21232986450195312, -0.2058887481689453, -0.1994476318359375, -0.1930065155029297, -0.18656539916992188, -0.18012428283691406, -0.17368316650390625, -0.16724205017089844, -0.16080093383789062, -0.1543598175048828, -0.147918701171875, -0.1414775848388672, -0.13503646850585938, -0.12859535217285156, -0.12215423583984375, -0.11571311950683594, -0.10927200317382812, -0.10283088684082031, -0.0963897705078125, -0.08994865417480469, -0.08350753784179688, -0.07706642150878906, -0.07062530517578125, -0.06418418884277344, -0.057743072509765625, -0.05130195617675781, -0.04486083984375, -0.03841972351074219, -0.031978607177734375, -0.025537490844726562, -0.01909637451171875, -0.012655258178710938, -0.006214141845703125, 0.0002269744873046875, 0.0066680908203125, 0.013109207153320312, 0.019550323486328125, 0.025991439819335938, 0.03243255615234375, 0.03887367248535156, 0.045314788818359375, 0.05175590515136719, 0.058197021484375, 0.06463813781738281, 0.07107925415039062, 0.07752037048339844, 0.08396148681640625, 0.09040260314941406, 0.09684371948242188, 0.10328483581542969, 0.1097259521484375, 0.11616706848144531, 0.12260818481445312, 0.12904930114746094, 0.13549041748046875, 0.14193153381347656, 0.14837265014648438, 0.1548137664794922, 0.1612548828125]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 6.0, 11.0, 8.0, 17.0, 19.0, 27.0, 35.0, 73.0, 92.0, 176.0, 315.0, 795.0, 2139.0, 8750.0, 81714.0, 3982344.0, 103343.0, 10134.0, 2479.0, 911.0, 355.0, 200.0, 107.0, 59.0, 46.0, 30.0, 17.0, 13.0, 12.0, 8.0, 6.0, 2.0, 7.0, 3.0, 6.0, 4.0, 2.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.335693359375, -0.3220100402832031, -0.30832672119140625, -0.2946434020996094, -0.2809600830078125, -0.2672767639160156, -0.25359344482421875, -0.23991012573242188, -0.226226806640625, -0.21254348754882812, -0.19886016845703125, -0.18517684936523438, -0.1714935302734375, -0.15781021118164062, -0.14412689208984375, -0.13044357299804688, -0.11676025390625, -0.10307693481445312, -0.08939361572265625, -0.07571029663085938, -0.0620269775390625, -0.048343658447265625, -0.03466033935546875, -0.020977020263671875, -0.007293701171875, 0.006389617919921875, 0.02007293701171875, 0.033756256103515625, 0.0474395751953125, 0.061122894287109375, 0.07480621337890625, 0.08848953247070312, 0.1021728515625, 0.11585617065429688, 0.12953948974609375, 0.14322280883789062, 0.1569061279296875, 0.17058944702148438, 0.18427276611328125, 0.19795608520507812, 0.211639404296875, 0.22532272338867188, 0.23900604248046875, 0.2526893615722656, 0.2663726806640625, 0.2800559997558594, 0.29373931884765625, 0.3074226379394531, 0.32110595703125, 0.3347892761230469, 0.34847259521484375, 0.3621559143066406, 0.3758392333984375, 0.3895225524902344, 0.40320587158203125, 0.4168891906738281, 0.430572509765625, 0.4442558288574219, 0.45793914794921875, 0.4716224670410156, 0.4853057861328125, 0.4989891052246094, 0.5126724243164062, 0.5263557434082031, 0.5400390625]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 10.0, 12.0, 9.0, 16.0, 17.0, 32.0, 43.0, 73.0, 97.0, 252.0, 548.0, 1051.0, 944.0, 467.0, 208.0, 110.0, 41.0, 44.0, 18.0, 16.0, 13.0, 11.0, 6.0, 5.0, 6.0, 2.0, 9.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.10394287109375, -0.1013336181640625, -0.098724365234375, -0.0961151123046875, -0.093505859375, -0.0908966064453125, -0.088287353515625, -0.0856781005859375, -0.08306884765625, -0.0804595947265625, -0.077850341796875, -0.0752410888671875, -0.0726318359375, -0.0700225830078125, -0.067413330078125, -0.0648040771484375, -0.06219482421875, -0.0595855712890625, -0.056976318359375, -0.0543670654296875, -0.0517578125, -0.0491485595703125, -0.046539306640625, -0.0439300537109375, -0.04132080078125, -0.0387115478515625, -0.036102294921875, -0.0334930419921875, -0.0308837890625, -0.0282745361328125, -0.025665283203125, -0.0230560302734375, -0.02044677734375, -0.0178375244140625, -0.015228271484375, -0.0126190185546875, -0.010009765625, -0.0074005126953125, -0.004791259765625, -0.0021820068359375, 0.00042724609375, 0.0030364990234375, 0.005645751953125, 0.0082550048828125, 0.0108642578125, 0.0134735107421875, 0.016082763671875, 0.0186920166015625, 0.02130126953125, 0.0239105224609375, 0.026519775390625, 0.0291290283203125, 0.03173828125, 0.0343475341796875, 0.036956787109375, 0.0395660400390625, 0.04217529296875, 0.0447845458984375, 0.047393798828125, 0.0500030517578125, 0.0526123046875, 0.0552215576171875, 0.057830810546875, 0.0604400634765625, 0.06304931640625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 6.0, 15.0, 6.0, 20.0, 29.0, 44.0, 71.0, 108.0, 153.0, 163.0, 133.0, 82.0, 58.0, 36.0, 23.0, 14.0, 13.0, 9.0, 5.0, 0.0, 4.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34517422318458557, -0.3340901732444763, -0.32300612330436707, -0.3119220733642578, -0.30083802342414856, -0.2897539734840393, -0.27866995334625244, -0.2675859034061432, -0.25650185346603394, -0.24541780352592468, -0.23433375358581543, -0.22324970364570618, -0.21216566860675812, -0.20108161866664886, -0.1899975687265396, -0.17891353368759155, -0.1678294688463211, -0.15674541890621185, -0.1456613689661026, -0.13457733392715454, -0.12349328398704529, -0.11240923404693604, -0.10132518410682678, -0.09024114161729813, -0.07915709167718887, -0.06807304173707962, -0.056988999247550964, -0.04590494930744171, -0.03482090309262276, -0.023736856877803802, -0.01265280693769455, -0.0015687644481658936, 0.00951528549194336, 0.020599331706762314, 0.03168337792158127, 0.04276742786169052, 0.053851474076509476, 0.06493552029132843, 0.07601957023143768, 0.08710361272096634, 0.09818766266107559, 0.10927171260118484, 0.1203557550907135, 0.13143980503082275, 0.142523854970932, 0.15360790491104126, 0.1646919548511505, 0.17577598989009857, 0.18686003983020782, 0.19794408977031708, 0.20902813971042633, 0.2201121747493744, 0.23119622468948364, 0.2422802746295929, 0.25336432456970215, 0.2644483745098114, 0.27553242444992065, 0.2866164743900299, 0.29770052433013916, 0.3087845742702484, 0.31986862421035767, 0.33095264434814453, 0.34203672409057617, 0.35312074422836304, 0.3642047941684723]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 6.0, 4.0, 5.0, 6.0, 14.0, 13.0, 19.0, 15.0, 21.0, 30.0, 29.0, 28.0, 38.0, 43.0, 43.0, 50.0, 49.0, 49.0, 63.0, 53.0, 36.0, 42.0, 44.0, 38.0, 38.0, 37.0, 49.0, 22.0, 21.0, 17.0, 15.0, 15.0, 13.0, 9.0, 8.0, 7.0, 3.0, 2.0, 2.0, 5.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13359737396240234, -0.12859424948692322, -0.12359113991260529, -0.11858802288770676, -0.11358490586280823, -0.1085817888379097, -0.10357867181301117, -0.09857554733753204, -0.09357243776321411, -0.08856932073831558, -0.08356620371341705, -0.07856308668851852, -0.07355996966362, -0.06855685263872147, -0.06355373561382294, -0.05855061486363411, -0.05354749411344528, -0.04854437708854675, -0.043541260063648224, -0.038538143038749695, -0.033535026013851166, -0.028531907126307487, -0.02352878823876381, -0.01852567121386528, -0.013522554188966751, -0.008519437164068222, -0.0035163192078471184, 0.0014867987483739853, 0.006489915773272514, 0.011493032798171043, 0.01649615168571472, 0.02149926871061325, 0.02650238573551178, 0.03150550276041031, 0.03650861978530884, 0.04151173681020737, 0.046514853835105896, 0.051517970860004425, 0.05652109161019325, 0.06152420863509178, 0.06652732193470001, 0.07153043895959854, 0.07653355598449707, 0.0815366730093956, 0.08653979003429413, 0.09154290705919266, 0.09654602408409119, 0.10154914855957031, 0.10655226558446884, 0.11155538260936737, 0.1165584996342659, 0.12156161665916443, 0.12656474113464355, 0.1315678507089615, 0.1365709751844406, 0.14157408475875854, 0.14657720923423767, 0.1515803337097168, 0.15658344328403473, 0.16158656775951385, 0.1665896773338318, 0.1715928018093109, 0.17659591138362885, 0.18159903585910797, 0.1866021454334259]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 2.0, 3.0, 3.0, 9.0, 16.0, 26.0, 16.0, 32.0, 54.0, 72.0, 121.0, 158.0, 280.0, 370.0, 577.0, 960.0, 1505.0, 2486.0, 4158.0, 7141.0, 12684.0, 23665.0, 45449.0, 92795.0, 187339.0, 276092.0, 193389.0, 95801.0, 47411.0, 24291.0, 13069.0, 7334.0, 4352.0, 2562.0, 1590.0, 948.0, 622.0, 379.0, 274.0, 177.0, 123.0, 80.0, 49.0, 31.0, 25.0, 18.0, 6.0, 6.0, 2.0, 7.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.0172119140625, -0.016713380813598633, -0.016214847564697266, -0.0157163143157959, -0.015217781066894531, -0.014719247817993164, -0.014220714569091797, -0.01372218132019043, -0.013223648071289062, -0.012725114822387695, -0.012226581573486328, -0.011728048324584961, -0.011229515075683594, -0.010730981826782227, -0.01023244857788086, -0.009733915328979492, -0.009235382080078125, -0.008736848831176758, -0.00823831558227539, -0.0077397823333740234, -0.007241249084472656, -0.006742715835571289, -0.006244182586669922, -0.005745649337768555, -0.0052471160888671875, -0.00474858283996582, -0.004250049591064453, -0.003751516342163086, -0.0032529830932617188, -0.0027544498443603516, -0.0022559165954589844, -0.0017573833465576172, -0.00125885009765625, -0.0007603168487548828, -0.0002617835998535156, 0.00023674964904785156, 0.0007352828979492188, 0.001233816146850586, 0.0017323493957519531, 0.0022308826446533203, 0.0027294158935546875, 0.0032279491424560547, 0.003726482391357422, 0.004225015640258789, 0.004723548889160156, 0.0052220821380615234, 0.005720615386962891, 0.006219148635864258, 0.006717681884765625, 0.007216215133666992, 0.007714748382568359, 0.008213281631469727, 0.008711814880371094, 0.009210348129272461, 0.009708881378173828, 0.010207414627075195, 0.010705947875976562, 0.01120448112487793, 0.011703014373779297, 0.012201547622680664, 0.012700080871582031, 0.013198614120483398, 0.013697147369384766, 0.014195680618286133, 0.0146942138671875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 1.0, 3.0, 8.0, 8.0, 15.0, 14.0, 19.0, 17.0, 34.0, 23.0, 39.0, 42.0, 47.0, 67.0, 47.0, 63.0, 64.0, 63.0, 40.0, 55.0, 53.0, 46.0, 39.0, 38.0, 40.0, 28.0, 21.0, 13.0, 15.0, 7.0, 5.0, 7.0, 5.0, 4.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1241455078125, -0.12025260925292969, -0.11635971069335938, -0.11246681213378906, -0.10857391357421875, -0.10468101501464844, -0.10078811645507812, -0.09689521789550781, -0.0930023193359375, -0.08910942077636719, -0.08521652221679688, -0.08132362365722656, -0.07743072509765625, -0.07353782653808594, -0.06964492797851562, -0.06575202941894531, -0.061859130859375, -0.05796623229980469, -0.054073333740234375, -0.05018043518066406, -0.04628753662109375, -0.04239463806152344, -0.038501739501953125, -0.03460884094238281, -0.0307159423828125, -0.026823043823242188, -0.022930145263671875, -0.019037246704101562, -0.01514434814453125, -0.011251449584960938, -0.007358551025390625, -0.0034656524658203125, 0.00042724609375, 0.0043201446533203125, 0.008213043212890625, 0.012105941772460938, 0.01599884033203125, 0.019891738891601562, 0.023784637451171875, 0.027677536010742188, 0.0315704345703125, 0.03546333312988281, 0.039356231689453125, 0.04324913024902344, 0.04714202880859375, 0.05103492736816406, 0.054927825927734375, 0.05882072448730469, 0.062713623046875, 0.06660652160644531, 0.07049942016601562, 0.07439231872558594, 0.07828521728515625, 0.08217811584472656, 0.08607101440429688, 0.08996391296386719, 0.0938568115234375, 0.09774971008300781, 0.10164260864257812, 0.10553550720214844, 0.10942840576171875, 0.11332130432128906, 0.11721420288085938, 0.12110710144042969, 0.125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 9.0, 8.0, 12.0, 39.0, 59.0, 119.0, 295.0, 802.0, 2382.0, 9289.0, 48791.0, 370933.0, 525127.0, 72899.0, 12815.0, 3135.0, 1064.0, 406.0, 171.0, 88.0, 34.0, 19.0, 11.0, 6.0, 8.0, 10.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.048065185546875, -0.046613216400146484, -0.04516124725341797, -0.04370927810668945, -0.04225730895996094, -0.04080533981323242, -0.039353370666503906, -0.03790140151977539, -0.036449432373046875, -0.03499746322631836, -0.033545494079589844, -0.03209352493286133, -0.030641555786132812, -0.029189586639404297, -0.02773761749267578, -0.026285648345947266, -0.02483367919921875, -0.023381710052490234, -0.02192974090576172, -0.020477771759033203, -0.019025802612304688, -0.017573833465576172, -0.016121864318847656, -0.01466989517211914, -0.013217926025390625, -0.01176595687866211, -0.010313987731933594, -0.008862018585205078, -0.0074100494384765625, -0.005958080291748047, -0.004506111145019531, -0.0030541419982910156, -0.0016021728515625, -0.00015020370483398438, 0.0013017654418945312, 0.002753734588623047, 0.0042057037353515625, 0.005657672882080078, 0.007109642028808594, 0.00856161117553711, 0.010013580322265625, 0.01146554946899414, 0.012917518615722656, 0.014369487762451172, 0.015821456909179688, 0.017273426055908203, 0.01872539520263672, 0.020177364349365234, 0.02162933349609375, 0.023081302642822266, 0.02453327178955078, 0.025985240936279297, 0.027437210083007812, 0.028889179229736328, 0.030341148376464844, 0.03179311752319336, 0.033245086669921875, 0.03469705581665039, 0.036149024963378906, 0.03760099411010742, 0.03905296325683594, 0.04050493240356445, 0.04195690155029297, 0.043408870697021484, 0.04486083984375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 5.0, 4.0, 3.0, 3.0, 7.0, 1.0, 8.0, 5.0, 10.0, 14.0, 13.0, 22.0, 20.0, 25.0, 27.0, 23.0, 36.0, 43.0, 38.0, 40.0, 65.0, 46.0, 60.0, 47.0, 54.0, 44.0, 54.0, 31.0, 45.0, 35.0, 36.0, 29.0, 22.0, 21.0, 16.0, 22.0, 5.0, 6.0, 8.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1990966796875, -0.19237327575683594, -0.18564987182617188, -0.1789264678955078, -0.17220306396484375, -0.1654796600341797, -0.15875625610351562, -0.15203285217285156, -0.1453094482421875, -0.13858604431152344, -0.13186264038085938, -0.1251392364501953, -0.11841583251953125, -0.11169242858886719, -0.10496902465820312, -0.09824562072753906, -0.091522216796875, -0.08479881286621094, -0.07807540893554688, -0.07135200500488281, -0.06462860107421875, -0.05790519714355469, -0.051181793212890625, -0.04445838928222656, -0.0377349853515625, -0.031011581420898438, -0.024288177490234375, -0.017564773559570312, -0.01084136962890625, -0.0041179656982421875, 0.002605438232421875, 0.009328842163085938, 0.01605224609375, 0.022775650024414062, 0.029499053955078125, 0.03622245788574219, 0.04294586181640625, 0.04966926574707031, 0.056392669677734375, 0.06311607360839844, 0.0698394775390625, 0.07656288146972656, 0.08328628540039062, 0.09000968933105469, 0.09673309326171875, 0.10345649719238281, 0.11017990112304688, 0.11690330505371094, 0.123626708984375, 0.13035011291503906, 0.13707351684570312, 0.1437969207763672, 0.15052032470703125, 0.1572437286376953, 0.16396713256835938, 0.17069053649902344, 0.1774139404296875, 0.18413734436035156, 0.19086074829101562, 0.1975841522216797, 0.20430755615234375, 0.2110309600830078, 0.21775436401367188, 0.22447776794433594, 0.231201171875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 4.0, 5.0, 8.0, 21.0, 13.0, 26.0, 44.0, 55.0, 90.0, 124.0, 225.0, 347.0, 592.0, 1171.0, 2365.0, 5748.0, 16824.0, 70059.0, 393476.0, 446017.0, 80936.0, 18908.0, 6106.0, 2525.0, 1237.0, 642.0, 345.0, 228.0, 132.0, 80.0, 68.0, 40.0, 18.0, 23.0, 16.0, 10.0, 10.0, 5.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.01029205322265625, -0.009960532188415527, -0.009629011154174805, -0.009297490119934082, -0.00896596908569336, -0.008634448051452637, -0.008302927017211914, -0.007971405982971191, -0.007639884948730469, -0.007308363914489746, -0.0069768428802490234, -0.006645321846008301, -0.006313800811767578, -0.0059822797775268555, -0.005650758743286133, -0.00531923770904541, -0.0049877166748046875, -0.004656195640563965, -0.004324674606323242, -0.0039931535720825195, -0.003661632537841797, -0.0033301115036010742, -0.0029985904693603516, -0.002667069435119629, -0.0023355484008789062, -0.0020040273666381836, -0.001672506332397461, -0.0013409852981567383, -0.0010094642639160156, -0.000677943229675293, -0.0003464221954345703, -1.4901161193847656e-05, 0.000316619873046875, 0.0006481409072875977, 0.0009796619415283203, 0.001311182975769043, 0.0016427040100097656, 0.0019742250442504883, 0.002305746078491211, 0.0026372671127319336, 0.0029687881469726562, 0.003300309181213379, 0.0036318302154541016, 0.003963351249694824, 0.004294872283935547, 0.0046263933181762695, 0.004957914352416992, 0.005289435386657715, 0.0056209564208984375, 0.00595247745513916, 0.006283998489379883, 0.0066155195236206055, 0.006947040557861328, 0.007278561592102051, 0.0076100826263427734, 0.007941603660583496, 0.008273124694824219, 0.008604645729064941, 0.008936166763305664, 0.009267687797546387, 0.00959920883178711, 0.009930729866027832, 0.010262250900268555, 0.010593771934509277, 0.01092529296875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 4.0, 3.0, 10.0, 4.0, 7.0, 6.0, 13.0, 7.0, 23.0, 26.0, 23.0, 55.0, 37.0, 58.0, 61.0, 80.0, 83.0, 48.0, 73.0, 77.0, 61.0, 52.0, 52.0, 43.0, 17.0, 25.0, 19.0, 11.0, 11.0, 7.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.635883331298828e-06, -3.4654513001441956e-06, -3.295019268989563e-06, -3.1245872378349304e-06, -2.954155206680298e-06, -2.7837231755256653e-06, -2.6132911443710327e-06, -2.4428591132164e-06, -2.2724270820617676e-06, -2.101995050907135e-06, -1.9315630197525024e-06, -1.7611309885978699e-06, -1.5906989574432373e-06, -1.4202669262886047e-06, -1.2498348951339722e-06, -1.0794028639793396e-06, -9.08970832824707e-07, -7.385388016700745e-07, -5.681067705154419e-07, -3.976747393608093e-07, -2.2724270820617676e-07, -5.681067705154419e-08, 1.1362135410308838e-07, 2.8405338525772095e-07, 4.544854164123535e-07, 6.249174475669861e-07, 7.953494787216187e-07, 9.657815098762512e-07, 1.1362135410308838e-06, 1.3066455721855164e-06, 1.477077603340149e-06, 1.6475096344947815e-06, 1.817941665649414e-06, 1.9883736968040466e-06, 2.158805727958679e-06, 2.3292377591133118e-06, 2.4996697902679443e-06, 2.670101821422577e-06, 2.8405338525772095e-06, 3.010965883731842e-06, 3.1813979148864746e-06, 3.351829946041107e-06, 3.5222619771957397e-06, 3.6926940083503723e-06, 3.863126039505005e-06, 4.0335580706596375e-06, 4.20399010181427e-06, 4.374422132968903e-06, 4.544854164123535e-06, 4.715286195278168e-06, 4.8857182264328e-06, 5.056150257587433e-06, 5.2265822887420654e-06, 5.397014319896698e-06, 5.5674463510513306e-06, 5.737878382205963e-06, 5.908310413360596e-06, 6.078742444515228e-06, 6.249174475669861e-06, 6.419606506824493e-06, 6.590038537979126e-06, 6.7604705691337585e-06, 6.930902600288391e-06, 7.101334631443024e-06, 7.271766662597656e-06]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 6.0, 7.0, 2.0, 8.0, 7.0, 15.0, 15.0, 25.0, 33.0, 35.0, 57.0, 80.0, 109.0, 178.0, 234.0, 445.0, 826.0, 1583.0, 4112.0, 11775.0, 40542.0, 171836.0, 504253.0, 233566.0, 53747.0, 15336.0, 5321.0, 2059.0, 934.0, 551.0, 304.0, 172.0, 129.0, 72.0, 38.0, 36.0, 33.0, 17.0, 17.0, 8.0, 11.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00911712646484375, -0.00882863998413086, -0.008540153503417969, -0.008251667022705078, -0.007963180541992188, -0.007674694061279297, -0.007386207580566406, -0.007097721099853516, -0.006809234619140625, -0.006520748138427734, -0.006232261657714844, -0.005943775177001953, -0.0056552886962890625, -0.005366802215576172, -0.005078315734863281, -0.004789829254150391, -0.0045013427734375, -0.004212856292724609, -0.003924369812011719, -0.003635883331298828, -0.0033473968505859375, -0.003058910369873047, -0.0027704238891601562, -0.0024819374084472656, -0.002193450927734375, -0.0019049644470214844, -0.0016164779663085938, -0.0013279914855957031, -0.0010395050048828125, -0.0007510185241699219, -0.00046253204345703125, -0.00017404556274414062, 0.00011444091796875, 0.0004029273986816406, 0.0006914138793945312, 0.0009799003601074219, 0.0012683868408203125, 0.0015568733215332031, 0.0018453598022460938, 0.0021338462829589844, 0.002422332763671875, 0.0027108192443847656, 0.0029993057250976562, 0.003287792205810547, 0.0035762786865234375, 0.003864765167236328, 0.004153251647949219, 0.004441738128662109, 0.004730224609375, 0.005018711090087891, 0.005307197570800781, 0.005595684051513672, 0.0058841705322265625, 0.006172657012939453, 0.006461143493652344, 0.006749629974365234, 0.007038116455078125, 0.007326602935791016, 0.007615089416503906, 0.007903575897216797, 0.008192062377929688, 0.008480548858642578, 0.008769035339355469, 0.00905752182006836, 0.00934600830078125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 6.0, 2.0, 1.0, 6.0, 1.0, 3.0, 11.0, 18.0, 16.0, 17.0, 19.0, 25.0, 28.0, 37.0, 33.0, 45.0, 46.0, 53.0, 55.0, 62.0, 53.0, 65.0, 61.0, 56.0, 45.0, 34.0, 31.0, 26.0, 24.0, 27.0, 21.0, 16.0, 5.0, 12.0, 10.0, 9.0, 6.0, 2.0, 2.0, 2.0, 4.0, 7.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0017490386962890625, -0.0016888082027435303, -0.001628577709197998, -0.0015683472156524658, -0.0015081167221069336, -0.0014478862285614014, -0.0013876557350158691, -0.001327425241470337, -0.0012671947479248047, -0.0012069642543792725, -0.0011467337608337402, -0.001086503267288208, -0.0010262727737426758, -0.0009660422801971436, -0.0009058117866516113, -0.0008455812931060791, -0.0007853507995605469, -0.0007251203060150146, -0.0006648898124694824, -0.0006046593189239502, -0.000544428825378418, -0.00048419833183288574, -0.0004239678382873535, -0.0003637373447418213, -0.00030350685119628906, -0.00024327635765075684, -0.0001830458641052246, -0.00012281537055969238, -6.258487701416016e-05, -2.3543834686279297e-06, 5.78761100769043e-05, 0.00011810660362243652, 0.00017833709716796875, 0.00023856759071350098, 0.0002987980842590332, 0.00035902857780456543, 0.00041925907135009766, 0.0004794895648956299, 0.0005397200584411621, 0.0005999505519866943, 0.0006601810455322266, 0.0007204115390777588, 0.000780642032623291, 0.0008408725261688232, 0.0009011030197143555, 0.0009613335132598877, 0.00102156400680542, 0.0010817945003509521, 0.0011420249938964844, 0.0012022554874420166, 0.0012624859809875488, 0.001322716474533081, 0.0013829469680786133, 0.0014431774616241455, 0.0015034079551696777, 0.00156363844871521, 0.0016238689422607422, 0.0016840994358062744, 0.0017443299293518066, 0.0018045604228973389, 0.001864790916442871, 0.0019250214099884033, 0.0019852519035339355, 0.0020454823970794678, 0.002105712890625]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 8.0, 24.0, 31.0, 70.0, 136.0, 264.0, 222.0, 115.0, 63.0, 22.0, 19.0, 8.0, 5.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3553064465522766, -0.34480053186416626, -0.3342946171760559, -0.32378873229026794, -0.3132828176021576, -0.30277690291404724, -0.2922710180282593, -0.2817651033401489, -0.2712591886520386, -0.2607532739639282, -0.25024735927581787, -0.2397414743900299, -0.22923555970191956, -0.2187296450138092, -0.20822374522686005, -0.1977178454399109, -0.18721193075180054, -0.17670601606369019, -0.16620011627674103, -0.15569421648979187, -0.14518830180168152, -0.13468238711357117, -0.12417648732662201, -0.11367058008909225, -0.1031646728515625, -0.09265876561403275, -0.08215285837650299, -0.07164695113897324, -0.06114104390144348, -0.05063513666391373, -0.04012922942638397, -0.029623322188854218, -0.019117414951324463, -0.008611507713794708, 0.0018943995237350464, 0.012400306761264801, 0.022906213998794556, 0.03341212123632431, 0.043918028473854065, 0.05442393571138382, 0.06492984294891357, 0.07543575018644333, 0.08594165742397308, 0.09644756466150284, 0.10695347189903259, 0.11745937913656235, 0.1279652863740921, 0.13847118616104126, 0.1489771008491516, 0.15948301553726196, 0.16998891532421112, 0.18049481511116028, 0.19100072979927063, 0.20150664448738098, 0.21201254427433014, 0.2225184440612793, 0.23302435874938965, 0.2435302734375, 0.25403618812561035, 0.2645420730113983, 0.27504798769950867, 0.285553902387619, 0.296059787273407, 0.30656570196151733, 0.3170716166496277]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 6.0, 2.0, 1.0, 7.0, 10.0, 12.0, 18.0, 14.0, 17.0, 21.0, 28.0, 36.0, 38.0, 42.0, 50.0, 50.0, 49.0, 62.0, 63.0, 56.0, 35.0, 44.0, 54.0, 40.0, 42.0, 37.0, 41.0, 25.0, 24.0, 9.0, 19.0, 13.0, 7.0, 7.0, 6.0, 4.0, 6.0, 2.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10806149989366531, -0.10454869270324707, -0.10103588551282883, -0.09752307832241058, -0.09401026368141174, -0.0904974564909935, -0.08698464930057526, -0.08347184211015701, -0.07995903491973877, -0.07644622772932053, -0.07293342053890228, -0.06942060589790344, -0.0659077987074852, -0.062394991517066956, -0.05888218432664871, -0.05536937713623047, -0.05185656622052193, -0.048343759030103683, -0.04483094811439514, -0.0413181409239769, -0.037805333733558655, -0.03429252654314041, -0.03077971562743187, -0.027266908437013626, -0.023754099383950233, -0.02024129033088684, -0.016728483140468597, -0.013215674087405205, -0.009702865965664387, -0.006190057843923569, -0.002677248790860176, 0.0008355583995580673, 0.00434836745262146, 0.007861175574362278, 0.011373983696103096, 0.014886792749166489, 0.018399599939584732, 0.021912408992648125, 0.025425218045711517, 0.02893802523612976, 0.032450832426548004, 0.03596363961696625, 0.03947645053267479, 0.04298925772309303, 0.046502064913511276, 0.05001487582921982, 0.05352768301963806, 0.057040490210056305, 0.06055330112576485, 0.06406611204147339, 0.06757891923189163, 0.07109172642230988, 0.07460453361272812, 0.07811734080314636, 0.0816301554441452, 0.08514295518398285, 0.08865576982498169, 0.09216857701539993, 0.09568138420581818, 0.09919419884681702, 0.10270700603723526, 0.1062198132276535, 0.10973262041807175, 0.11324542760848999, 0.11675823479890823]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 6.0, 14.0, 33.0, 34.0, 62.0, 90.0, 173.0, 263.0, 503.0, 921.0, 1678.0, 3288.0, 6861.0, 15780.0, 43583.0, 182828.0, 581340.0, 146608.0, 37596.0, 14173.0, 6148.0, 3034.0, 1577.0, 838.0, 469.0, 277.0, 159.0, 102.0, 45.0, 38.0, 20.0, 12.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10638427734375, -0.10338211059570312, -0.10037994384765625, -0.09737777709960938, -0.0943756103515625, -0.09137344360351562, -0.08837127685546875, -0.08536911010742188, -0.082366943359375, -0.07936477661132812, -0.07636260986328125, -0.07336044311523438, -0.0703582763671875, -0.06735610961914062, -0.06435394287109375, -0.061351776123046875, -0.058349609375, -0.055347442626953125, -0.05234527587890625, -0.049343109130859375, -0.0463409423828125, -0.043338775634765625, -0.04033660888671875, -0.037334442138671875, -0.034332275390625, -0.031330108642578125, -0.02832794189453125, -0.025325775146484375, -0.0223236083984375, -0.019321441650390625, -0.01631927490234375, -0.013317108154296875, -0.01031494140625, -0.007312774658203125, -0.00431060791015625, -0.001308441162109375, 0.0016937255859375, 0.004695892333984375, 0.00769805908203125, 0.010700225830078125, 0.013702392578125, 0.016704559326171875, 0.01970672607421875, 0.022708892822265625, 0.0257110595703125, 0.028713226318359375, 0.03171539306640625, 0.034717559814453125, 0.0377197265625, 0.040721893310546875, 0.04372406005859375, 0.046726226806640625, 0.0497283935546875, 0.052730560302734375, 0.05573272705078125, 0.058734893798828125, 0.061737060546875, 0.06473922729492188, 0.06774139404296875, 0.07074356079101562, 0.0737457275390625, 0.07674789428710938, 0.07975006103515625, 0.08275222778320312, 0.08575439453125]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 5.0, 8.0, 3.0, 12.0, 12.0, 8.0, 16.0, 21.0, 26.0, 36.0, 37.0, 49.0, 48.0, 58.0, 53.0, 53.0, 61.0, 54.0, 41.0, 47.0, 49.0, 56.0, 48.0, 44.0, 32.0, 27.0, 21.0, 12.0, 11.0, 12.0, 10.0, 9.0, 4.0, 6.0, 3.0, 1.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.243408203125, -0.23533248901367188, -0.22725677490234375, -0.21918106079101562, -0.2111053466796875, -0.20302963256835938, -0.19495391845703125, -0.18687820434570312, -0.178802490234375, -0.17072677612304688, -0.16265106201171875, -0.15457534790039062, -0.1464996337890625, -0.13842391967773438, -0.13034820556640625, -0.12227249145507812, -0.11419677734375, -0.10612106323242188, -0.09804534912109375, -0.08996963500976562, -0.0818939208984375, -0.07381820678710938, -0.06574249267578125, -0.057666778564453125, -0.049591064453125, -0.041515350341796875, -0.03343963623046875, -0.025363922119140625, -0.0172882080078125, -0.009212493896484375, -0.00113677978515625, 0.006938934326171875, 0.0150146484375, 0.023090362548828125, 0.03116607666015625, 0.039241790771484375, 0.0473175048828125, 0.055393218994140625, 0.06346893310546875, 0.07154464721679688, 0.079620361328125, 0.08769607543945312, 0.09577178955078125, 0.10384750366210938, 0.1119232177734375, 0.11999893188476562, 0.12807464599609375, 0.13615036010742188, 0.14422607421875, 0.15230178833007812, 0.16037750244140625, 0.16845321655273438, 0.1765289306640625, 0.18460464477539062, 0.19268035888671875, 0.20075607299804688, 0.208831787109375, 0.21690750122070312, 0.22498321533203125, 0.23305892944335938, 0.2411346435546875, 0.24921035766601562, 0.25728607177734375, 0.2653617858886719, 0.2734375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 4.0, 3.0, 3.0, 9.0, 17.0, 27.0, 32.0, 54.0, 101.0, 182.0, 436.0, 1186.0, 5538.0, 141672.0, 879515.0, 16557.0, 2020.0, 611.0, 266.0, 129.0, 61.0, 44.0, 25.0, 13.0, 13.0, 4.0, 6.0, 5.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.33544921875, -0.3264350891113281, -0.31742095947265625, -0.3084068298339844, -0.2993927001953125, -0.2903785705566406, -0.28136444091796875, -0.2723503112792969, -0.263336181640625, -0.2543220520019531, -0.24530792236328125, -0.23629379272460938, -0.2272796630859375, -0.21826553344726562, -0.20925140380859375, -0.20023727416992188, -0.19122314453125, -0.18220901489257812, -0.17319488525390625, -0.16418075561523438, -0.1551666259765625, -0.14615249633789062, -0.13713836669921875, -0.12812423706054688, -0.119110107421875, -0.11009597778320312, -0.10108184814453125, -0.09206771850585938, -0.0830535888671875, -0.07403945922851562, -0.06502532958984375, -0.056011199951171875, -0.0469970703125, -0.037982940673828125, -0.02896881103515625, -0.019954681396484375, -0.0109405517578125, -0.001926422119140625, 0.00708770751953125, 0.016101837158203125, 0.025115966796875, 0.034130096435546875, 0.04314422607421875, 0.052158355712890625, 0.0611724853515625, 0.07018661499023438, 0.07920074462890625, 0.08821487426757812, 0.09722900390625, 0.10624313354492188, 0.11525726318359375, 0.12427139282226562, 0.1332855224609375, 0.14229965209960938, 0.15131378173828125, 0.16032791137695312, 0.169342041015625, 0.17835617065429688, 0.18737030029296875, 0.19638442993164062, 0.2053985595703125, 0.21441268920898438, 0.22342681884765625, 0.23244094848632812, 0.241455078125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 7.0, 3.0, 7.0, 6.0, 9.0, 11.0, 13.0, 24.0, 12.0, 16.0, 21.0, 25.0, 28.0, 26.0, 39.0, 42.0, 49.0, 34.0, 35.0, 43.0, 44.0, 55.0, 37.0, 37.0, 32.0, 45.0, 45.0, 33.0, 37.0, 25.0, 22.0, 16.0, 20.0, 29.0, 15.0, 17.0, 8.0, 8.0, 9.0, 7.0, 3.0, 2.0, 3.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.2427978515625, -0.2352924346923828, -0.22778701782226562, -0.22028160095214844, -0.21277618408203125, -0.20527076721191406, -0.19776535034179688, -0.1902599334716797, -0.1827545166015625, -0.1752490997314453, -0.16774368286132812, -0.16023826599121094, -0.15273284912109375, -0.14522743225097656, -0.13772201538085938, -0.1302165985107422, -0.122711181640625, -0.11520576477050781, -0.10770034790039062, -0.10019493103027344, -0.09268951416015625, -0.08518409729003906, -0.07767868041992188, -0.07017326354980469, -0.0626678466796875, -0.05516242980957031, -0.047657012939453125, -0.04015159606933594, -0.03264617919921875, -0.025140762329101562, -0.017635345458984375, -0.010129928588867188, -0.00262451171875, 0.0048809051513671875, 0.012386322021484375, 0.019891738891601562, 0.02739715576171875, 0.03490257263183594, 0.042407989501953125, 0.04991340637207031, 0.0574188232421875, 0.06492424011230469, 0.07242965698242188, 0.07993507385253906, 0.08744049072265625, 0.09494590759277344, 0.10245132446289062, 0.10995674133300781, 0.117462158203125, 0.12496757507324219, 0.13247299194335938, 0.13997840881347656, 0.14748382568359375, 0.15498924255371094, 0.16249465942382812, 0.1700000762939453, 0.1775054931640625, 0.1850109100341797, 0.19251632690429688, 0.20002174377441406, 0.20752716064453125, 0.21503257751464844, 0.22253799438476562, 0.2300434112548828, 0.237548828125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 6.0, 12.0, 10.0, 18.0, 22.0, 55.0, 130.0, 304.0, 896.0, 4335.0, 84996.0, 943776.0, 11587.0, 1633.0, 444.0, 146.0, 78.0, 39.0, 21.0, 17.0, 12.0, 2.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.169189453125, -0.16438674926757812, -0.15958404541015625, -0.15478134155273438, -0.1499786376953125, -0.14517593383789062, -0.14037322998046875, -0.13557052612304688, -0.130767822265625, -0.12596511840820312, -0.12116241455078125, -0.11635971069335938, -0.1115570068359375, -0.10675430297851562, -0.10195159912109375, -0.09714889526367188, -0.09234619140625, -0.08754348754882812, -0.08274078369140625, -0.07793807983398438, -0.0731353759765625, -0.06833267211914062, -0.06352996826171875, -0.058727264404296875, -0.053924560546875, -0.049121856689453125, -0.04431915283203125, -0.039516448974609375, -0.0347137451171875, -0.029911041259765625, -0.02510833740234375, -0.020305633544921875, -0.0155029296875, -0.010700225830078125, -0.00589752197265625, -0.001094818115234375, 0.0037078857421875, 0.008510589599609375, 0.01331329345703125, 0.018115997314453125, 0.022918701171875, 0.027721405029296875, 0.03252410888671875, 0.037326812744140625, 0.0421295166015625, 0.046932220458984375, 0.05173492431640625, 0.056537628173828125, 0.06134033203125, 0.06614303588867188, 0.07094573974609375, 0.07574844360351562, 0.0805511474609375, 0.08535385131835938, 0.09015655517578125, 0.09495925903320312, 0.099761962890625, 0.10456466674804688, 0.10936737060546875, 0.11417007446289062, 0.1189727783203125, 0.12377548217773438, 0.12857818603515625, 0.13338088989257812, 0.13818359375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 4.0, 9.0, 15.0, 11.0, 22.0, 36.0, 79.0, 143.0, 230.0, 157.0, 125.0, 65.0, 38.0, 21.0, 14.0, 8.0, 5.0, 3.0, 3.0, 2.0, 5.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.6629695892333984e-05, -1.624133437871933e-05, -1.5852972865104675e-05, -1.546461135149002e-05, -1.5076249837875366e-05, -1.4687888324260712e-05, -1.4299526810646057e-05, -1.3911165297031403e-05, -1.3522803783416748e-05, -1.3134442269802094e-05, -1.2746080756187439e-05, -1.2357719242572784e-05, -1.196935772895813e-05, -1.1580996215343475e-05, -1.119263470172882e-05, -1.0804273188114166e-05, -1.0415911674499512e-05, -1.0027550160884857e-05, -9.639188647270203e-06, -9.250827133655548e-06, -8.862465620040894e-06, -8.474104106426239e-06, -8.085742592811584e-06, -7.69738107919693e-06, -7.309019565582275e-06, -6.920658051967621e-06, -6.532296538352966e-06, -6.143935024738312e-06, -5.755573511123657e-06, -5.367211997509003e-06, -4.978850483894348e-06, -4.590488970279694e-06, -4.202127456665039e-06, -3.8137659430503845e-06, -3.42540442943573e-06, -3.0370429158210754e-06, -2.648681402206421e-06, -2.2603198885917664e-06, -1.8719583749771118e-06, -1.4835968613624573e-06, -1.0952353477478027e-06, -7.068738341331482e-07, -3.1851232051849365e-07, 6.984919309616089e-08, 4.5821070671081543e-07, 8.4657222032547e-07, 1.2349337339401245e-06, 1.623295247554779e-06, 2.0116567611694336e-06, 2.400018274784088e-06, 2.7883797883987427e-06, 3.1767413020133972e-06, 3.5651028156280518e-06, 3.953464329242706e-06, 4.341825842857361e-06, 4.730187356472015e-06, 5.11854887008667e-06, 5.5069103837013245e-06, 5.895271897315979e-06, 6.2836334109306335e-06, 6.671994924545288e-06, 7.060356438159943e-06, 7.448717951774597e-06, 7.837079465389252e-06, 8.225440979003906e-06]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 4.0, 6.0, 15.0, 27.0, 39.0, 55.0, 117.0, 256.0, 831.0, 3757.0, 117340.0, 916322.0, 7898.0, 1169.0, 386.0, 134.0, 85.0, 40.0, 20.0, 17.0, 6.0, 6.0, 7.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.157470703125, -0.15187835693359375, -0.1462860107421875, -0.14069366455078125, -0.135101318359375, -0.12950897216796875, -0.1239166259765625, -0.11832427978515625, -0.11273193359375, -0.10713958740234375, -0.1015472412109375, -0.09595489501953125, -0.090362548828125, -0.08477020263671875, -0.0791778564453125, -0.07358551025390625, -0.0679931640625, -0.06240081787109375, -0.0568084716796875, -0.05121612548828125, -0.045623779296875, -0.04003143310546875, -0.0344390869140625, -0.02884674072265625, -0.02325439453125, -0.01766204833984375, -0.0120697021484375, -0.00647735595703125, -0.000885009765625, 0.00470733642578125, 0.0102996826171875, 0.01589202880859375, 0.021484375, 0.02707672119140625, 0.0326690673828125, 0.03826141357421875, 0.043853759765625, 0.04944610595703125, 0.0550384521484375, 0.06063079833984375, 0.06622314453125, 0.07181549072265625, 0.0774078369140625, 0.08300018310546875, 0.088592529296875, 0.09418487548828125, 0.0997772216796875, 0.10536956787109375, 0.1109619140625, 0.11655426025390625, 0.1221466064453125, 0.12773895263671875, 0.133331298828125, 0.13892364501953125, 0.1445159912109375, 0.15010833740234375, 0.15570068359375, 0.16129302978515625, 0.1668853759765625, 0.17247772216796875, 0.178070068359375, 0.18366241455078125, 0.1892547607421875, 0.19484710693359375, 0.200439453125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 5.0, 5.0, 9.0, 7.0, 8.0, 26.0, 23.0, 66.0, 111.0, 235.0, 233.0, 120.0, 61.0, 29.0, 20.0, 18.0, 14.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049224853515625, -0.04785728454589844, -0.046489715576171875, -0.04512214660644531, -0.04375457763671875, -0.04238700866699219, -0.041019439697265625, -0.03965187072753906, -0.0382843017578125, -0.03691673278808594, -0.035549163818359375, -0.03418159484863281, -0.03281402587890625, -0.03144645690917969, -0.030078887939453125, -0.028711318969726562, -0.02734375, -0.025976181030273438, -0.024608612060546875, -0.023241043090820312, -0.02187347412109375, -0.020505905151367188, -0.019138336181640625, -0.017770767211914062, -0.0164031982421875, -0.015035629272460938, -0.013668060302734375, -0.012300491333007812, -0.01093292236328125, -0.009565353393554688, -0.008197784423828125, -0.0068302154541015625, -0.005462646484375, -0.0040950775146484375, -0.002727508544921875, -0.0013599395751953125, 7.62939453125e-06, 0.0013751983642578125, 0.002742767333984375, 0.0041103363037109375, 0.0054779052734375, 0.0068454742431640625, 0.008213043212890625, 0.009580612182617188, 0.01094818115234375, 0.012315750122070312, 0.013683319091796875, 0.015050888061523438, 0.01641845703125, 0.017786026000976562, 0.019153594970703125, 0.020521163940429688, 0.02188873291015625, 0.023256301879882812, 0.024623870849609375, 0.025991439819335938, 0.0273590087890625, 0.028726577758789062, 0.030094146728515625, 0.03146171569824219, 0.03282928466796875, 0.03419685363769531, 0.035564422607421875, 0.03693199157714844, 0.038299560546875]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 13.0, 41.0, 169.0, 461.0, 236.0, 61.0, 12.0, 11.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.575226366519928, -0.5330412983894348, -0.49085626006126404, -0.4486711919307709, -0.4064861536026001, -0.36430108547210693, -0.32211601734161377, -0.279930979013443, -0.23774591088294983, -0.19556085765361786, -0.1533758044242859, -0.11119073629379272, -0.06900568306446075, -0.026820629835128784, 0.01536443829536438, 0.057549476623535156, 0.09973454475402832, 0.1419195979833603, 0.18410465121269226, 0.22628971934318542, 0.2684747576713562, 0.31065982580184937, 0.35284489393234253, 0.3950299322605133, 0.43721500039100647, 0.47940006852149963, 0.5215851068496704, 0.5637701749801636, 0.6059552431106567, 0.6481403112411499, 0.6903253793716431, 0.7325103878974915, 0.7746955156326294, 0.8168805837631226, 0.8590656518936157, 0.9012507200241089, 0.9434357285499573, 0.9856207966804504, 1.0278058052062988, 1.069990873336792, 1.1121759414672852, 1.1543610095977783, 1.1965460777282715, 1.2387311458587646, 1.2809162139892578, 1.323101282119751, 1.3652863502502441, 1.4074712991714478, 1.4496564865112305, 1.4918415546417236, 1.5340266227722168, 1.57621169090271, 1.6183967590332031, 1.6605818271636963, 1.7027668952941895, 1.744951844215393, 1.7871369123458862, 1.8293219804763794, 1.8715070486068726, 1.9136921167373657, 1.9558771848678589, 1.9980621337890625, 2.0402472019195557, 2.082432270050049, 2.124617338180542]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 6.0, 12.0, 15.0, 17.0, 26.0, 19.0, 37.0, 27.0, 29.0, 52.0, 34.0, 35.0, 44.0, 48.0, 47.0, 60.0, 60.0, 45.0, 52.0, 48.0, 40.0, 45.0, 36.0, 35.0, 25.0, 16.0, 19.0, 14.0, 13.0, 12.0, 11.0, 4.0, 7.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.6271568536758423, -0.6113367676734924, -0.5955166816711426, -0.5796966552734375, -0.5638765692710876, -0.5480564832687378, -0.5322363972663879, -0.5164163112640381, -0.500596284866333, -0.48477619886398315, -0.4689561426639557, -0.45313605666160583, -0.43731600046157837, -0.4214959144592285, -0.40567582845687866, -0.3898557424545288, -0.37403565645217896, -0.3582155704498291, -0.34239551424980164, -0.3265754282474518, -0.3107553720474243, -0.29493528604507446, -0.2791152000427246, -0.26329511404037476, -0.2474750578403473, -0.23165498673915863, -0.21583491563796997, -0.20001482963562012, -0.18419475853443146, -0.1683746874332428, -0.15255460143089294, -0.13673453032970428, -0.12091448903083801, -0.10509441792964935, -0.0892743393778801, -0.07345426082611084, -0.05763418972492218, -0.04181411862373352, -0.025994040071964264, -0.010173961520195007, 0.005646109580993652, 0.02146618440747261, 0.03728625923395157, 0.05310633406043053, 0.06892640888690948, 0.08474647998809814, 0.1005665585398674, 0.11638663709163666, 0.13220670819282532, 0.14802677929401398, 0.16384685039520264, 0.1796669363975525, 0.19548700749874115, 0.2113070785999298, 0.22712716460227966, 0.24294723570346832, 0.258767306804657, 0.27458739280700684, 0.2904074490070343, 0.30622753500938416, 0.3220475912094116, 0.3378676772117615, 0.35368776321411133, 0.3695078492164612, 0.38532790541648865]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 5.0, 2.0, 3.0, 2.0, 3.0, 4.0, 11.0, 12.0, 14.0, 19.0, 36.0, 37.0, 68.0, 112.0, 185.0, 242.0, 491.0, 889.0, 1722.0, 4311.0, 14165.0, 117929.0, 2952185.0, 1039865.0, 47029.0, 8593.0, 3285.0, 1371.0, 749.0, 367.0, 219.0, 117.0, 74.0, 45.0, 42.0, 27.0, 19.0, 13.0, 8.0, 11.0, 3.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.291259765625, -0.28238677978515625, -0.2735137939453125, -0.26464080810546875, -0.255767822265625, -0.24689483642578125, -0.2380218505859375, -0.22914886474609375, -0.22027587890625, -0.21140289306640625, -0.2025299072265625, -0.19365692138671875, -0.184783935546875, -0.17591094970703125, -0.1670379638671875, -0.15816497802734375, -0.1492919921875, -0.14041900634765625, -0.1315460205078125, -0.12267303466796875, -0.113800048828125, -0.10492706298828125, -0.0960540771484375, -0.08718109130859375, -0.07830810546875, -0.06943511962890625, -0.0605621337890625, -0.05168914794921875, -0.042816162109375, -0.03394317626953125, -0.0250701904296875, -0.01619720458984375, -0.00732421875, 0.00154876708984375, 0.0104217529296875, 0.01929473876953125, 0.028167724609375, 0.03704071044921875, 0.0459136962890625, 0.05478668212890625, 0.06365966796875, 0.07253265380859375, 0.0814056396484375, 0.09027862548828125, 0.099151611328125, 0.10802459716796875, 0.1168975830078125, 0.12577056884765625, 0.1346435546875, 0.14351654052734375, 0.1523895263671875, 0.16126251220703125, 0.170135498046875, 0.17900848388671875, 0.1878814697265625, 0.19675445556640625, 0.20562744140625, 0.21450042724609375, 0.2233734130859375, 0.23224639892578125, 0.241119384765625, 0.24999237060546875, 0.2588653564453125, 0.26773834228515625, 0.276611328125]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 9.0, 4.0, 8.0, 20.0, 18.0, 28.0, 22.0, 25.0, 25.0, 40.0, 38.0, 64.0, 54.0, 43.0, 54.0, 51.0, 70.0, 45.0, 57.0, 47.0, 35.0, 37.0, 35.0, 30.0, 26.0, 16.0, 18.0, 10.0, 14.0, 9.0, 7.0, 11.0, 6.0, 6.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11334228515625, -0.10926532745361328, -0.10518836975097656, -0.10111141204833984, -0.09703445434570312, -0.0929574966430664, -0.08888053894042969, -0.08480358123779297, -0.08072662353515625, -0.07664966583251953, -0.07257270812988281, -0.0684957504272461, -0.06441879272460938, -0.060341835021972656, -0.05626487731933594, -0.05218791961669922, -0.0481109619140625, -0.04403400421142578, -0.03995704650878906, -0.035880088806152344, -0.031803131103515625, -0.027726173400878906, -0.023649215698242188, -0.01957225799560547, -0.01549530029296875, -0.011418342590332031, -0.0073413848876953125, -0.0032644271850585938, 0.000812530517578125, 0.004889488220214844, 0.008966445922851562, 0.013043403625488281, 0.017120361328125, 0.02119731903076172, 0.025274276733398438, 0.029351234436035156, 0.033428192138671875, 0.037505149841308594, 0.04158210754394531, 0.04565906524658203, 0.04973602294921875, 0.05381298065185547, 0.05788993835449219, 0.061966896057128906, 0.06604385375976562, 0.07012081146240234, 0.07419776916503906, 0.07827472686767578, 0.0823516845703125, 0.08642864227294922, 0.09050559997558594, 0.09458255767822266, 0.09865951538085938, 0.1027364730834961, 0.10681343078613281, 0.11089038848876953, 0.11496734619140625, 0.11904430389404297, 0.12312126159667969, 0.1271982192993164, 0.13127517700195312, 0.13535213470458984, 0.13942909240722656, 0.14350605010986328, 0.1475830078125]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 5.0, 4.0, 3.0, 9.0, 8.0, 13.0, 13.0, 15.0, 27.0, 50.0, 55.0, 104.0, 183.0, 321.0, 754.0, 2102.0, 8211.0, 63622.0, 3762991.0, 330422.0, 19270.0, 3884.0, 1168.0, 470.0, 229.0, 118.0, 81.0, 42.0, 25.0, 20.0, 17.0, 12.0, 7.0, 13.0, 12.0, 3.0, 1.0, 2.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.32666015625, -0.31603240966796875, -0.3054046630859375, -0.29477691650390625, -0.284149169921875, -0.27352142333984375, -0.2628936767578125, -0.25226593017578125, -0.24163818359375, -0.23101043701171875, -0.2203826904296875, -0.20975494384765625, -0.199127197265625, -0.18849945068359375, -0.1778717041015625, -0.16724395751953125, -0.1566162109375, -0.14598846435546875, -0.1353607177734375, -0.12473297119140625, -0.114105224609375, -0.10347747802734375, -0.0928497314453125, -0.08222198486328125, -0.07159423828125, -0.06096649169921875, -0.0503387451171875, -0.03971099853515625, -0.029083251953125, -0.01845550537109375, -0.0078277587890625, 0.00279998779296875, 0.013427734375, 0.02405548095703125, 0.0346832275390625, 0.04531097412109375, 0.055938720703125, 0.06656646728515625, 0.0771942138671875, 0.08782196044921875, 0.09844970703125, 0.10907745361328125, 0.1197052001953125, 0.13033294677734375, 0.140960693359375, 0.15158843994140625, 0.1622161865234375, 0.17284393310546875, 0.1834716796875, 0.19409942626953125, 0.2047271728515625, 0.21535491943359375, 0.225982666015625, 0.23661041259765625, 0.2472381591796875, 0.25786590576171875, 0.26849365234375, 0.27912139892578125, 0.2897491455078125, 0.30037689208984375, 0.311004638671875, 0.32163238525390625, 0.3322601318359375, 0.34288787841796875, 0.353515625]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 5.0, 5.0, 9.0, 13.0, 10.0, 20.0, 28.0, 44.0, 82.0, 83.0, 168.0, 387.0, 643.0, 957.0, 685.0, 380.0, 191.0, 118.0, 72.0, 41.0, 27.0, 25.0, 23.0, 17.0, 10.0, 5.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055877685546875, -0.0538487434387207, -0.051819801330566406, -0.04979085922241211, -0.04776191711425781, -0.045732975006103516, -0.04370403289794922, -0.04167509078979492, -0.039646148681640625, -0.03761720657348633, -0.03558826446533203, -0.033559322357177734, -0.03153038024902344, -0.02950143814086914, -0.027472496032714844, -0.025443553924560547, -0.02341461181640625, -0.021385669708251953, -0.019356727600097656, -0.01732778549194336, -0.015298843383789062, -0.013269901275634766, -0.011240959167480469, -0.009212017059326172, -0.007183074951171875, -0.005154132843017578, -0.0031251907348632812, -0.0010962486267089844, 0.0009326934814453125, 0.0029616355895996094, 0.004990577697753906, 0.007019519805908203, 0.0090484619140625, 0.011077404022216797, 0.013106346130371094, 0.01513528823852539, 0.017164230346679688, 0.019193172454833984, 0.02122211456298828, 0.023251056671142578, 0.025279998779296875, 0.027308940887451172, 0.02933788299560547, 0.031366825103759766, 0.03339576721191406, 0.03542470932006836, 0.037453651428222656, 0.03948259353637695, 0.04151153564453125, 0.04354047775268555, 0.045569419860839844, 0.04759836196899414, 0.04962730407714844, 0.051656246185302734, 0.05368518829345703, 0.05571413040161133, 0.057743072509765625, 0.05977201461791992, 0.06180095672607422, 0.06382989883422852, 0.06585884094238281, 0.06788778305053711, 0.0699167251586914, 0.0719456672668457, 0.073974609375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 8.0, 3.0, 6.0, 14.0, 14.0, 17.0, 55.0, 67.0, 97.0, 152.0, 144.0, 145.0, 92.0, 57.0, 44.0, 32.0, 24.0, 10.0, 2.0, 5.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.32026854157447815, -0.3109922707080841, -0.3017159700393677, -0.29243969917297363, -0.2831634283065796, -0.27388715744018555, -0.2646108567714691, -0.2553345859050751, -0.24605830013751984, -0.2367820143699646, -0.22750574350357056, -0.21822945773601532, -0.20895317196846008, -0.19967690110206604, -0.1904006153345108, -0.18112432956695557, -0.17184805870056152, -0.1625717729330063, -0.15329550206661224, -0.144019216299057, -0.13474294543266296, -0.12546665966510773, -0.11619037389755249, -0.10691409558057785, -0.09763781726360321, -0.08836153894662857, -0.07908526062965393, -0.0698089748620987, -0.060532696545124054, -0.051256418228149414, -0.041980136185884476, -0.03270385414361954, -0.023427575826644897, -0.014151295647025108, -0.004875015467405319, 0.00440126471221447, 0.013677544891834259, 0.0229538232088089, 0.03223010525107384, 0.041506387293338776, 0.050782665610313416, 0.060058943927288055, 0.0693352222442627, 0.07861150801181793, 0.08788778632879257, 0.09716406464576721, 0.10644035041332245, 0.11571662873029709, 0.12499290704727173, 0.13426919281482697, 0.143545463681221, 0.15282174944877625, 0.1620980203151703, 0.17137430608272552, 0.18065059185028076, 0.1899268627166748, 0.19920314848423004, 0.20847943425178528, 0.21775570511817932, 0.22703199088573456, 0.2363082766532898, 0.24558454751968384, 0.2548608183860779, 0.2641371190547943, 0.27341338992118835]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 4.0, 11.0, 16.0, 17.0, 16.0, 21.0, 23.0, 22.0, 16.0, 36.0, 40.0, 32.0, 33.0, 46.0, 45.0, 49.0, 44.0, 57.0, 51.0, 42.0, 47.0, 49.0, 33.0, 43.0, 37.0, 31.0, 30.0, 18.0, 12.0, 16.0, 13.0, 15.0, 5.0, 6.0, 6.0, 2.0, 3.0, 4.0, 4.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11806507408618927, -0.11389222741127014, -0.10971938073635101, -0.10554653406143188, -0.10137368738651276, -0.09720084071159363, -0.0930280014872551, -0.08885515481233597, -0.08468230813741684, -0.08050946146249771, -0.07633661478757858, -0.07216376811265945, -0.06799092888832092, -0.0638180822134018, -0.059645235538482666, -0.05547238886356354, -0.05129954218864441, -0.04712669551372528, -0.04295384883880615, -0.03878100588917732, -0.034608159214258194, -0.030435312539339066, -0.026262467727065086, -0.022089622914791107, -0.01791677623987198, -0.013743930496275425, -0.009571084752678871, -0.005398239009082317, -0.0012253932654857635, 0.002947453409433365, 0.007120298221707344, 0.011293143033981323, 0.015466004610061646, 0.019638851284980774, 0.023811696097254753, 0.027984540909528732, 0.03215738758444786, 0.03633023425936699, 0.04050307720899582, 0.04467592388391495, 0.048848770558834076, 0.053021617233753204, 0.05719446390867233, 0.06136730685830116, 0.06554014980792999, 0.06971299648284912, 0.07388584315776825, 0.07805868983268738, 0.0822315365076065, 0.08640438318252563, 0.09057722985744476, 0.09475007653236389, 0.09892292320728302, 0.10309576988220215, 0.10726860910654068, 0.11144145578145981, 0.11561430245637894, 0.11978714913129807, 0.1239599958062172, 0.12813283503055573, 0.13230568170547485, 0.13647852838039398, 0.1406513750553131, 0.14482422173023224, 0.14899706840515137]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 2.0, 3.0, 14.0, 7.0, 15.0, 25.0, 69.0, 87.0, 181.0, 421.0, 770.0, 1804.0, 4467.0, 12421.0, 39922.0, 156743.0, 482547.0, 258288.0, 61947.0, 18145.0, 6223.0, 2438.0, 1020.0, 474.0, 255.0, 102.0, 68.0, 37.0, 26.0, 17.0, 11.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.037994384765625, -0.03703665733337402, -0.03607892990112305, -0.03512120246887207, -0.034163475036621094, -0.03320574760437012, -0.03224802017211914, -0.031290292739868164, -0.030332565307617188, -0.02937483787536621, -0.028417110443115234, -0.027459383010864258, -0.02650165557861328, -0.025543928146362305, -0.024586200714111328, -0.02362847328186035, -0.022670745849609375, -0.0217130184173584, -0.020755290985107422, -0.019797563552856445, -0.01883983612060547, -0.017882108688354492, -0.016924381256103516, -0.01596665382385254, -0.015008926391601562, -0.014051198959350586, -0.01309347152709961, -0.012135744094848633, -0.011178016662597656, -0.01022028923034668, -0.009262561798095703, -0.008304834365844727, -0.00734710693359375, -0.0063893795013427734, -0.005431652069091797, -0.00447392463684082, -0.0035161972045898438, -0.002558469772338867, -0.0016007423400878906, -0.0006430149078369141, 0.0003147125244140625, 0.001272439956665039, 0.0022301673889160156, 0.003187894821166992, 0.004145622253417969, 0.005103349685668945, 0.006061077117919922, 0.0070188045501708984, 0.007976531982421875, 0.008934259414672852, 0.009891986846923828, 0.010849714279174805, 0.011807441711425781, 0.012765169143676758, 0.013722896575927734, 0.014680624008178711, 0.015638351440429688, 0.016596078872680664, 0.01755380630493164, 0.018511533737182617, 0.019469261169433594, 0.02042698860168457, 0.021384716033935547, 0.022342443466186523, 0.0233001708984375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 8.0, 9.0, 19.0, 23.0, 19.0, 23.0, 23.0, 26.0, 27.0, 35.0, 57.0, 45.0, 50.0, 44.0, 62.0, 57.0, 59.0, 47.0, 58.0, 42.0, 53.0, 38.0, 35.0, 25.0, 22.0, 20.0, 7.0, 8.0, 9.0, 10.0, 13.0, 6.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.095458984375, -0.0921010971069336, -0.08874320983886719, -0.08538532257080078, -0.08202743530273438, -0.07866954803466797, -0.07531166076660156, -0.07195377349853516, -0.06859588623046875, -0.06523799896240234, -0.06188011169433594, -0.05852222442626953, -0.055164337158203125, -0.05180644989013672, -0.04844856262207031, -0.045090675354003906, -0.0417327880859375, -0.038374900817871094, -0.03501701354980469, -0.03165912628173828, -0.028301239013671875, -0.02494335174560547, -0.021585464477539062, -0.018227577209472656, -0.01486968994140625, -0.011511802673339844, -0.008153915405273438, -0.004796028137207031, -0.001438140869140625, 0.0019197463989257812, 0.0052776336669921875, 0.008635520935058594, 0.011993408203125, 0.015351295471191406, 0.018709182739257812, 0.02206707000732422, 0.025424957275390625, 0.02878284454345703, 0.03214073181152344, 0.035498619079589844, 0.03885650634765625, 0.042214393615722656, 0.04557228088378906, 0.04893016815185547, 0.052288055419921875, 0.05564594268798828, 0.05900382995605469, 0.062361717224121094, 0.0657196044921875, 0.0690774917602539, 0.07243537902832031, 0.07579326629638672, 0.07915115356445312, 0.08250904083251953, 0.08586692810058594, 0.08922481536865234, 0.09258270263671875, 0.09594058990478516, 0.09929847717285156, 0.10265636444091797, 0.10601425170898438, 0.10937213897705078, 0.11273002624511719, 0.1160879135131836, 0.11944580078125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 7.0, 6.0, 5.0, 14.0, 14.0, 21.0, 38.0, 77.0, 111.0, 177.0, 342.0, 603.0, 1162.0, 2607.0, 6800.0, 20911.0, 84265.0, 379515.0, 417585.0, 97268.0, 23864.0, 7454.0, 2854.0, 1309.0, 680.0, 346.0, 203.0, 108.0, 75.0, 35.0, 25.0, 16.0, 13.0, 9.0, 8.0, 3.0, 6.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.032928466796875, -0.03196120262145996, -0.030993938446044922, -0.030026674270629883, -0.029059410095214844, -0.028092145919799805, -0.027124881744384766, -0.026157617568969727, -0.025190353393554688, -0.02422308921813965, -0.02325582504272461, -0.02228856086730957, -0.02132129669189453, -0.020354032516479492, -0.019386768341064453, -0.018419504165649414, -0.017452239990234375, -0.016484975814819336, -0.015517711639404297, -0.014550447463989258, -0.013583183288574219, -0.01261591911315918, -0.01164865493774414, -0.010681390762329102, -0.009714126586914062, -0.008746862411499023, -0.007779598236083984, -0.006812334060668945, -0.005845069885253906, -0.004877805709838867, -0.003910541534423828, -0.002943277359008789, -0.00197601318359375, -0.001008749008178711, -4.1484832763671875e-05, 0.0009257793426513672, 0.0018930435180664062, 0.0028603076934814453, 0.0038275718688964844, 0.0047948360443115234, 0.0057621002197265625, 0.0067293643951416016, 0.007696628570556641, 0.00866389274597168, 0.009631156921386719, 0.010598421096801758, 0.011565685272216797, 0.012532949447631836, 0.013500213623046875, 0.014467477798461914, 0.015434741973876953, 0.016402006149291992, 0.01736927032470703, 0.01833653450012207, 0.01930379867553711, 0.02027106285095215, 0.021238327026367188, 0.022205591201782227, 0.023172855377197266, 0.024140119552612305, 0.025107383728027344, 0.026074647903442383, 0.027041912078857422, 0.02800917625427246, 0.0289764404296875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 5.0, 3.0, 6.0, 6.0, 15.0, 13.0, 14.0, 16.0, 13.0, 23.0, 19.0, 26.0, 19.0, 21.0, 26.0, 38.0, 32.0, 37.0, 39.0, 41.0, 37.0, 43.0, 37.0, 44.0, 36.0, 40.0, 36.0, 50.0, 31.0, 17.0, 34.0, 30.0, 24.0, 26.0, 16.0, 15.0, 9.0, 9.0, 16.0, 9.0, 7.0, 5.0, 7.0, 6.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.1640625, -0.15893936157226562, -0.15381622314453125, -0.14869308471679688, -0.1435699462890625, -0.13844680786132812, -0.13332366943359375, -0.12820053100585938, -0.123077392578125, -0.11795425415039062, -0.11283111572265625, -0.10770797729492188, -0.1025848388671875, -0.09746170043945312, -0.09233856201171875, -0.08721542358398438, -0.08209228515625, -0.07696914672851562, -0.07184600830078125, -0.06672286987304688, -0.0615997314453125, -0.056476593017578125, -0.05135345458984375, -0.046230316162109375, -0.041107177734375, -0.035984039306640625, -0.03086090087890625, -0.025737762451171875, -0.0206146240234375, -0.015491485595703125, -0.01036834716796875, -0.005245208740234375, -0.0001220703125, 0.005001068115234375, 0.01012420654296875, 0.015247344970703125, 0.0203704833984375, 0.025493621826171875, 0.03061676025390625, 0.035739898681640625, 0.040863037109375, 0.045986175537109375, 0.05110931396484375, 0.056232452392578125, 0.0613555908203125, 0.06647872924804688, 0.07160186767578125, 0.07672500610351562, 0.08184814453125, 0.08697128295898438, 0.09209442138671875, 0.09721755981445312, 0.1023406982421875, 0.10746383666992188, 0.11258697509765625, 0.11771011352539062, 0.122833251953125, 0.12795639038085938, 0.13307952880859375, 0.13820266723632812, 0.1433258056640625, 0.14844894409179688, 0.15357208251953125, 0.15869522094726562, 0.163818359375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 6.0, 6.0, 12.0, 14.0, 24.0, 37.0, 60.0, 109.0, 236.0, 495.0, 1255.0, 4028.0, 20170.0, 215857.0, 710464.0, 81264.0, 10412.0, 2464.0, 863.0, 378.0, 167.0, 85.0, 56.0, 30.0, 17.0, 12.0, 9.0, 9.0, 4.0, 9.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0142364501953125, -0.013715267181396484, -0.013194084167480469, -0.012672901153564453, -0.012151718139648438, -0.011630535125732422, -0.011109352111816406, -0.01058816909790039, -0.010066986083984375, -0.00954580307006836, -0.009024620056152344, -0.008503437042236328, -0.007982254028320312, -0.007461071014404297, -0.006939888000488281, -0.006418704986572266, -0.00589752197265625, -0.005376338958740234, -0.004855155944824219, -0.004333972930908203, -0.0038127899169921875, -0.003291606903076172, -0.0027704238891601562, -0.0022492408752441406, -0.001728057861328125, -0.0012068748474121094, -0.0006856918334960938, -0.00016450881958007812, 0.0003566741943359375, 0.0008778572082519531, 0.0013990402221679688, 0.0019202232360839844, 0.00244140625, 0.0029625892639160156, 0.0034837722778320312, 0.004004955291748047, 0.0045261383056640625, 0.005047321319580078, 0.005568504333496094, 0.006089687347412109, 0.006610870361328125, 0.007132053375244141, 0.007653236389160156, 0.008174419403076172, 0.008695602416992188, 0.009216785430908203, 0.009737968444824219, 0.010259151458740234, 0.01078033447265625, 0.011301517486572266, 0.011822700500488281, 0.012343883514404297, 0.012865066528320312, 0.013386249542236328, 0.013907432556152344, 0.01442861557006836, 0.014949798583984375, 0.01547098159790039, 0.015992164611816406, 0.016513347625732422, 0.017034530639648438, 0.017555713653564453, 0.01807689666748047, 0.018598079681396484, 0.0191192626953125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 9.0, 6.0, 12.0, 18.0, 15.0, 37.0, 32.0, 57.0, 58.0, 57.0, 107.0, 75.0, 125.0, 82.0, 68.0, 53.0, 43.0, 43.0, 23.0, 27.0, 9.0, 12.0, 12.0, 6.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.841255187988281e-06, -5.638226866722107e-06, -5.435198545455933e-06, -5.232170224189758e-06, -5.029141902923584e-06, -4.82611358165741e-06, -4.623085260391235e-06, -4.420056939125061e-06, -4.217028617858887e-06, -4.014000296592712e-06, -3.810971975326538e-06, -3.6079436540603638e-06, -3.4049153327941895e-06, -3.201887011528015e-06, -2.998858690261841e-06, -2.7958303689956665e-06, -2.592802047729492e-06, -2.389773726463318e-06, -2.1867454051971436e-06, -1.9837170839309692e-06, -1.780688762664795e-06, -1.5776604413986206e-06, -1.3746321201324463e-06, -1.171603798866272e-06, -9.685754776000977e-07, -7.655471563339233e-07, -5.62518835067749e-07, -3.594905138015747e-07, -1.564621925354004e-07, 4.6566128730773926e-08, 2.4959444999694824e-07, 4.5262277126312256e-07, 6.556510925292969e-07, 8.586794137954712e-07, 1.0617077350616455e-06, 1.2647360563278198e-06, 1.4677643775939941e-06, 1.6707926988601685e-06, 1.8738210201263428e-06, 2.076849341392517e-06, 2.2798776626586914e-06, 2.4829059839248657e-06, 2.68593430519104e-06, 2.8889626264572144e-06, 3.0919909477233887e-06, 3.295019268989563e-06, 3.4980475902557373e-06, 3.7010759115219116e-06, 3.904104232788086e-06, 4.10713255405426e-06, 4.3101608753204346e-06, 4.513189196586609e-06, 4.716217517852783e-06, 4.9192458391189575e-06, 5.122274160385132e-06, 5.325302481651306e-06, 5.5283308029174805e-06, 5.731359124183655e-06, 5.934387445449829e-06, 6.137415766716003e-06, 6.340444087982178e-06, 6.543472409248352e-06, 6.746500730514526e-06, 6.949529051780701e-06, 7.152557373046875e-06]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 9.0, 7.0, 3.0, 14.0, 15.0, 33.0, 27.0, 41.0, 62.0, 113.0, 150.0, 234.0, 443.0, 830.0, 1940.0, 4786.0, 15297.0, 64376.0, 313413.0, 481180.0, 126005.0, 26734.0, 7441.0, 2755.0, 1157.0, 603.0, 321.0, 194.0, 113.0, 87.0, 53.0, 43.0, 19.0, 18.0, 10.0, 14.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00933837890625, -0.009018659591674805, -0.00869894027709961, -0.008379220962524414, -0.008059501647949219, -0.0077397823333740234, -0.007420063018798828, -0.007100343704223633, -0.0067806243896484375, -0.006460905075073242, -0.006141185760498047, -0.0058214664459228516, -0.005501747131347656, -0.005182027816772461, -0.004862308502197266, -0.00454258918762207, -0.004222869873046875, -0.0039031505584716797, -0.0035834312438964844, -0.003263711929321289, -0.0029439926147460938, -0.0026242733001708984, -0.002304553985595703, -0.001984834671020508, -0.0016651153564453125, -0.0013453960418701172, -0.0010256767272949219, -0.0007059574127197266, -0.00038623809814453125, -6.651878356933594e-05, 0.0002532005310058594, 0.0005729198455810547, 0.00089263916015625, 0.0012123584747314453, 0.0015320777893066406, 0.001851797103881836, 0.0021715164184570312, 0.0024912357330322266, 0.002810955047607422, 0.003130674362182617, 0.0034503936767578125, 0.003770112991333008, 0.004089832305908203, 0.0044095516204833984, 0.004729270935058594, 0.005048990249633789, 0.005368709564208984, 0.00568842887878418, 0.006008148193359375, 0.00632786750793457, 0.006647586822509766, 0.006967306137084961, 0.007287025451660156, 0.0076067447662353516, 0.007926464080810547, 0.008246183395385742, 0.008565902709960938, 0.008885622024536133, 0.009205341339111328, 0.009525060653686523, 0.009844779968261719, 0.010164499282836914, 0.01048421859741211, 0.010803937911987305, 0.0111236572265625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 6.0, 12.0, 7.0, 15.0, 21.0, 19.0, 30.0, 35.0, 44.0, 68.0, 49.0, 63.0, 70.0, 78.0, 79.0, 58.0, 71.0, 61.0, 32.0, 46.0, 34.0, 30.0, 16.0, 10.0, 13.0, 12.0, 6.0, 3.0, 5.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0029659271240234375, -0.0028780102729797363, -0.002790093421936035, -0.002702176570892334, -0.002614259719848633, -0.0025263428688049316, -0.0024384260177612305, -0.0023505091667175293, -0.002262592315673828, -0.002174675464630127, -0.0020867586135864258, -0.0019988417625427246, -0.0019109249114990234, -0.0018230080604553223, -0.001735091209411621, -0.00164717435836792, -0.0015592575073242188, -0.0014713406562805176, -0.0013834238052368164, -0.0012955069541931152, -0.001207590103149414, -0.0011196732521057129, -0.0010317564010620117, -0.0009438395500183105, -0.0008559226989746094, -0.0007680058479309082, -0.000680088996887207, -0.0005921721458435059, -0.0005042552947998047, -0.0004163384437561035, -0.00032842159271240234, -0.00024050474166870117, -0.000152587890625, -6.467103958129883e-05, 2.3245811462402344e-05, 0.00011116266250610352, 0.0001990795135498047, 0.00028699636459350586, 0.00037491321563720703, 0.0004628300666809082, 0.0005507469177246094, 0.0006386637687683105, 0.0007265806198120117, 0.0008144974708557129, 0.0009024143218994141, 0.0009903311729431152, 0.0010782480239868164, 0.0011661648750305176, 0.0012540817260742188, 0.00134199857711792, 0.001429915428161621, 0.0015178322792053223, 0.0016057491302490234, 0.0016936659812927246, 0.0017815828323364258, 0.001869499683380127, 0.001957416534423828, 0.0020453333854675293, 0.0021332502365112305, 0.0022211670875549316, 0.002309083938598633, 0.002397000789642334, 0.002484917640686035, 0.0025728344917297363, 0.0026607513427734375]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 7.0, 13.0, 15.0, 52.0, 94.0, 169.0, 214.0, 188.0, 104.0, 61.0, 26.0, 24.0, 7.0, 7.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3339976370334625, -0.32557156682014465, -0.3171454668045044, -0.3087193965911865, -0.30029332637786865, -0.2918672561645508, -0.2834411859512329, -0.27501508593559265, -0.2665890157222748, -0.2581629455089569, -0.24973686039447784, -0.24131077527999878, -0.2328847050666809, -0.22445863485336304, -0.21603254973888397, -0.2076064646244049, -0.19918039441108704, -0.19075432419776917, -0.1823282390832901, -0.17390215396881104, -0.16547608375549316, -0.1570500135421753, -0.14862392842769623, -0.14019784331321716, -0.1317717730998993, -0.12334569543600082, -0.11491961777210236, -0.10649354010820389, -0.09806746244430542, -0.08964138478040695, -0.08121530711650848, -0.07278922945261002, -0.06436315178871155, -0.05593707412481308, -0.04751099646091461, -0.039084918797016144, -0.030658841133117676, -0.022232763469219208, -0.01380668580532074, -0.005380608141422272, 0.0030454695224761963, 0.011471547186374664, 0.019897624850273132, 0.0283237025141716, 0.03674978017807007, 0.045175857841968536, 0.053601935505867004, 0.06202801316976547, 0.07045409083366394, 0.07888016849756241, 0.08730624616146088, 0.09573232382535934, 0.10415840148925781, 0.11258447915315628, 0.12101055681705475, 0.1294366419315338, 0.13786271214485168, 0.14628878235816956, 0.15471486747264862, 0.16314095258712769, 0.17156702280044556, 0.17999309301376343, 0.1884191781282425, 0.19684526324272156, 0.20527133345603943]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 6.0, 6.0, 8.0, 17.0, 14.0, 24.0, 20.0, 29.0, 23.0, 35.0, 43.0, 37.0, 48.0, 41.0, 49.0, 64.0, 66.0, 52.0, 54.0, 58.0, 48.0, 34.0, 45.0, 35.0, 30.0, 24.0, 17.0, 14.0, 14.0, 12.0, 9.0, 5.0, 7.0, 0.0, 2.0, 4.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0979456678032875, -0.09462704509496689, -0.09130841493606567, -0.08798979222774506, -0.08467116206884384, -0.08135253936052322, -0.07803390920162201, -0.07471528649330139, -0.07139666378498077, -0.06807804107666016, -0.06475941091775894, -0.061440788209438324, -0.05812216177582741, -0.05480353534221649, -0.051484908908605576, -0.04816628247499466, -0.04484765604138374, -0.04152902960777283, -0.03821040317416191, -0.034891776740550995, -0.03157315403223038, -0.02825452759861946, -0.024935901165008545, -0.021617276594042778, -0.018298650160431862, -0.01498002465814352, -0.011661399155855179, -0.008342772722244263, -0.005024147219955921, -0.0017055217176675797, 0.0016131047159433365, 0.004931729286909103, 0.00825035572052002, 0.011568981222808361, 0.014887606725096703, 0.01820623315870762, 0.021524857729673386, 0.024843484163284302, 0.028162110596895218, 0.031480737030506134, 0.03479935973882675, 0.03811798617243767, 0.041436612606048584, 0.0447552353143692, 0.04807386174798012, 0.051392488181591034, 0.05471111461520195, 0.058029741048812866, 0.06134836748242378, 0.0646669939160347, 0.06798561662435532, 0.07130424678325653, 0.07462286949157715, 0.07794149219989777, 0.08126012235879898, 0.0845787450671196, 0.08789737522602081, 0.09121599793434143, 0.09453462809324265, 0.09785325080156326, 0.10117188096046448, 0.1044905036687851, 0.10780912637710571, 0.11112775653600693, 0.11444637924432755]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 7.0, 6.0, 2.0, 10.0, 21.0, 10.0, 23.0, 34.0, 49.0, 63.0, 128.0, 142.0, 268.0, 429.0, 689.0, 1210.0, 2213.0, 4444.0, 9748.0, 23440.0, 68303.0, 287531.0, 477539.0, 111663.0, 34522.0, 13509.0, 5880.0, 2901.0, 1538.0, 831.0, 506.0, 293.0, 186.0, 145.0, 91.0, 47.0, 44.0, 28.0, 22.0, 17.0, 10.0, 11.0, 2.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0711669921875, -0.06864261627197266, -0.06611824035644531, -0.06359386444091797, -0.061069488525390625, -0.05854511260986328, -0.05602073669433594, -0.053496360778808594, -0.05097198486328125, -0.048447608947753906, -0.04592323303222656, -0.04339885711669922, -0.040874481201171875, -0.03835010528564453, -0.03582572937011719, -0.033301353454589844, -0.0307769775390625, -0.028252601623535156, -0.025728225708007812, -0.02320384979248047, -0.020679473876953125, -0.01815509796142578, -0.015630722045898438, -0.013106346130371094, -0.01058197021484375, -0.008057594299316406, -0.0055332183837890625, -0.0030088424682617188, -0.000484466552734375, 0.0020399093627929688, 0.0045642852783203125, 0.007088661193847656, 0.009613037109375, 0.012137413024902344, 0.014661788940429688, 0.01718616485595703, 0.019710540771484375, 0.02223491668701172, 0.024759292602539062, 0.027283668518066406, 0.02980804443359375, 0.032332420349121094, 0.03485679626464844, 0.03738117218017578, 0.039905548095703125, 0.04242992401123047, 0.04495429992675781, 0.047478675842285156, 0.0500030517578125, 0.052527427673339844, 0.05505180358886719, 0.05757617950439453, 0.060100555419921875, 0.06262493133544922, 0.06514930725097656, 0.0676736831665039, 0.07019805908203125, 0.0727224349975586, 0.07524681091308594, 0.07777118682861328, 0.08029556274414062, 0.08281993865966797, 0.08534431457519531, 0.08786869049072266, 0.09039306640625]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 11.0, 12.0, 9.0, 16.0, 18.0, 22.0, 22.0, 39.0, 43.0, 48.0, 46.0, 52.0, 62.0, 74.0, 65.0, 57.0, 57.0, 65.0, 43.0, 40.0, 42.0, 32.0, 20.0, 19.0, 19.0, 14.0, 12.0, 7.0, 4.0, 4.0, 3.0, 3.0, 5.0, 5.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.211669921875, -0.20444107055664062, -0.19721221923828125, -0.18998336791992188, -0.1827545166015625, -0.17552566528320312, -0.16829681396484375, -0.16106796264648438, -0.153839111328125, -0.14661026000976562, -0.13938140869140625, -0.13215255737304688, -0.1249237060546875, -0.11769485473632812, -0.11046600341796875, -0.10323715209960938, -0.09600830078125, -0.08877944946289062, -0.08155059814453125, -0.07432174682617188, -0.0670928955078125, -0.059864044189453125, -0.05263519287109375, -0.045406341552734375, -0.038177490234375, -0.030948638916015625, -0.02371978759765625, -0.016490936279296875, -0.0092620849609375, -0.002033233642578125, 0.00519561767578125, 0.012424468994140625, 0.0196533203125, 0.026882171630859375, 0.03411102294921875, 0.041339874267578125, 0.0485687255859375, 0.055797576904296875, 0.06302642822265625, 0.07025527954101562, 0.077484130859375, 0.08471298217773438, 0.09194183349609375, 0.09917068481445312, 0.1063995361328125, 0.11362838745117188, 0.12085723876953125, 0.12808609008789062, 0.13531494140625, 0.14254379272460938, 0.14977264404296875, 0.15700149536132812, 0.1642303466796875, 0.17145919799804688, 0.17868804931640625, 0.18591690063476562, 0.193145751953125, 0.20037460327148438, 0.20760345458984375, 0.21483230590820312, 0.2220611572265625, 0.22929000854492188, 0.23651885986328125, 0.24374771118164062, 0.2509765625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 0.0, 3.0, 8.0, 5.0, 8.0, 6.0, 8.0, 28.0, 31.0, 48.0, 97.0, 193.0, 491.0, 1489.0, 13253.0, 804644.0, 219947.0, 6499.0, 1046.0, 351.0, 157.0, 89.0, 51.0, 29.0, 21.0, 8.0, 11.0, 7.0, 6.0, 6.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28759765625, -0.27857208251953125, -0.2695465087890625, -0.26052093505859375, -0.251495361328125, -0.24246978759765625, -0.2334442138671875, -0.22441864013671875, -0.21539306640625, -0.20636749267578125, -0.1973419189453125, -0.18831634521484375, -0.179290771484375, -0.17026519775390625, -0.1612396240234375, -0.15221405029296875, -0.1431884765625, -0.13416290283203125, -0.1251373291015625, -0.11611175537109375, -0.107086181640625, -0.09806060791015625, -0.0890350341796875, -0.08000946044921875, -0.07098388671875, -0.06195831298828125, -0.0529327392578125, -0.04390716552734375, -0.034881591796875, -0.02585601806640625, -0.0168304443359375, -0.00780487060546875, 0.001220703125, 0.01024627685546875, 0.0192718505859375, 0.02829742431640625, 0.037322998046875, 0.04634857177734375, 0.0553741455078125, 0.06439971923828125, 0.07342529296875, 0.08245086669921875, 0.0914764404296875, 0.10050201416015625, 0.109527587890625, 0.11855316162109375, 0.1275787353515625, 0.13660430908203125, 0.1456298828125, 0.15465545654296875, 0.1636810302734375, 0.17270660400390625, 0.181732177734375, 0.19075775146484375, 0.1997833251953125, 0.20880889892578125, 0.21783447265625, 0.22686004638671875, 0.2358856201171875, 0.24491119384765625, 0.253936767578125, 0.26296234130859375, 0.2719879150390625, 0.28101348876953125, 0.2900390625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 8.0, 8.0, 8.0, 10.0, 19.0, 21.0, 22.0, 32.0, 33.0, 32.0, 29.0, 37.0, 47.0, 35.0, 55.0, 53.0, 48.0, 51.0, 54.0, 36.0, 32.0, 33.0, 33.0, 38.0, 23.0, 27.0, 31.0, 22.0, 25.0, 18.0, 15.0, 16.0, 11.0, 10.0, 4.0, 5.0, 4.0, 1.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.221923828125, -0.21456527709960938, -0.20720672607421875, -0.19984817504882812, -0.1924896240234375, -0.18513107299804688, -0.17777252197265625, -0.17041397094726562, -0.163055419921875, -0.15569686889648438, -0.14833831787109375, -0.14097976684570312, -0.1336212158203125, -0.12626266479492188, -0.11890411376953125, -0.11154556274414062, -0.10418701171875, -0.09682846069335938, -0.08946990966796875, -0.08211135864257812, -0.0747528076171875, -0.06739425659179688, -0.06003570556640625, -0.052677154541015625, -0.045318603515625, -0.037960052490234375, -0.03060150146484375, -0.023242950439453125, -0.0158843994140625, -0.008525848388671875, -0.00116729736328125, 0.006191253662109375, 0.0135498046875, 0.020908355712890625, 0.02826690673828125, 0.035625457763671875, 0.0429840087890625, 0.050342559814453125, 0.05770111083984375, 0.06505966186523438, 0.072418212890625, 0.07977676391601562, 0.08713531494140625, 0.09449386596679688, 0.1018524169921875, 0.10921096801757812, 0.11656951904296875, 0.12392807006835938, 0.13128662109375, 0.13864517211914062, 0.14600372314453125, 0.15336227416992188, 0.1607208251953125, 0.16807937622070312, 0.17543792724609375, 0.18279647827148438, 0.190155029296875, 0.19751358032226562, 0.20487213134765625, 0.21223068237304688, 0.2195892333984375, 0.22694778442382812, 0.23430633544921875, 0.24166488647460938, 0.2490234375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 7.0, 19.0, 14.0, 24.0, 33.0, 64.0, 103.0, 255.0, 1063.0, 10755.0, 949727.0, 82892.0, 2758.0, 476.0, 160.0, 59.0, 40.0, 38.0, 15.0, 13.0, 9.0, 9.0, 5.0, 9.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1317138671875, -0.1272869110107422, -0.12285995483398438, -0.11843299865722656, -0.11400604248046875, -0.10957908630371094, -0.10515213012695312, -0.10072517395019531, -0.0962982177734375, -0.09187126159667969, -0.08744430541992188, -0.08301734924316406, -0.07859039306640625, -0.07416343688964844, -0.06973648071289062, -0.06530952453613281, -0.060882568359375, -0.05645561218261719, -0.052028656005859375, -0.04760169982910156, -0.04317474365234375, -0.03874778747558594, -0.034320831298828125, -0.029893875122070312, -0.0254669189453125, -0.021039962768554688, -0.016613006591796875, -0.012186050415039062, -0.00775909423828125, -0.0033321380615234375, 0.001094818115234375, 0.0055217742919921875, 0.00994873046875, 0.014375686645507812, 0.018802642822265625, 0.023229598999023438, 0.02765655517578125, 0.03208351135253906, 0.036510467529296875, 0.04093742370605469, 0.0453643798828125, 0.04979133605957031, 0.054218292236328125, 0.05864524841308594, 0.06307220458984375, 0.06749916076660156, 0.07192611694335938, 0.07635307312011719, 0.080780029296875, 0.08520698547363281, 0.08963394165039062, 0.09406089782714844, 0.09848785400390625, 0.10291481018066406, 0.10734176635742188, 0.11176872253417969, 0.1161956787109375, 0.12062263488769531, 0.12504959106445312, 0.12947654724121094, 0.13390350341796875, 0.13833045959472656, 0.14275741577148438, 0.1471843719482422, 0.151611328125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 3.0, 6.0, 8.0, 7.0, 7.0, 19.0, 24.0, 42.0, 68.0, 109.0, 195.0, 203.0, 129.0, 64.0, 34.0, 27.0, 13.0, 14.0, 12.0, 5.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2993812561035156e-05, -1.2575648725032806e-05, -1.2157484889030457e-05, -1.1739321053028107e-05, -1.1321157217025757e-05, -1.0902993381023407e-05, -1.0484829545021057e-05, -1.0066665709018707e-05, -9.648501873016357e-06, -9.230338037014008e-06, -8.812174201011658e-06, -8.394010365009308e-06, -7.975846529006958e-06, -7.557682693004608e-06, -7.139518857002258e-06, -6.7213550209999084e-06, -6.303191184997559e-06, -5.885027348995209e-06, -5.466863512992859e-06, -5.048699676990509e-06, -4.630535840988159e-06, -4.212372004985809e-06, -3.7942081689834595e-06, -3.3760443329811096e-06, -2.9578804969787598e-06, -2.53971666097641e-06, -2.12155282497406e-06, -1.7033889889717102e-06, -1.2852251529693604e-06, -8.670613169670105e-07, -4.4889748096466064e-07, -3.073364496231079e-08, 3.8743019104003906e-07, 8.055940270423889e-07, 1.2237578630447388e-06, 1.6419216990470886e-06, 2.0600855350494385e-06, 2.4782493710517883e-06, 2.896413207054138e-06, 3.314577043056488e-06, 3.732740879058838e-06, 4.150904715061188e-06, 4.569068551063538e-06, 4.9872323870658875e-06, 5.405396223068237e-06, 5.823560059070587e-06, 6.241723895072937e-06, 6.659887731075287e-06, 7.078051567077637e-06, 7.4962154030799866e-06, 7.914379239082336e-06, 8.332543075084686e-06, 8.750706911087036e-06, 9.168870747089386e-06, 9.587034583091736e-06, 1.0005198419094086e-05, 1.0423362255096436e-05, 1.0841526091098785e-05, 1.1259689927101135e-05, 1.1677853763103485e-05, 1.2096017599105835e-05, 1.2514181435108185e-05, 1.2932345271110535e-05, 1.3350509107112885e-05, 1.3768672943115234e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 8.0, 14.0, 14.0, 54.0, 103.0, 427.0, 2932.0, 647226.0, 394474.0, 2684.0, 397.0, 114.0, 40.0, 22.0, 13.0, 13.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1622314453125, -0.15517234802246094, -0.14811325073242188, -0.1410541534423828, -0.13399505615234375, -0.1269359588623047, -0.11987686157226562, -0.11281776428222656, -0.1057586669921875, -0.09869956970214844, -0.09164047241210938, -0.08458137512207031, -0.07752227783203125, -0.07046318054199219, -0.06340408325195312, -0.05634498596191406, -0.049285888671875, -0.04222679138183594, -0.035167694091796875, -0.028108596801757812, -0.02104949951171875, -0.013990402221679688, -0.006931304931640625, 0.0001277923583984375, 0.0071868896484375, 0.014245986938476562, 0.021305084228515625, 0.028364181518554688, 0.03542327880859375, 0.04248237609863281, 0.049541473388671875, 0.05660057067871094, 0.06365966796875, 0.07071876525878906, 0.07777786254882812, 0.08483695983886719, 0.09189605712890625, 0.09895515441894531, 0.10601425170898438, 0.11307334899902344, 0.1201324462890625, 0.12719154357910156, 0.13425064086914062, 0.1413097381591797, 0.14836883544921875, 0.1554279327392578, 0.16248703002929688, 0.16954612731933594, 0.176605224609375, 0.18366432189941406, 0.19072341918945312, 0.1977825164794922, 0.20484161376953125, 0.2119007110595703, 0.21895980834960938, 0.22601890563964844, 0.2330780029296875, 0.24013710021972656, 0.24719619750976562, 0.2542552947998047, 0.26131439208984375, 0.2683734893798828, 0.2754325866699219, 0.28249168395996094, 0.28955078125]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 7.0, 8.0, 12.0, 17.0, 44.0, 53.0, 115.0, 258.0, 231.0, 109.0, 56.0, 38.0, 13.0, 10.0, 6.0, 6.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.054962158203125, -0.05368375778198242, -0.052405357360839844, -0.051126956939697266, -0.04984855651855469, -0.04857015609741211, -0.04729175567626953, -0.04601335525512695, -0.044734954833984375, -0.0434565544128418, -0.04217815399169922, -0.04089975357055664, -0.03962135314941406, -0.038342952728271484, -0.037064552307128906, -0.03578615188598633, -0.03450775146484375, -0.03322935104370117, -0.031950950622558594, -0.030672550201416016, -0.029394149780273438, -0.02811574935913086, -0.02683734893798828, -0.025558948516845703, -0.024280548095703125, -0.023002147674560547, -0.02172374725341797, -0.02044534683227539, -0.019166946411132812, -0.017888545989990234, -0.016610145568847656, -0.015331745147705078, -0.0140533447265625, -0.012774944305419922, -0.011496543884277344, -0.010218143463134766, -0.008939743041992188, -0.007661342620849609, -0.006382942199707031, -0.005104541778564453, -0.003826141357421875, -0.002547740936279297, -0.0012693405151367188, 9.059906005859375e-06, 0.0012874603271484375, 0.0025658607482910156, 0.0038442611694335938, 0.005122661590576172, 0.00640106201171875, 0.007679462432861328, 0.008957862854003906, 0.010236263275146484, 0.011514663696289062, 0.01279306411743164, 0.014071464538574219, 0.015349864959716797, 0.016628265380859375, 0.017906665802001953, 0.01918506622314453, 0.02046346664428711, 0.021741867065429688, 0.023020267486572266, 0.024298667907714844, 0.025577068328857422, 0.02685546875]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 4.0, 7.0, 11.0, 12.0, 34.0, 74.0, 112.0, 183.0, 183.0, 145.0, 95.0, 52.0, 34.0, 22.0, 11.0, 7.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38317203521728516, -0.3685572147369385, -0.3539423644542694, -0.33932754397392273, -0.32471272349357605, -0.310097873210907, -0.2954830527305603, -0.2808682322502136, -0.26625341176986694, -0.25163859128952026, -0.2370237559080124, -0.22240892052650452, -0.20779410004615784, -0.19317926466464996, -0.1785644292831421, -0.1639496088027954, -0.14933475852012634, -0.13471992313861847, -0.12010510265827179, -0.10549026727676392, -0.09087543934583664, -0.07626061141490936, -0.06164577603340149, -0.04703094810247421, -0.032416120171546936, -0.01780129037797451, -0.0031864605844020844, 0.01142837107181549, 0.026043199002742767, 0.040658026933670044, 0.05527286231517792, 0.0698876902461052, 0.08450251817703247, 0.09911734610795975, 0.11373217403888702, 0.1283470094203949, 0.14296182990074158, 0.15757666528224945, 0.17219150066375732, 0.186806321144104, 0.20142115652561188, 0.21603599190711975, 0.23065081238746643, 0.2452656477689743, 0.2598804831504822, 0.27449530363082886, 0.28911012411117554, 0.3037249743938446, 0.3183397948741913, 0.33295461535453796, 0.34756946563720703, 0.3621842861175537, 0.3767991065979004, 0.39141392707824707, 0.40602877736091614, 0.4206435978412628, 0.4352584481239319, 0.44987326860427856, 0.46448811888694763, 0.4791029393672943, 0.493717759847641, 0.5083326101303101, 0.5229474306106567, 0.5375622510910034, 0.5521770715713501]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 1.0, 1.0, 3.0, 6.0, 4.0, 12.0, 10.0, 13.0, 13.0, 22.0, 22.0, 24.0, 21.0, 23.0, 36.0, 34.0, 43.0, 39.0, 26.0, 44.0, 44.0, 48.0, 51.0, 43.0, 29.0, 33.0, 40.0, 41.0, 30.0, 30.0, 24.0, 25.0, 25.0, 28.0, 20.0, 20.0, 12.0, 10.0, 10.0, 10.0, 6.0, 7.0, 5.0, 5.0, 5.0, 4.0, 3.0, 1.0, 0.0, 4.0, 0.0, 2.0], "bins": [-0.388520210981369, -0.37729737162590027, -0.3660745322704315, -0.35485169291496277, -0.343628853559494, -0.33240601420402527, -0.32118314504623413, -0.3099603056907654, -0.29873746633529663, -0.2875146269798279, -0.27629178762435913, -0.2650689482688904, -0.25384610891342163, -0.24262326955795288, -0.23140041530132294, -0.2201775759458542, -0.20895475149154663, -0.19773191213607788, -0.18650907278060913, -0.17528623342514038, -0.16406339406967163, -0.15284055471420288, -0.14161770045757294, -0.1303948611021042, -0.11917202174663544, -0.10794918239116669, -0.09672634303569794, -0.08550349622964859, -0.07428065687417984, -0.06305781751871109, -0.05183497071266174, -0.04061213135719299, -0.029389262199401855, -0.018166420981287956, -0.006943579763174057, 0.0042792633175849915, 0.015502102673053741, 0.02672494202852249, 0.03794778883457184, 0.04917062819004059, 0.06039346754550934, 0.07161630690097809, 0.08283914625644684, 0.09406199306249619, 0.10528483241796494, 0.11650767177343369, 0.12773051857948303, 0.13895335793495178, 0.15017619729042053, 0.16139903664588928, 0.17262187600135803, 0.18384471535682678, 0.19506755471229553, 0.20629039406776428, 0.21751324832439423, 0.22873608767986298, 0.23995892703533173, 0.25118178129196167, 0.2624046206474304, 0.27362746000289917, 0.2848502993583679, 0.29607313871383667, 0.3072959780693054, 0.31851881742477417, 0.3297416567802429]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 4.0, 3.0, 1.0, 12.0, 10.0, 10.0, 20.0, 26.0, 42.0, 53.0, 88.0, 155.0, 238.0, 417.0, 702.0, 1389.0, 2951.0, 7843.0, 32816.0, 368109.0, 3315159.0, 417360.0, 32846.0, 7895.0, 2997.0, 1382.0, 721.0, 400.0, 240.0, 145.0, 76.0, 60.0, 39.0, 33.0, 7.0, 14.0, 8.0, 8.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.226318359375, -0.2193584442138672, -0.21239852905273438, -0.20543861389160156, -0.19847869873046875, -0.19151878356933594, -0.18455886840820312, -0.1775989532470703, -0.1706390380859375, -0.1636791229248047, -0.15671920776367188, -0.14975929260253906, -0.14279937744140625, -0.13583946228027344, -0.12887954711914062, -0.12191963195800781, -0.114959716796875, -0.10799980163574219, -0.10103988647460938, -0.09407997131347656, -0.08712005615234375, -0.08016014099121094, -0.07320022583007812, -0.06624031066894531, -0.0592803955078125, -0.05232048034667969, -0.045360565185546875, -0.03840065002441406, -0.03144073486328125, -0.024480819702148438, -0.017520904541015625, -0.010560989379882812, -0.00360107421875, 0.0033588409423828125, 0.010318756103515625, 0.017278671264648438, 0.02423858642578125, 0.031198501586914062, 0.038158416748046875, 0.04511833190917969, 0.0520782470703125, 0.05903816223144531, 0.06599807739257812, 0.07295799255371094, 0.07991790771484375, 0.08687782287597656, 0.09383773803710938, 0.10079765319824219, 0.107757568359375, 0.11471748352050781, 0.12167739868164062, 0.12863731384277344, 0.13559722900390625, 0.14255714416503906, 0.14951705932617188, 0.1564769744873047, 0.1634368896484375, 0.1703968048095703, 0.17735671997070312, 0.18431663513183594, 0.19127655029296875, 0.19823646545410156, 0.20519638061523438, 0.2121562957763672, 0.2191162109375]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 5.0, 1.0, 3.0, 5.0, 8.0, 7.0, 11.0, 21.0, 14.0, 16.0, 34.0, 28.0, 29.0, 38.0, 47.0, 55.0, 49.0, 61.0, 52.0, 45.0, 71.0, 45.0, 55.0, 48.0, 44.0, 34.0, 31.0, 19.0, 31.0, 18.0, 20.0, 10.0, 19.0, 6.0, 2.0, 7.0, 2.0, 3.0, 5.0, 0.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.098876953125, -0.09499549865722656, -0.09111404418945312, -0.08723258972167969, -0.08335113525390625, -0.07946968078613281, -0.07558822631835938, -0.07170677185058594, -0.0678253173828125, -0.06394386291503906, -0.060062408447265625, -0.05618095397949219, -0.05229949951171875, -0.04841804504394531, -0.044536590576171875, -0.04065513610839844, -0.036773681640625, -0.03289222717285156, -0.029010772705078125, -0.025129318237304688, -0.02124786376953125, -0.017366409301757812, -0.013484954833984375, -0.009603500366210938, -0.0057220458984375, -0.0018405914306640625, 0.002040863037109375, 0.0059223175048828125, 0.00980377197265625, 0.013685226440429688, 0.017566680908203125, 0.021448135375976562, 0.02532958984375, 0.029211044311523438, 0.033092498779296875, 0.03697395324707031, 0.04085540771484375, 0.04473686218261719, 0.048618316650390625, 0.05249977111816406, 0.0563812255859375, 0.06026268005371094, 0.06414413452148438, 0.06802558898925781, 0.07190704345703125, 0.07578849792480469, 0.07966995239257812, 0.08355140686035156, 0.087432861328125, 0.09131431579589844, 0.09519577026367188, 0.09907722473144531, 0.10295867919921875, 0.10684013366699219, 0.11072158813476562, 0.11460304260253906, 0.1184844970703125, 0.12236595153808594, 0.12624740600585938, 0.1301288604736328, 0.13401031494140625, 0.1378917694091797, 0.14177322387695312, 0.14565467834472656, 0.1495361328125]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 8.0, 6.0, 13.0, 8.0, 18.0, 24.0, 37.0, 83.0, 107.0, 284.0, 622.0, 2225.0, 14292.0, 1135959.0, 3018251.0, 18474.0, 2569.0, 737.0, 272.0, 127.0, 64.0, 27.0, 22.0, 18.0, 3.0, 10.0, 6.0, 3.0, 7.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.322509765625, -0.3085212707519531, -0.29453277587890625, -0.2805442810058594, -0.2665557861328125, -0.2525672912597656, -0.23857879638671875, -0.22459030151367188, -0.210601806640625, -0.19661331176757812, -0.18262481689453125, -0.16863632202148438, -0.1546478271484375, -0.14065933227539062, -0.12667083740234375, -0.11268234252929688, -0.09869384765625, -0.08470535278320312, -0.07071685791015625, -0.056728363037109375, -0.0427398681640625, -0.028751373291015625, -0.01476287841796875, -0.000774383544921875, 0.013214111328125, 0.027202606201171875, 0.04119110107421875, 0.055179595947265625, 0.0691680908203125, 0.08315658569335938, 0.09714508056640625, 0.11113357543945312, 0.1251220703125, 0.13911056518554688, 0.15309906005859375, 0.16708755493164062, 0.1810760498046875, 0.19506454467773438, 0.20905303955078125, 0.22304153442382812, 0.237030029296875, 0.2510185241699219, 0.26500701904296875, 0.2789955139160156, 0.2929840087890625, 0.3069725036621094, 0.32096099853515625, 0.3349494934082031, 0.34893798828125, 0.3629264831542969, 0.37691497802734375, 0.3909034729003906, 0.4048919677734375, 0.4188804626464844, 0.43286895751953125, 0.4468574523925781, 0.460845947265625, 0.4748344421386719, 0.48882293701171875, 0.5028114318847656, 0.5167999267578125, 0.5307884216308594, 0.5447769165039062, 0.5587654113769531, 0.57275390625]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 3.0, 3.0, 7.0, 7.0, 9.0, 10.0, 14.0, 35.0, 38.0, 99.0, 180.0, 313.0, 693.0, 1059.0, 753.0, 366.0, 180.0, 94.0, 75.0, 35.0, 26.0, 17.0, 15.0, 12.0, 7.0, 6.0, 9.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0906982421875, -0.0885167121887207, -0.0863351821899414, -0.08415365219116211, -0.08197212219238281, -0.07979059219360352, -0.07760906219482422, -0.07542753219604492, -0.07324600219726562, -0.07106447219848633, -0.06888294219970703, -0.06670141220092773, -0.06451988220214844, -0.06233835220336914, -0.060156822204589844, -0.05797529220581055, -0.05579376220703125, -0.05361223220825195, -0.051430702209472656, -0.04924917221069336, -0.04706764221191406, -0.044886112213134766, -0.04270458221435547, -0.04052305221557617, -0.038341522216796875, -0.03615999221801758, -0.03397846221923828, -0.031796932220458984, -0.029615402221679688, -0.02743387222290039, -0.025252342224121094, -0.023070812225341797, -0.0208892822265625, -0.018707752227783203, -0.016526222229003906, -0.01434469223022461, -0.012163162231445312, -0.009981632232666016, -0.007800102233886719, -0.005618572235107422, -0.003437042236328125, -0.0012555122375488281, 0.0009260177612304688, 0.0031075477600097656, 0.0052890777587890625, 0.007470607757568359, 0.009652137756347656, 0.011833667755126953, 0.01401519775390625, 0.016196727752685547, 0.018378257751464844, 0.02055978775024414, 0.022741317749023438, 0.024922847747802734, 0.02710437774658203, 0.029285907745361328, 0.031467437744140625, 0.03364896774291992, 0.03583049774169922, 0.038012027740478516, 0.04019355773925781, 0.04237508773803711, 0.044556617736816406, 0.0467381477355957, 0.048919677734375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 6.0, 5.0, 9.0, 19.0, 38.0, 83.0, 119.0, 174.0, 186.0, 148.0, 85.0, 64.0, 37.0, 9.0, 9.0, 4.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4136539697647095, -0.4022037088871002, -0.39075344800949097, -0.3793031871318817, -0.36785292625427246, -0.3564026653766632, -0.34495240449905396, -0.3335021436214447, -0.32205188274383545, -0.3106016218662262, -0.29915136098861694, -0.2877011001110077, -0.27625083923339844, -0.2648005783557892, -0.25335031747817993, -0.24190005660057068, -0.23044981062412262, -0.21899954974651337, -0.2075492888689041, -0.19609902799129486, -0.1846487671136856, -0.17319850623607635, -0.1617482602596283, -0.15029799938201904, -0.1388477385044098, -0.12739747762680054, -0.11594721674919128, -0.10449695587158203, -0.09304669499397278, -0.08159643411636353, -0.07014618068933487, -0.058695919811725616, -0.04724565148353577, -0.035795390605926514, -0.02434513159096241, -0.012894872575998306, -0.0014446116983890533, 0.0100056491792202, 0.021455906331539154, 0.03290616720914841, 0.04435642808675766, 0.05580668896436691, 0.06725694984197617, 0.07870720326900482, 0.09015746414661407, 0.10160772502422333, 0.11305798590183258, 0.12450824677944183, 0.1359585076570511, 0.14740876853466034, 0.1588590294122696, 0.17030929028987885, 0.1817595511674881, 0.19320981204509735, 0.2046600580215454, 0.21611031889915466, 0.22756057977676392, 0.23901084065437317, 0.2504611015319824, 0.2619113624095917, 0.2733616232872009, 0.2848118841648102, 0.29626214504241943, 0.3077124059200287, 0.31916266679763794]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 4.0, 7.0, 13.0, 8.0, 12.0, 12.0, 20.0, 23.0, 22.0, 35.0, 38.0, 31.0, 41.0, 39.0, 52.0, 27.0, 52.0, 47.0, 45.0, 44.0, 46.0, 46.0, 50.0, 47.0, 42.0, 35.0, 22.0, 38.0, 28.0, 15.0, 12.0, 6.0, 10.0, 4.0, 4.0, 7.0, 7.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11764003336429596, -0.11358009278774261, -0.10952015221118927, -0.10546021908521652, -0.10140027850866318, -0.09734033793210983, -0.09328040480613708, -0.08922046422958374, -0.0851605236530304, -0.08110058307647705, -0.0770406424999237, -0.07298070937395096, -0.06892076879739761, -0.06486082822084427, -0.06080089136958122, -0.056740954518318176, -0.05268101394176483, -0.04862107336521149, -0.04456113651394844, -0.040501199662685394, -0.03644125908613205, -0.032381318509578705, -0.02832138165831566, -0.024261442944407463, -0.020201504230499268, -0.016141565516591072, -0.012081626802682877, -0.008021688088774681, -0.003961749374866486, 9.81893390417099e-05, 0.004158128052949905, 0.008218066766858101, 0.01227802038192749, 0.016337959095835686, 0.02039789780974388, 0.024457836523652077, 0.028517775237560272, 0.03257771581411362, 0.03663765266537666, 0.04069758951663971, 0.044757530093193054, 0.0488174706697464, 0.052877407521009445, 0.05693734437227249, 0.060997284948825836, 0.06505722552537918, 0.06911715865135193, 0.07317709922790527, 0.07723703980445862, 0.08129698038101196, 0.08535692095756531, 0.08941685408353806, 0.0934767946600914, 0.09753673523664474, 0.10159666836261749, 0.10565660893917084, 0.10971654951572418, 0.11377649009227753, 0.11783643066883087, 0.12189636379480362, 0.12595629692077637, 0.1300162374973297, 0.13407617807388306, 0.1381361186504364, 0.14219605922698975]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 7.0, 8.0, 13.0, 11.0, 26.0, 29.0, 47.0, 73.0, 103.0, 164.0, 262.0, 395.0, 683.0, 1109.0, 1945.0, 3831.0, 8066.0, 21199.0, 95432.0, 613053.0, 241798.0, 37204.0, 11746.0, 5067.0, 2632.0, 1531.0, 825.0, 466.0, 288.0, 165.0, 138.0, 83.0, 48.0, 50.0, 19.0, 9.0, 9.0, 4.0, 6.0, 3.0, 2.0, 5.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.045806884765625, -0.04415416717529297, -0.04250144958496094, -0.040848731994628906, -0.039196014404296875, -0.037543296813964844, -0.03589057922363281, -0.03423786163330078, -0.03258514404296875, -0.03093242645263672, -0.029279708862304688, -0.027626991271972656, -0.025974273681640625, -0.024321556091308594, -0.022668838500976562, -0.02101612091064453, -0.0193634033203125, -0.01771068572998047, -0.016057968139648438, -0.014405250549316406, -0.012752532958984375, -0.011099815368652344, -0.009447097778320312, -0.007794380187988281, -0.00614166259765625, -0.004488945007324219, -0.0028362274169921875, -0.0011835098266601562, 0.000469207763671875, 0.0021219253540039062, 0.0037746429443359375, 0.005427360534667969, 0.007080078125, 0.008732795715332031, 0.010385513305664062, 0.012038230895996094, 0.013690948486328125, 0.015343666076660156, 0.016996383666992188, 0.01864910125732422, 0.02030181884765625, 0.02195453643798828, 0.023607254028320312, 0.025259971618652344, 0.026912689208984375, 0.028565406799316406, 0.030218124389648438, 0.03187084197998047, 0.0335235595703125, 0.03517627716064453, 0.03682899475097656, 0.038481712341308594, 0.040134429931640625, 0.041787147521972656, 0.04343986511230469, 0.04509258270263672, 0.04674530029296875, 0.04839801788330078, 0.05005073547363281, 0.051703453063964844, 0.053356170654296875, 0.055008888244628906, 0.05666160583496094, 0.05831432342529297, 0.059967041015625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 9.0, 9.0, 9.0, 14.0, 16.0, 30.0, 28.0, 34.0, 50.0, 55.0, 55.0, 61.0, 67.0, 70.0, 58.0, 66.0, 57.0, 61.0, 55.0, 44.0, 42.0, 35.0, 24.0, 12.0, 9.0, 10.0, 6.0, 7.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09808349609375, -0.09442615509033203, -0.09076881408691406, -0.0871114730834961, -0.08345413208007812, -0.07979679107666016, -0.07613945007324219, -0.07248210906982422, -0.06882476806640625, -0.06516742706298828, -0.06151008605957031, -0.057852745056152344, -0.054195404052734375, -0.050538063049316406, -0.04688072204589844, -0.04322338104248047, -0.0395660400390625, -0.03590869903564453, -0.03225135803222656, -0.028594017028808594, -0.024936676025390625, -0.021279335021972656, -0.017621994018554688, -0.013964653015136719, -0.01030731201171875, -0.006649971008300781, -0.0029926300048828125, 0.0006647109985351562, 0.004322052001953125, 0.007979393005371094, 0.011636734008789062, 0.015294075012207031, 0.018951416015625, 0.02260875701904297, 0.026266098022460938, 0.029923439025878906, 0.033580780029296875, 0.037238121032714844, 0.04089546203613281, 0.04455280303955078, 0.04821014404296875, 0.05186748504638672, 0.05552482604980469, 0.059182167053222656, 0.06283950805664062, 0.0664968490600586, 0.07015419006347656, 0.07381153106689453, 0.0774688720703125, 0.08112621307373047, 0.08478355407714844, 0.0884408950805664, 0.09209823608398438, 0.09575557708740234, 0.09941291809082031, 0.10307025909423828, 0.10672760009765625, 0.11038494110107422, 0.11404228210449219, 0.11769962310791016, 0.12135696411132812, 0.1250143051147461, 0.12867164611816406, 0.13232898712158203, 0.135986328125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 4.0, 5.0, 4.0, 10.0, 11.0, 15.0, 16.0, 28.0, 43.0, 77.0, 166.0, 286.0, 731.0, 1802.0, 5298.0, 23853.0, 446803.0, 533094.0, 27334.0, 5687.0, 1897.0, 727.0, 296.0, 148.0, 82.0, 40.0, 32.0, 18.0, 13.0, 2.0, 7.0, 5.0, 4.0, 2.0, 2.0, 3.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.08599853515625, -0.08367633819580078, -0.08135414123535156, -0.07903194427490234, -0.07670974731445312, -0.0743875503540039, -0.07206535339355469, -0.06974315643310547, -0.06742095947265625, -0.06509876251220703, -0.06277656555175781, -0.060454368591308594, -0.058132171630859375, -0.055809974670410156, -0.05348777770996094, -0.05116558074951172, -0.0488433837890625, -0.04652118682861328, -0.04419898986816406, -0.041876792907714844, -0.039554595947265625, -0.037232398986816406, -0.03491020202636719, -0.03258800506591797, -0.03026580810546875, -0.02794361114501953, -0.025621414184570312, -0.023299217224121094, -0.020977020263671875, -0.018654823303222656, -0.016332626342773438, -0.014010429382324219, -0.011688232421875, -0.009366035461425781, -0.0070438385009765625, -0.004721641540527344, -0.002399444580078125, -7.724761962890625e-05, 0.0022449493408203125, 0.004567146301269531, 0.00688934326171875, 0.009211540222167969, 0.011533737182617188, 0.013855934143066406, 0.016178131103515625, 0.018500328063964844, 0.020822525024414062, 0.02314472198486328, 0.0254669189453125, 0.02778911590576172, 0.030111312866210938, 0.032433509826660156, 0.034755706787109375, 0.037077903747558594, 0.03940010070800781, 0.04172229766845703, 0.04404449462890625, 0.04636669158935547, 0.04868888854980469, 0.051011085510253906, 0.053333282470703125, 0.055655479431152344, 0.05797767639160156, 0.06029987335205078, 0.0626220703125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 4.0, 10.0, 12.0, 10.0, 15.0, 11.0, 19.0, 20.0, 30.0, 26.0, 38.0, 36.0, 25.0, 52.0, 48.0, 46.0, 33.0, 40.0, 57.0, 45.0, 35.0, 46.0, 53.0, 39.0, 38.0, 35.0, 30.0, 27.0, 30.0, 18.0, 22.0, 8.0, 12.0, 3.0, 7.0, 6.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1611328125, -0.1559123992919922, -0.15069198608398438, -0.14547157287597656, -0.14025115966796875, -0.13503074645996094, -0.12981033325195312, -0.12458992004394531, -0.1193695068359375, -0.11414909362792969, -0.10892868041992188, -0.10370826721191406, -0.09848785400390625, -0.09326744079589844, -0.08804702758789062, -0.08282661437988281, -0.077606201171875, -0.07238578796386719, -0.06716537475585938, -0.06194496154785156, -0.05672454833984375, -0.05150413513183594, -0.046283721923828125, -0.04106330871582031, -0.0358428955078125, -0.030622482299804688, -0.025402069091796875, -0.020181655883789062, -0.01496124267578125, -0.009740829467773438, -0.004520416259765625, 0.0006999969482421875, 0.00592041015625, 0.011140823364257812, 0.016361236572265625, 0.021581649780273438, 0.02680206298828125, 0.03202247619628906, 0.037242889404296875, 0.04246330261230469, 0.0476837158203125, 0.05290412902832031, 0.058124542236328125, 0.06334495544433594, 0.06856536865234375, 0.07378578186035156, 0.07900619506835938, 0.08422660827636719, 0.089447021484375, 0.09466743469238281, 0.09988784790039062, 0.10510826110839844, 0.11032867431640625, 0.11554908752441406, 0.12076950073242188, 0.1259899139404297, 0.1312103271484375, 0.1364307403564453, 0.14165115356445312, 0.14687156677246094, 0.15209197998046875, 0.15731239318847656, 0.16253280639648438, 0.1677532196044922, 0.1729736328125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 3.0, 6.0, 8.0, 11.0, 10.0, 17.0, 18.0, 33.0, 42.0, 78.0, 123.0, 239.0, 357.0, 811.0, 1981.0, 5821.0, 22293.0, 145021.0, 697981.0, 142005.0, 22020.0, 5768.0, 2074.0, 846.0, 440.0, 218.0, 117.0, 56.0, 52.0, 32.0, 22.0, 12.0, 14.0, 5.0, 2.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0153045654296875, -0.014802694320678711, -0.014300823211669922, -0.013798952102661133, -0.013297080993652344, -0.012795209884643555, -0.012293338775634766, -0.011791467666625977, -0.011289596557617188, -0.010787725448608398, -0.01028585433959961, -0.00978398323059082, -0.009282112121582031, -0.008780241012573242, -0.008278369903564453, -0.007776498794555664, -0.007274627685546875, -0.006772756576538086, -0.006270885467529297, -0.005769014358520508, -0.005267143249511719, -0.00476527214050293, -0.004263401031494141, -0.0037615299224853516, -0.0032596588134765625, -0.0027577877044677734, -0.0022559165954589844, -0.0017540454864501953, -0.0012521743774414062, -0.0007503032684326172, -0.0002484321594238281, 0.00025343894958496094, 0.00075531005859375, 0.001257181167602539, 0.0017590522766113281, 0.002260923385620117, 0.0027627944946289062, 0.0032646656036376953, 0.0037665367126464844, 0.0042684078216552734, 0.0047702789306640625, 0.0052721500396728516, 0.005774021148681641, 0.00627589225769043, 0.006777763366699219, 0.007279634475708008, 0.007781505584716797, 0.008283376693725586, 0.008785247802734375, 0.009287118911743164, 0.009788990020751953, 0.010290861129760742, 0.010792732238769531, 0.01129460334777832, 0.01179647445678711, 0.012298345565795898, 0.012800216674804688, 0.013302087783813477, 0.013803958892822266, 0.014305830001831055, 0.014807701110839844, 0.015309572219848633, 0.015811443328857422, 0.01631331443786621, 0.016815185546875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 2.0, 2.0, 8.0, 8.0, 13.0, 19.0, 16.0, 24.0, 39.0, 47.0, 56.0, 47.0, 69.0, 74.0, 81.0, 98.0, 74.0, 65.0, 63.0, 38.0, 32.0, 28.0, 23.0, 17.0, 10.0, 11.0, 7.0, 4.0, 3.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0067901611328125e-06, -4.827044904232025e-06, -4.647299647331238e-06, -4.4675543904304504e-06, -4.287809133529663e-06, -4.108063876628876e-06, -3.928318619728088e-06, -3.748573362827301e-06, -3.5688281059265137e-06, -3.3890828490257263e-06, -3.209337592124939e-06, -3.0295923352241516e-06, -2.8498470783233643e-06, -2.670101821422577e-06, -2.4903565645217896e-06, -2.310611307621002e-06, -2.130866050720215e-06, -1.9511207938194275e-06, -1.7713755369186401e-06, -1.5916302800178528e-06, -1.4118850231170654e-06, -1.232139766216278e-06, -1.0523945093154907e-06, -8.726492524147034e-07, -6.92903995513916e-07, -5.131587386131287e-07, -3.334134817123413e-07, -1.5366822481155396e-07, 2.60770320892334e-08, 2.0582228899002075e-07, 3.855675458908081e-07, 5.653128027915955e-07, 7.450580596923828e-07, 9.248033165931702e-07, 1.1045485734939575e-06, 1.2842938303947449e-06, 1.4640390872955322e-06, 1.6437843441963196e-06, 1.823529601097107e-06, 2.0032748579978943e-06, 2.1830201148986816e-06, 2.362765371799469e-06, 2.5425106287002563e-06, 2.7222558856010437e-06, 2.902001142501831e-06, 3.0817463994026184e-06, 3.2614916563034058e-06, 3.441236913204193e-06, 3.6209821701049805e-06, 3.800727427005768e-06, 3.980472683906555e-06, 4.1602179408073425e-06, 4.33996319770813e-06, 4.519708454608917e-06, 4.699453711509705e-06, 4.879198968410492e-06, 5.058944225311279e-06, 5.238689482212067e-06, 5.418434739112854e-06, 5.598179996013641e-06, 5.777925252914429e-06, 5.957670509815216e-06, 6.137415766716003e-06, 6.317161023616791e-06, 6.496906280517578e-06]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 7.0, 4.0, 11.0, 15.0, 11.0, 25.0, 39.0, 39.0, 71.0, 128.0, 194.0, 319.0, 553.0, 996.0, 2093.0, 4895.0, 14299.0, 59439.0, 363697.0, 487548.0, 84442.0, 18577.0, 6012.0, 2388.0, 1153.0, 644.0, 384.0, 198.0, 125.0, 89.0, 52.0, 33.0, 28.0, 13.0, 14.0, 6.0, 6.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01465606689453125, -0.014213323593139648, -0.013770580291748047, -0.013327836990356445, -0.012885093688964844, -0.012442350387573242, -0.01199960708618164, -0.011556863784790039, -0.011114120483398438, -0.010671377182006836, -0.010228633880615234, -0.009785890579223633, -0.009343147277832031, -0.00890040397644043, -0.008457660675048828, -0.008014917373657227, -0.007572174072265625, -0.0071294307708740234, -0.006686687469482422, -0.00624394416809082, -0.005801200866699219, -0.005358457565307617, -0.004915714263916016, -0.004472970962524414, -0.0040302276611328125, -0.003587484359741211, -0.0031447410583496094, -0.002701997756958008, -0.0022592544555664062, -0.0018165111541748047, -0.0013737678527832031, -0.0009310245513916016, -0.00048828125, -4.553794860839844e-05, 0.0003972053527832031, 0.0008399486541748047, 0.0012826919555664062, 0.0017254352569580078, 0.0021681785583496094, 0.002610921859741211, 0.0030536651611328125, 0.003496408462524414, 0.003939151763916016, 0.004381895065307617, 0.004824638366699219, 0.00526738166809082, 0.005710124969482422, 0.0061528682708740234, 0.006595611572265625, 0.0070383548736572266, 0.007481098175048828, 0.00792384147644043, 0.008366584777832031, 0.008809328079223633, 0.009252071380615234, 0.009694814682006836, 0.010137557983398438, 0.010580301284790039, 0.01102304458618164, 0.011465787887573242, 0.011908531188964844, 0.012351274490356445, 0.012794017791748047, 0.013236761093139648, 0.01367950439453125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 7.0, 4.0, 8.0, 11.0, 19.0, 25.0, 29.0, 35.0, 46.0, 54.0, 74.0, 94.0, 101.0, 82.0, 72.0, 75.0, 55.0, 54.0, 44.0, 28.0, 16.0, 19.0, 14.0, 7.0, 6.0, 4.0, 5.0, 4.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00290679931640625, -0.0027904510498046875, -0.002674102783203125, -0.0025577545166015625, -0.00244140625, -0.0023250579833984375, -0.002208709716796875, -0.0020923614501953125, -0.00197601318359375, -0.0018596649169921875, -0.001743316650390625, -0.0016269683837890625, -0.0015106201171875, -0.0013942718505859375, -0.001277923583984375, -0.0011615753173828125, -0.00104522705078125, -0.0009288787841796875, -0.000812530517578125, -0.0006961822509765625, -0.000579833984375, -0.0004634857177734375, -0.000347137451171875, -0.0002307891845703125, -0.00011444091796875, 1.9073486328125e-06, 0.000118255615234375, 0.0002346038818359375, 0.0003509521484375, 0.0004673004150390625, 0.000583648681640625, 0.0006999969482421875, 0.00081634521484375, 0.0009326934814453125, 0.001049041748046875, 0.0011653900146484375, 0.00128173828125, 0.0013980865478515625, 0.001514434814453125, 0.0016307830810546875, 0.00174713134765625, 0.0018634796142578125, 0.001979827880859375, 0.0020961761474609375, 0.0022125244140625, 0.0023288726806640625, 0.002445220947265625, 0.0025615692138671875, 0.00267791748046875, 0.0027942657470703125, 0.002910614013671875, 0.0030269622802734375, 0.003143310546875, 0.0032596588134765625, 0.003376007080078125, 0.0034923553466796875, 0.00360870361328125, 0.0037250518798828125, 0.003841400146484375, 0.0039577484130859375, 0.0040740966796875, 0.0041904449462890625, 0.004306793212890625, 0.0044231414794921875, 0.00453948974609375]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 10.0, 13.0, 31.0, 88.0, 160.0, 228.0, 214.0, 129.0, 68.0, 24.0, 18.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31877464056015015, -0.3103354275226593, -0.30189621448516846, -0.29345703125, -0.28501781821250916, -0.2765786051750183, -0.26813939213752747, -0.2597001791000366, -0.25126099586486816, -0.24282178282737732, -0.23438258469104767, -0.22594337165355682, -0.21750417351722717, -0.20906496047973633, -0.20062574744224548, -0.19218653440475464, -0.1837473213672638, -0.17530810832977295, -0.1668689101934433, -0.15842969715595245, -0.1499904990196228, -0.14155128598213196, -0.1331120729446411, -0.12467286735773087, -0.11623366177082062, -0.10779445618391037, -0.09935525059700012, -0.09091603755950928, -0.08247683197259903, -0.07403762638568878, -0.06559841334819794, -0.05715920776128769, -0.04871998727321625, -0.040280781686306, -0.031841572374105453, -0.023402364924550056, -0.01496315747499466, -0.006523951888084412, 0.0019152574241161346, 0.010354466736316681, 0.01879367232322693, 0.027232879772782326, 0.03567208722233772, 0.04411129653453827, 0.05255050212144852, 0.060989707708358765, 0.06942892074584961, 0.07786812633275986, 0.0863073319196701, 0.09474653750658035, 0.1031857430934906, 0.11162495613098145, 0.1200641617178917, 0.12850336730480194, 0.13694258034229279, 0.14538177847862244, 0.15382099151611328, 0.16226020455360413, 0.17069940268993378, 0.17913861572742462, 0.18757781386375427, 0.19601702690124512, 0.20445623993873596, 0.2128954529762268, 0.22133465111255646]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 8.0, 3.0, 12.0, 11.0, 10.0, 24.0, 33.0, 33.0, 50.0, 40.0, 56.0, 61.0, 52.0, 60.0, 69.0, 56.0, 59.0, 52.0, 64.0, 61.0, 37.0, 38.0, 40.0, 12.0, 15.0, 13.0, 7.0, 10.0, 3.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08594147861003876, -0.08259603381156921, -0.07925058156251907, -0.07590513676404953, -0.07255969196557999, -0.06921423971652985, -0.0658687949180603, -0.06252335011959076, -0.059177905321121216, -0.055832456797361374, -0.05248701199889183, -0.04914156347513199, -0.045796118676662445, -0.0424506701529026, -0.03910522162914276, -0.03575977683067322, -0.032414328306913376, -0.029068881645798683, -0.02572343498468399, -0.02237798646092415, -0.019032541662454605, -0.015687093138694763, -0.01234164647758007, -0.008996199816465378, -0.005650753155350685, -0.0023053062614053488, 0.0010401406325399876, 0.0043855877593159676, 0.00773103442043066, 0.011076482012867928, 0.01442192867398262, 0.017767375335097313, 0.021112821996212006, 0.0244582686573267, 0.02780371531844139, 0.031149163842201233, 0.034494608640670776, 0.03784005716443062, 0.04118550568819046, 0.044530950486660004, 0.04787639528512955, 0.05122184380888939, 0.05456728860735893, 0.057912737131118774, 0.06125818192958832, 0.06460362672805786, 0.067949078977108, 0.07129452377557755, 0.07463997602462769, 0.07798542082309723, 0.08133087307214737, 0.08467631787061691, 0.08802176266908646, 0.0913672149181366, 0.09471265971660614, 0.09805810451507568, 0.10140354931354523, 0.10474899411201477, 0.10809444636106491, 0.11143989115953445, 0.114785335958004, 0.11813078820705414, 0.12147623300552368, 0.12482167780399323, 0.12816712260246277]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 4.0, 5.0, 10.0, 9.0, 12.0, 16.0, 17.0, 36.0, 47.0, 77.0, 132.0, 217.0, 279.0, 470.0, 882.0, 1543.0, 2943.0, 6018.0, 13143.0, 35739.0, 171263.0, 680459.0, 89537.0, 25209.0, 10287.0, 4636.0, 2391.0, 1259.0, 724.0, 455.0, 250.0, 161.0, 116.0, 67.0, 44.0, 29.0, 24.0, 14.0, 12.0, 8.0, 8.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09271240234375, -0.08932113647460938, -0.08592987060546875, -0.08253860473632812, -0.0791473388671875, -0.07575607299804688, -0.07236480712890625, -0.06897354125976562, -0.065582275390625, -0.062191009521484375, -0.05879974365234375, -0.055408477783203125, -0.0520172119140625, -0.048625946044921875, -0.04523468017578125, -0.041843414306640625, -0.0384521484375, -0.035060882568359375, -0.03166961669921875, -0.028278350830078125, -0.0248870849609375, -0.021495819091796875, -0.01810455322265625, -0.014713287353515625, -0.011322021484375, -0.007930755615234375, -0.00453948974609375, -0.001148223876953125, 0.0022430419921875, 0.005634307861328125, 0.00902557373046875, 0.012416839599609375, 0.01580810546875, 0.019199371337890625, 0.02259063720703125, 0.025981903076171875, 0.0293731689453125, 0.032764434814453125, 0.03615570068359375, 0.039546966552734375, 0.042938232421875, 0.046329498291015625, 0.04972076416015625, 0.053112030029296875, 0.0565032958984375, 0.059894561767578125, 0.06328582763671875, 0.06667709350585938, 0.070068359375, 0.07345962524414062, 0.07685089111328125, 0.08024215698242188, 0.0836334228515625, 0.08702468872070312, 0.09041595458984375, 0.09380722045898438, 0.097198486328125, 0.10058975219726562, 0.10398101806640625, 0.10737228393554688, 0.1107635498046875, 0.11415481567382812, 0.11754608154296875, 0.12093734741210938, 0.12432861328125]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 2.0, 5.0, 4.0, 7.0, 8.0, 8.0, 16.0, 18.0, 17.0, 31.0, 39.0, 39.0, 46.0, 59.0, 50.0, 65.0, 66.0, 45.0, 56.0, 57.0, 55.0, 61.0, 56.0, 37.0, 35.0, 33.0, 19.0, 23.0, 7.0, 8.0, 9.0, 5.0, 5.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1820068359375, -0.17581939697265625, -0.1696319580078125, -0.16344451904296875, -0.157257080078125, -0.15106964111328125, -0.1448822021484375, -0.13869476318359375, -0.13250732421875, -0.12631988525390625, -0.1201324462890625, -0.11394500732421875, -0.107757568359375, -0.10157012939453125, -0.0953826904296875, -0.08919525146484375, -0.0830078125, -0.07682037353515625, -0.0706329345703125, -0.06444549560546875, -0.058258056640625, -0.05207061767578125, -0.0458831787109375, -0.03969573974609375, -0.03350830078125, -0.02732086181640625, -0.0211334228515625, -0.01494598388671875, -0.008758544921875, -0.00257110595703125, 0.0036163330078125, 0.00980377197265625, 0.0159912109375, 0.02217864990234375, 0.0283660888671875, 0.03455352783203125, 0.040740966796875, 0.04692840576171875, 0.0531158447265625, 0.05930328369140625, 0.06549072265625, 0.07167816162109375, 0.0778656005859375, 0.08405303955078125, 0.090240478515625, 0.09642791748046875, 0.1026153564453125, 0.10880279541015625, 0.114990234375, 0.12117767333984375, 0.1273651123046875, 0.13355255126953125, 0.139739990234375, 0.14592742919921875, 0.1521148681640625, 0.15830230712890625, 0.16448974609375, 0.17067718505859375, 0.1768646240234375, 0.18305206298828125, 0.189239501953125, 0.19542694091796875, 0.2016143798828125, 0.20780181884765625, 0.2139892578125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0, 5.0, 8.0, 7.0, 14.0, 21.0, 12.0, 26.0, 20.0, 22.0, 36.0, 45.0, 60.0, 83.0, 120.0, 151.0, 178.0, 251.0, 390.0, 841.0, 3050.0, 16699.0, 630274.0, 377084.0, 14148.0, 2695.0, 823.0, 396.0, 251.0, 182.0, 152.0, 125.0, 64.0, 84.0, 48.0, 47.0, 46.0, 24.0, 22.0, 19.0, 10.0, 5.0, 5.0, 8.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2342529296875, -0.22643470764160156, -0.21861648559570312, -0.2107982635498047, -0.20298004150390625, -0.1951618194580078, -0.18734359741210938, -0.17952537536621094, -0.1717071533203125, -0.16388893127441406, -0.15607070922851562, -0.1482524871826172, -0.14043426513671875, -0.1326160430908203, -0.12479782104492188, -0.11697959899902344, -0.109161376953125, -0.10134315490722656, -0.09352493286132812, -0.08570671081542969, -0.07788848876953125, -0.07007026672363281, -0.062252044677734375, -0.05443382263183594, -0.0466156005859375, -0.03879737854003906, -0.030979156494140625, -0.023160934448242188, -0.01534271240234375, -0.0075244903564453125, 0.000293731689453125, 0.008111953735351562, 0.01593017578125, 0.023748397827148438, 0.031566619873046875, 0.03938484191894531, 0.04720306396484375, 0.05502128601074219, 0.06283950805664062, 0.07065773010253906, 0.0784759521484375, 0.08629417419433594, 0.09411239624023438, 0.10193061828613281, 0.10974884033203125, 0.11756706237792969, 0.12538528442382812, 0.13320350646972656, 0.141021728515625, 0.14883995056152344, 0.15665817260742188, 0.1644763946533203, 0.17229461669921875, 0.1801128387451172, 0.18793106079101562, 0.19574928283691406, 0.2035675048828125, 0.21138572692871094, 0.21920394897460938, 0.2270221710205078, 0.23484039306640625, 0.2426586151123047, 0.2504768371582031, 0.25829505920410156, 0.26611328125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 1.0, 5.0, 7.0, 4.0, 8.0, 5.0, 8.0, 13.0, 11.0, 23.0, 24.0, 21.0, 17.0, 26.0, 26.0, 40.0, 23.0, 46.0, 39.0, 34.0, 44.0, 48.0, 42.0, 41.0, 48.0, 46.0, 36.0, 31.0, 32.0, 29.0, 20.0, 20.0, 27.0, 22.0, 24.0, 29.0, 18.0, 13.0, 14.0, 5.0, 9.0, 4.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 4.0], "bins": [-0.1719970703125, -0.16673660278320312, -0.16147613525390625, -0.15621566772460938, -0.1509552001953125, -0.14569473266601562, -0.14043426513671875, -0.13517379760742188, -0.129913330078125, -0.12465286254882812, -0.11939239501953125, -0.11413192749023438, -0.1088714599609375, -0.10361099243164062, -0.09835052490234375, -0.09309005737304688, -0.08782958984375, -0.08256912231445312, -0.07730865478515625, -0.07204818725585938, -0.0667877197265625, -0.061527252197265625, -0.05626678466796875, -0.051006317138671875, -0.045745849609375, -0.040485382080078125, -0.03522491455078125, -0.029964447021484375, -0.0247039794921875, -0.019443511962890625, -0.01418304443359375, -0.008922576904296875, -0.003662109375, 0.001598358154296875, 0.00685882568359375, 0.012119293212890625, 0.0173797607421875, 0.022640228271484375, 0.02790069580078125, 0.033161163330078125, 0.038421630859375, 0.043682098388671875, 0.04894256591796875, 0.054203033447265625, 0.0594635009765625, 0.06472396850585938, 0.06998443603515625, 0.07524490356445312, 0.08050537109375, 0.08576583862304688, 0.09102630615234375, 0.09628677368164062, 0.1015472412109375, 0.10680770874023438, 0.11206817626953125, 0.11732864379882812, 0.122589111328125, 0.12784957885742188, 0.13311004638671875, 0.13837051391601562, 0.1436309814453125, 0.14889144897460938, 0.15415191650390625, 0.15941238403320312, 0.1646728515625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 2.0, 5.0, 7.0, 6.0, 16.0, 7.0, 21.0, 42.0, 37.0, 73.0, 88.0, 204.0, 372.0, 767.0, 1611.0, 4209.0, 15312.0, 326154.0, 673493.0, 17945.0, 4544.0, 1794.0, 832.0, 406.0, 206.0, 139.0, 78.0, 60.0, 27.0, 36.0, 13.0, 10.0, 12.0, 8.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.0970458984375, -0.09435367584228516, -0.09166145324707031, -0.08896923065185547, -0.08627700805664062, -0.08358478546142578, -0.08089256286621094, -0.0782003402709961, -0.07550811767578125, -0.0728158950805664, -0.07012367248535156, -0.06743144989013672, -0.06473922729492188, -0.06204700469970703, -0.05935478210449219, -0.056662559509277344, -0.0539703369140625, -0.051278114318847656, -0.04858589172363281, -0.04589366912841797, -0.043201446533203125, -0.04050922393798828, -0.03781700134277344, -0.035124778747558594, -0.03243255615234375, -0.029740333557128906, -0.027048110961914062, -0.02435588836669922, -0.021663665771484375, -0.01897144317626953, -0.016279220581054688, -0.013586997985839844, -0.010894775390625, -0.008202552795410156, -0.0055103302001953125, -0.0028181076049804688, -0.000125885009765625, 0.0025663375854492188, 0.0052585601806640625, 0.007950782775878906, 0.01064300537109375, 0.013335227966308594, 0.016027450561523438, 0.01871967315673828, 0.021411895751953125, 0.02410411834716797, 0.026796340942382812, 0.029488563537597656, 0.0321807861328125, 0.034873008728027344, 0.03756523132324219, 0.04025745391845703, 0.042949676513671875, 0.04564189910888672, 0.04833412170410156, 0.051026344299316406, 0.05371856689453125, 0.056410789489746094, 0.05910301208496094, 0.06179523468017578, 0.06448745727539062, 0.06717967987060547, 0.06987190246582031, 0.07256412506103516, 0.07525634765625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 2.0, 9.0, 5.0, 7.0, 13.0, 23.0, 27.0, 61.0, 121.0, 337.0, 191.0, 79.0, 40.0, 22.0, 18.0, 13.0, 13.0, 4.0, 10.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3589859008789062e-05, -1.3173557817935944e-05, -1.2757256627082825e-05, -1.2340955436229706e-05, -1.1924654245376587e-05, -1.1508353054523468e-05, -1.1092051863670349e-05, -1.067575067281723e-05, -1.0259449481964111e-05, -9.843148291110992e-06, -9.426847100257874e-06, -9.010545909404755e-06, -8.594244718551636e-06, -8.177943527698517e-06, -7.761642336845398e-06, -7.345341145992279e-06, -6.92903995513916e-06, -6.512738764286041e-06, -6.096437573432922e-06, -5.6801363825798035e-06, -5.2638351917266846e-06, -4.847534000873566e-06, -4.431232810020447e-06, -4.014931619167328e-06, -3.598630428314209e-06, -3.18232923746109e-06, -2.766028046607971e-06, -2.3497268557548523e-06, -1.9334256649017334e-06, -1.5171244740486145e-06, -1.1008232831954956e-06, -6.845220923423767e-07, -2.682209014892578e-07, 1.4808028936386108e-07, 5.6438148021698e-07, 9.806826710700989e-07, 1.3969838619232178e-06, 1.8132850527763367e-06, 2.2295862436294556e-06, 2.6458874344825745e-06, 3.0621886253356934e-06, 3.4784898161888123e-06, 3.894791007041931e-06, 4.31109219789505e-06, 4.727393388748169e-06, 5.143694579601288e-06, 5.559995770454407e-06, 5.976296961307526e-06, 6.3925981521606445e-06, 6.8088993430137634e-06, 7.225200533866882e-06, 7.641501724720001e-06, 8.05780291557312e-06, 8.474104106426239e-06, 8.890405297279358e-06, 9.306706488132477e-06, 9.723007678985596e-06, 1.0139308869838715e-05, 1.0555610060691833e-05, 1.0971911251544952e-05, 1.1388212442398071e-05, 1.180451363325119e-05, 1.2220814824104309e-05, 1.2637116014957428e-05, 1.3053417205810547e-05]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 4.0, 2.0, 2.0, 3.0, 4.0, 8.0, 11.0, 24.0, 39.0, 68.0, 160.0, 347.0, 886.0, 2831.0, 14047.0, 906676.0, 113912.0, 6730.0, 1701.0, 583.0, 245.0, 101.0, 64.0, 35.0, 24.0, 13.0, 3.0, 6.0, 5.0, 8.0, 7.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.16552734375, -0.1611490249633789, -0.1567707061767578, -0.15239238739013672, -0.14801406860351562, -0.14363574981689453, -0.13925743103027344, -0.13487911224365234, -0.13050079345703125, -0.12612247467041016, -0.12174415588378906, -0.11736583709716797, -0.11298751831054688, -0.10860919952392578, -0.10423088073730469, -0.0998525619506836, -0.0954742431640625, -0.0910959243774414, -0.08671760559082031, -0.08233928680419922, -0.07796096801757812, -0.07358264923095703, -0.06920433044433594, -0.06482601165771484, -0.06044769287109375, -0.056069374084472656, -0.05169105529785156, -0.04731273651123047, -0.042934417724609375, -0.03855609893798828, -0.03417778015136719, -0.029799461364746094, -0.025421142578125, -0.021042823791503906, -0.016664505004882812, -0.012286186218261719, -0.007907867431640625, -0.0035295486450195312, 0.0008487701416015625, 0.005227088928222656, 0.00960540771484375, 0.013983726501464844, 0.018362045288085938, 0.02274036407470703, 0.027118682861328125, 0.03149700164794922, 0.03587532043457031, 0.040253639221191406, 0.0446319580078125, 0.049010276794433594, 0.05338859558105469, 0.05776691436767578, 0.062145233154296875, 0.06652355194091797, 0.07090187072753906, 0.07528018951416016, 0.07965850830078125, 0.08403682708740234, 0.08841514587402344, 0.09279346466064453, 0.09717178344726562, 0.10155010223388672, 0.10592842102050781, 0.1103067398071289, 0.11468505859375]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 1.0, 3.0, 1.0, 5.0, 5.0, 6.0, 12.0, 16.0, 37.0, 65.0, 110.0, 271.0, 211.0, 105.0, 51.0, 47.0, 21.0, 12.0, 4.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03369140625, -0.03239250183105469, -0.031093597412109375, -0.029794692993164062, -0.02849578857421875, -0.027196884155273438, -0.025897979736328125, -0.024599075317382812, -0.0233001708984375, -0.022001266479492188, -0.020702362060546875, -0.019403457641601562, -0.01810455322265625, -0.016805648803710938, -0.015506744384765625, -0.014207839965820312, -0.012908935546875, -0.011610031127929688, -0.010311126708984375, -0.009012222290039062, -0.00771331787109375, -0.0064144134521484375, -0.005115509033203125, -0.0038166046142578125, -0.0025177001953125, -0.0012187957763671875, 8.0108642578125e-05, 0.0013790130615234375, 0.00267791748046875, 0.0039768218994140625, 0.005275726318359375, 0.0065746307373046875, 0.00787353515625, 0.009172439575195312, 0.010471343994140625, 0.011770248413085938, 0.01306915283203125, 0.014368057250976562, 0.015666961669921875, 0.016965866088867188, 0.0182647705078125, 0.019563674926757812, 0.020862579345703125, 0.022161483764648438, 0.02346038818359375, 0.024759292602539062, 0.026058197021484375, 0.027357101440429688, 0.028656005859375, 0.029954910278320312, 0.031253814697265625, 0.03255271911621094, 0.03385162353515625, 0.03515052795410156, 0.036449432373046875, 0.03774833679199219, 0.0390472412109375, 0.04034614562988281, 0.041645050048828125, 0.04294395446777344, 0.04424285888671875, 0.04554176330566406, 0.046840667724609375, 0.04813957214355469, 0.0494384765625]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 13.0, 23.0, 36.0, 80.0, 167.0, 201.0, 194.0, 104.0, 81.0, 54.0, 25.0, 11.0, 9.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.618438184261322, -0.6024943590164185, -0.5865505337715149, -0.5706067085266113, -0.5546629428863525, -0.538719117641449, -0.5227752923965454, -0.5068314671516418, -0.4908876419067383, -0.4749438166618347, -0.45900002121925354, -0.44305619597435, -0.4271123707294464, -0.41116857528686523, -0.39522475004196167, -0.3792809247970581, -0.36333712935447693, -0.34739330410957336, -0.3314495086669922, -0.3155056834220886, -0.29956185817718506, -0.2836180329322815, -0.2676742374897003, -0.25173041224479675, -0.23578660190105438, -0.219842791557312, -0.20389896631240845, -0.18795515596866608, -0.1720113456249237, -0.15606752038002014, -0.14012371003627777, -0.1241798922419548, -0.10823610424995422, -0.09229228645563126, -0.07634846866130829, -0.06040465831756592, -0.04446084052324295, -0.028517022728919983, -0.012573212385177612, 0.0033706054091453552, 0.019314423203468323, 0.03525824099779129, 0.05120205506682396, 0.06714586913585663, 0.0830896869301796, 0.09903350472450256, 0.11497731506824493, 0.1309211254119873, 0.14686495065689087, 0.16280876100063324, 0.1787525862455368, 0.19469639658927917, 0.21064022183418274, 0.2265840321779251, 0.24252784252166748, 0.25847166776657104, 0.2744154930114746, 0.2903593182563782, 0.30630311369895935, 0.3222469389438629, 0.3381907641887665, 0.35413455963134766, 0.3700783848762512, 0.3860222101211548, 0.40196600556373596]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 8.0, 13.0, 8.0, 8.0, 17.0, 15.0, 20.0, 13.0, 23.0, 28.0, 29.0, 29.0, 27.0, 35.0, 37.0, 39.0, 41.0, 43.0, 38.0, 43.0, 37.0, 36.0, 36.0, 49.0, 34.0, 29.0, 41.0, 30.0, 27.0, 25.0, 24.0, 20.0, 20.0, 15.0, 19.0, 7.0, 9.0, 8.0, 4.0, 3.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.3023441433906555, -0.2936819791793823, -0.28501978516578674, -0.27635762095451355, -0.26769545674324036, -0.25903329253196716, -0.2503710985183716, -0.2417089343070984, -0.2330467700958252, -0.2243845909833908, -0.21572242677211761, -0.20706024765968323, -0.19839808344841003, -0.18973590433597565, -0.18107372522354126, -0.17241156101226807, -0.16374938189983368, -0.1550872027873993, -0.1464250385761261, -0.1377628594636917, -0.12910069525241852, -0.12043851613998413, -0.11177634447813034, -0.10311417281627655, -0.09445200115442276, -0.08578982949256897, -0.07712765783071518, -0.06846548616886139, -0.0598033107817173, -0.05114113911986351, -0.04247896373271942, -0.03381679207086563, -0.02515462040901184, -0.01649244874715805, -0.007830275222659111, 0.0008318983018398285, 0.009494069963693619, 0.01815624162554741, 0.026818417012691498, 0.03548058867454529, 0.04414276033639908, 0.05280493199825287, 0.06146710366010666, 0.07012927532196045, 0.07879145443439484, 0.08745361864566803, 0.09611579775810242, 0.10477796941995621, 0.11344014108181, 0.12210231274366379, 0.13076448440551758, 0.13942666351795197, 0.14808882772922516, 0.15675100684165955, 0.16541317105293274, 0.17407535016536713, 0.1827375292778015, 0.1913997083902359, 0.2000618726015091, 0.20872405171394348, 0.21738621592521667, 0.22604839503765106, 0.23471057415008545, 0.24337273836135864, 0.25203490257263184]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 5.0, 3.0, 8.0, 13.0, 10.0, 8.0, 12.0, 25.0, 19.0, 17.0, 21.0, 27.0, 19.0, 34.0, 48.0, 52.0, 109.0, 206.0, 581.0, 1953.0, 13075.0, 3081344.0, 1085318.0, 8746.0, 1530.0, 493.0, 205.0, 92.0, 62.0, 37.0, 27.0, 25.0, 26.0, 20.0, 21.0, 19.0, 13.0, 10.0, 11.0, 7.0, 5.0, 8.0, 6.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0], "bins": [-0.51806640625, -0.5007553100585938, -0.4834442138671875, -0.46613311767578125, -0.448822021484375, -0.43151092529296875, -0.4141998291015625, -0.39688873291015625, -0.37957763671875, -0.36226654052734375, -0.3449554443359375, -0.32764434814453125, -0.310333251953125, -0.29302215576171875, -0.2757110595703125, -0.25839996337890625, -0.2410888671875, -0.22377777099609375, -0.2064666748046875, -0.18915557861328125, -0.171844482421875, -0.15453338623046875, -0.1372222900390625, -0.11991119384765625, -0.10260009765625, -0.08528900146484375, -0.0679779052734375, -0.05066680908203125, -0.033355712890625, -0.01604461669921875, 0.0012664794921875, 0.01857757568359375, 0.035888671875, 0.05319976806640625, 0.0705108642578125, 0.08782196044921875, 0.105133056640625, 0.12244415283203125, 0.1397552490234375, 0.15706634521484375, 0.17437744140625, 0.19168853759765625, 0.2089996337890625, 0.22631072998046875, 0.243621826171875, 0.26093292236328125, 0.2782440185546875, 0.29555511474609375, 0.3128662109375, 0.33017730712890625, 0.3474884033203125, 0.36479949951171875, 0.382110595703125, 0.39942169189453125, 0.4167327880859375, 0.43404388427734375, 0.45135498046875, 0.46866607666015625, 0.4859771728515625, 0.5032882690429688, 0.520599365234375, 0.5379104614257812, 0.5552215576171875, 0.5725326538085938, 0.58984375]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 6.0, 4.0, 5.0, 10.0, 15.0, 13.0, 19.0, 24.0, 33.0, 39.0, 55.0, 48.0, 45.0, 59.0, 70.0, 61.0, 74.0, 64.0, 63.0, 60.0, 56.0, 36.0, 27.0, 32.0, 29.0, 12.0, 13.0, 9.0, 2.0, 9.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12481689453125, -0.12087154388427734, -0.11692619323730469, -0.11298084259033203, -0.10903549194335938, -0.10509014129638672, -0.10114479064941406, -0.0971994400024414, -0.09325408935546875, -0.0893087387084961, -0.08536338806152344, -0.08141803741455078, -0.07747268676757812, -0.07352733612060547, -0.06958198547363281, -0.06563663482666016, -0.0616912841796875, -0.057745933532714844, -0.05380058288574219, -0.04985523223876953, -0.045909881591796875, -0.04196453094482422, -0.03801918029785156, -0.034073829650878906, -0.03012847900390625, -0.026183128356933594, -0.022237777709960938, -0.01829242706298828, -0.014347076416015625, -0.010401725769042969, -0.0064563751220703125, -0.0025110244750976562, 0.001434326171875, 0.005379676818847656, 0.009325027465820312, 0.013270378112792969, 0.017215728759765625, 0.02116107940673828, 0.025106430053710938, 0.029051780700683594, 0.03299713134765625, 0.036942481994628906, 0.04088783264160156, 0.04483318328857422, 0.048778533935546875, 0.05272388458251953, 0.05666923522949219, 0.060614585876464844, 0.0645599365234375, 0.06850528717041016, 0.07245063781738281, 0.07639598846435547, 0.08034133911132812, 0.08428668975830078, 0.08823204040527344, 0.0921773910522461, 0.09612274169921875, 0.1000680923461914, 0.10401344299316406, 0.10795879364013672, 0.11190414428710938, 0.11584949493408203, 0.11979484558105469, 0.12374019622802734, 0.127685546875]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 10.0, 13.0, 11.0, 28.0, 42.0, 42.0, 125.0, 226.0, 687.0, 2270.0, 14543.0, 388518.0, 3733725.0, 47413.0, 4769.0, 1091.0, 394.0, 152.0, 58.0, 53.0, 32.0, 22.0, 16.0, 7.0, 8.0, 7.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.234130859375, -0.22359466552734375, -0.2130584716796875, -0.20252227783203125, -0.191986083984375, -0.18144989013671875, -0.1709136962890625, -0.16037750244140625, -0.14984130859375, -0.13930511474609375, -0.1287689208984375, -0.11823272705078125, -0.107696533203125, -0.09716033935546875, -0.0866241455078125, -0.07608795166015625, -0.0655517578125, -0.05501556396484375, -0.0444793701171875, -0.03394317626953125, -0.023406982421875, -0.01287078857421875, -0.0023345947265625, 0.00820159912109375, 0.01873779296875, 0.02927398681640625, 0.0398101806640625, 0.05034637451171875, 0.060882568359375, 0.07141876220703125, 0.0819549560546875, 0.09249114990234375, 0.10302734375, 0.11356353759765625, 0.1240997314453125, 0.13463592529296875, 0.145172119140625, 0.15570831298828125, 0.1662445068359375, 0.17678070068359375, 0.18731689453125, 0.19785308837890625, 0.2083892822265625, 0.21892547607421875, 0.229461669921875, 0.23999786376953125, 0.2505340576171875, 0.26107025146484375, 0.2716064453125, 0.28214263916015625, 0.2926788330078125, 0.30321502685546875, 0.313751220703125, 0.32428741455078125, 0.3348236083984375, 0.34535980224609375, 0.35589599609375, 0.36643218994140625, 0.3769683837890625, 0.38750457763671875, 0.398040771484375, 0.40857696533203125, 0.4191131591796875, 0.42964935302734375, 0.440185546875]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 5.0, 2.0, 3.0, 15.0, 13.0, 24.0, 20.0, 33.0, 39.0, 52.0, 64.0, 114.0, 149.0, 251.0, 470.0, 668.0, 771.0, 521.0, 309.0, 189.0, 102.0, 77.0, 39.0, 41.0, 34.0, 24.0, 11.0, 14.0, 9.0, 4.0, 5.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.057708740234375, -0.05623483657836914, -0.05476093292236328, -0.05328702926635742, -0.05181312561035156, -0.0503392219543457, -0.048865318298339844, -0.047391414642333984, -0.045917510986328125, -0.044443607330322266, -0.042969703674316406, -0.04149580001831055, -0.04002189636230469, -0.03854799270629883, -0.03707408905029297, -0.03560018539428711, -0.03412628173828125, -0.03265237808227539, -0.03117847442626953, -0.029704570770263672, -0.028230667114257812, -0.026756763458251953, -0.025282859802246094, -0.023808956146240234, -0.022335052490234375, -0.020861148834228516, -0.019387245178222656, -0.017913341522216797, -0.016439437866210938, -0.014965534210205078, -0.013491630554199219, -0.01201772689819336, -0.0105438232421875, -0.00906991958618164, -0.007596015930175781, -0.006122112274169922, -0.0046482086181640625, -0.003174304962158203, -0.0017004013061523438, -0.00022649765014648438, 0.001247406005859375, 0.0027213096618652344, 0.004195213317871094, 0.005669116973876953, 0.0071430206298828125, 0.008616924285888672, 0.010090827941894531, 0.01156473159790039, 0.01303863525390625, 0.01451253890991211, 0.01598644256591797, 0.017460346221923828, 0.018934249877929688, 0.020408153533935547, 0.021882057189941406, 0.023355960845947266, 0.024829864501953125, 0.026303768157958984, 0.027777671813964844, 0.029251575469970703, 0.030725479125976562, 0.03219938278198242, 0.03367328643798828, 0.03514719009399414, 0.03662109375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 3.0, 5.0, 14.0, 14.0, 31.0, 44.0, 77.0, 104.0, 131.0, 160.0, 139.0, 94.0, 70.0, 45.0, 31.0, 20.0, 13.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25304198265075684, -0.2447388917207718, -0.23643580079078674, -0.2281327098608017, -0.21982961893081665, -0.2115265280008316, -0.20322343707084656, -0.19492033123970032, -0.18661725521087646, -0.17831416428089142, -0.17001107335090637, -0.16170798242092133, -0.15340489149093628, -0.14510180056095123, -0.1367987096309662, -0.12849560379981995, -0.1201925128698349, -0.11188942193984985, -0.10358633100986481, -0.09528324007987976, -0.08698014914989471, -0.07867705821990967, -0.07037395983934402, -0.06207086890935898, -0.05376777797937393, -0.045464687049388885, -0.03716159611940384, -0.028858501464128494, -0.020555410534143448, -0.012252319604158401, -0.003949224948883057, 0.00435386598110199, 0.012656956911087036, 0.020960047841072083, 0.029263140633702278, 0.037566233426332474, 0.04586932435631752, 0.054172415286302567, 0.06247550994157791, 0.07077860087156296, 0.079081691801548, 0.08738478273153305, 0.0956878736615181, 0.10399097204208374, 0.11229406297206879, 0.12059715390205383, 0.12890024483203888, 0.13720333576202393, 0.14550642669200897, 0.15380951762199402, 0.16211260855197906, 0.1704156994819641, 0.17871879041194916, 0.1870218813419342, 0.19532498717308044, 0.2036280632019043, 0.21193116903305054, 0.22023425996303558, 0.22853735089302063, 0.23684044182300568, 0.24514353275299072, 0.25344663858413696, 0.2617497146129608, 0.27005282044410706, 0.2783558964729309]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 5.0, 6.0, 7.0, 3.0, 7.0, 13.0, 14.0, 15.0, 21.0, 18.0, 28.0, 33.0, 36.0, 39.0, 49.0, 34.0, 48.0, 42.0, 42.0, 47.0, 56.0, 64.0, 45.0, 44.0, 33.0, 33.0, 43.0, 34.0, 22.0, 23.0, 18.0, 21.0, 24.0, 11.0, 13.0, 4.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09925607591867447, -0.0955699160695076, -0.09188375622034073, -0.08819759637117386, -0.08451143652200699, -0.08082527667284012, -0.07713910937309265, -0.07345294952392578, -0.06976678967475891, -0.06608062982559204, -0.06239446997642517, -0.0587083101272583, -0.05502215027809143, -0.05133599042892456, -0.04764982685446739, -0.04396366700530052, -0.04027751088142395, -0.03659135103225708, -0.03290519118309021, -0.02921902947127819, -0.02553286962211132, -0.02184670977294445, -0.01816054806113243, -0.014474388211965561, -0.01078822836279869, -0.007102068047970533, -0.003415907733142376, 0.0002702530473470688, 0.003956412896513939, 0.007642572745680809, 0.011328734457492828, 0.015014894306659698, 0.018701061606407166, 0.022387221455574036, 0.026073381304740906, 0.029759543016552925, 0.033445701003074646, 0.037131860852241516, 0.040818024426698685, 0.044504184275865555, 0.048190344125032425, 0.051876503974199295, 0.055562663823366165, 0.059248827397823334, 0.0629349872469902, 0.06662114709615707, 0.07030730694532394, 0.07399346679449081, 0.07767962664365768, 0.08136578649282455, 0.08505194634199142, 0.0887381061911583, 0.09242426604032516, 0.09611042588949203, 0.0997965931892395, 0.10348275303840637, 0.10716891288757324, 0.11085507273674011, 0.11454123258590698, 0.11822739243507385, 0.12191355228424072, 0.1255997121334076, 0.12928587198257446, 0.13297203183174133, 0.1366581916809082]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 6.0, 6.0, 9.0, 16.0, 25.0, 27.0, 59.0, 126.0, 233.0, 480.0, 1068.0, 2525.0, 6339.0, 18429.0, 129495.0, 777317.0, 87528.0, 15397.0, 5444.0, 2139.0, 954.0, 451.0, 201.0, 125.0, 61.0, 36.0, 23.0, 9.0, 12.0, 5.0, 7.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1121826171875, -0.10918521881103516, -0.10618782043457031, -0.10319042205810547, -0.10019302368164062, -0.09719562530517578, -0.09419822692871094, -0.0912008285522461, -0.08820343017578125, -0.0852060317993164, -0.08220863342285156, -0.07921123504638672, -0.07621383666992188, -0.07321643829345703, -0.07021903991699219, -0.06722164154052734, -0.0642242431640625, -0.061226844787597656, -0.05822944641113281, -0.05523204803466797, -0.052234649658203125, -0.04923725128173828, -0.04623985290527344, -0.043242454528808594, -0.04024505615234375, -0.037247657775878906, -0.03425025939941406, -0.03125286102294922, -0.028255462646484375, -0.02525806427001953, -0.022260665893554688, -0.019263267517089844, -0.016265869140625, -0.013268470764160156, -0.010271072387695312, -0.007273674011230469, -0.004276275634765625, -0.0012788772583007812, 0.0017185211181640625, 0.004715919494628906, 0.00771331787109375, 0.010710716247558594, 0.013708114624023438, 0.01670551300048828, 0.019702911376953125, 0.02270030975341797, 0.025697708129882812, 0.028695106506347656, 0.0316925048828125, 0.034689903259277344, 0.03768730163574219, 0.04068470001220703, 0.043682098388671875, 0.04667949676513672, 0.04967689514160156, 0.052674293518066406, 0.05567169189453125, 0.058669090270996094, 0.06166648864746094, 0.06466388702392578, 0.06766128540039062, 0.07065868377685547, 0.07365608215332031, 0.07665348052978516, 0.07965087890625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 4.0, 6.0, 10.0, 10.0, 14.0, 15.0, 14.0, 27.0, 24.0, 39.0, 29.0, 50.0, 41.0, 55.0, 51.0, 65.0, 45.0, 51.0, 59.0, 58.0, 40.0, 39.0, 47.0, 34.0, 34.0, 25.0, 32.0, 24.0, 16.0, 14.0, 6.0, 8.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.076904296875, -0.0740365982055664, -0.07116889953613281, -0.06830120086669922, -0.06543350219726562, -0.06256580352783203, -0.05969810485839844, -0.056830406188964844, -0.05396270751953125, -0.051095008850097656, -0.04822731018066406, -0.04535961151123047, -0.042491912841796875, -0.03962421417236328, -0.03675651550292969, -0.033888816833496094, -0.0310211181640625, -0.028153419494628906, -0.025285720825195312, -0.02241802215576172, -0.019550323486328125, -0.01668262481689453, -0.013814926147460938, -0.010947227478027344, -0.00807952880859375, -0.005211830139160156, -0.0023441314697265625, 0.0005235671997070312, 0.003391265869140625, 0.006258964538574219, 0.009126663208007812, 0.011994361877441406, 0.014862060546875, 0.017729759216308594, 0.020597457885742188, 0.02346515655517578, 0.026332855224609375, 0.02920055389404297, 0.03206825256347656, 0.034935951232910156, 0.03780364990234375, 0.040671348571777344, 0.04353904724121094, 0.04640674591064453, 0.049274444580078125, 0.05214214324951172, 0.05500984191894531, 0.057877540588378906, 0.0607452392578125, 0.0636129379272461, 0.06648063659667969, 0.06934833526611328, 0.07221603393554688, 0.07508373260498047, 0.07795143127441406, 0.08081912994384766, 0.08368682861328125, 0.08655452728271484, 0.08942222595214844, 0.09228992462158203, 0.09515762329101562, 0.09802532196044922, 0.10089302062988281, 0.1037607192993164, 0.10662841796875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 7.0, 6.0, 14.0, 22.0, 20.0, 50.0, 79.0, 153.0, 399.0, 1108.0, 4094.0, 23271.0, 521538.0, 470569.0, 21615.0, 3855.0, 1023.0, 387.0, 141.0, 72.0, 40.0, 23.0, 14.0, 14.0, 11.0, 13.0, 8.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11566162109375, -0.11261653900146484, -0.10957145690917969, -0.10652637481689453, -0.10348129272460938, -0.10043621063232422, -0.09739112854003906, -0.0943460464477539, -0.09130096435546875, -0.0882558822631836, -0.08521080017089844, -0.08216571807861328, -0.07912063598632812, -0.07607555389404297, -0.07303047180175781, -0.06998538970947266, -0.0669403076171875, -0.06389522552490234, -0.06085014343261719, -0.05780506134033203, -0.054759979248046875, -0.05171489715576172, -0.04866981506347656, -0.045624732971191406, -0.04257965087890625, -0.039534568786621094, -0.03648948669433594, -0.03344440460205078, -0.030399322509765625, -0.02735424041748047, -0.024309158325195312, -0.021264076232910156, -0.018218994140625, -0.015173912048339844, -0.012128829956054688, -0.009083747863769531, -0.006038665771484375, -0.0029935836791992188, 5.14984130859375e-05, 0.0030965805053710938, 0.00614166259765625, 0.009186744689941406, 0.012231826782226562, 0.015276908874511719, 0.018321990966796875, 0.02136707305908203, 0.024412155151367188, 0.027457237243652344, 0.0305023193359375, 0.033547401428222656, 0.03659248352050781, 0.03963756561279297, 0.042682647705078125, 0.04572772979736328, 0.04877281188964844, 0.051817893981933594, 0.05486297607421875, 0.057908058166503906, 0.06095314025878906, 0.06399822235107422, 0.06704330444335938, 0.07008838653564453, 0.07313346862792969, 0.07617855072021484, 0.0792236328125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 4.0, 7.0, 12.0, 5.0, 7.0, 10.0, 8.0, 14.0, 10.0, 18.0, 20.0, 33.0, 32.0, 28.0, 32.0, 42.0, 45.0, 29.0, 44.0, 49.0, 30.0, 52.0, 44.0, 39.0, 51.0, 41.0, 35.0, 39.0, 16.0, 35.0, 29.0, 23.0, 13.0, 22.0, 13.0, 14.0, 14.0, 12.0, 8.0, 9.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.1610107421875, -0.15622520446777344, -0.15143966674804688, -0.1466541290283203, -0.14186859130859375, -0.1370830535888672, -0.13229751586914062, -0.12751197814941406, -0.1227264404296875, -0.11794090270996094, -0.11315536499023438, -0.10836982727050781, -0.10358428955078125, -0.09879875183105469, -0.09401321411132812, -0.08922767639160156, -0.084442138671875, -0.07965660095214844, -0.07487106323242188, -0.07008552551269531, -0.06529998779296875, -0.06051445007324219, -0.055728912353515625, -0.05094337463378906, -0.0461578369140625, -0.04137229919433594, -0.036586761474609375, -0.03180122375488281, -0.02701568603515625, -0.022230148315429688, -0.017444610595703125, -0.012659072875976562, -0.00787353515625, -0.0030879974365234375, 0.001697540283203125, 0.0064830780029296875, 0.01126861572265625, 0.016054153442382812, 0.020839691162109375, 0.025625228881835938, 0.0304107666015625, 0.03519630432128906, 0.039981842041015625, 0.04476737976074219, 0.04955291748046875, 0.05433845520019531, 0.059123992919921875, 0.06390953063964844, 0.068695068359375, 0.07348060607910156, 0.07826614379882812, 0.08305168151855469, 0.08783721923828125, 0.09262275695800781, 0.09740829467773438, 0.10219383239746094, 0.1069793701171875, 0.11176490783691406, 0.11655044555664062, 0.12133598327636719, 0.12612152099609375, 0.1309070587158203, 0.13569259643554688, 0.14047813415527344, 0.145263671875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 7.0, 6.0, 5.0, 13.0, 17.0, 26.0, 49.0, 61.0, 107.0, 181.0, 413.0, 992.0, 2753.0, 10055.0, 57676.0, 494707.0, 421199.0, 47246.0, 8741.0, 2480.0, 926.0, 401.0, 193.0, 104.0, 66.0, 39.0, 22.0, 18.0, 14.0, 7.0, 10.0, 4.0, 3.0, 3.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015625, -0.015103340148925781, -0.014581680297851562, -0.014060020446777344, -0.013538360595703125, -0.013016700744628906, -0.012495040893554688, -0.011973381042480469, -0.01145172119140625, -0.010930061340332031, -0.010408401489257812, -0.009886741638183594, -0.009365081787109375, -0.008843421936035156, -0.008321762084960938, -0.007800102233886719, -0.0072784423828125, -0.006756782531738281, -0.0062351226806640625, -0.005713462829589844, -0.005191802978515625, -0.004670143127441406, -0.0041484832763671875, -0.0036268234252929688, -0.00310516357421875, -0.0025835037231445312, -0.0020618438720703125, -0.0015401840209960938, -0.001018524169921875, -0.0004968643188476562, 2.47955322265625e-05, 0.0005464553833007812, 0.001068115234375, 0.0015897750854492188, 0.0021114349365234375, 0.0026330947875976562, 0.003154754638671875, 0.0036764144897460938, 0.0041980743408203125, 0.004719734191894531, 0.00524139404296875, 0.005763053894042969, 0.0062847137451171875, 0.006806373596191406, 0.007328033447265625, 0.007849693298339844, 0.008371353149414062, 0.008893013000488281, 0.0094146728515625, 0.009936332702636719, 0.010457992553710938, 0.010979652404785156, 0.011501312255859375, 0.012022972106933594, 0.012544631958007812, 0.013066291809082031, 0.01358795166015625, 0.014109611511230469, 0.014631271362304688, 0.015152931213378906, 0.015674591064453125, 0.016196250915527344, 0.016717910766601562, 0.01723957061767578, 0.01776123046875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 6.0, 9.0, 4.0, 14.0, 9.0, 14.0, 18.0, 20.0, 31.0, 21.0, 37.0, 54.0, 31.0, 80.0, 81.0, 85.0, 42.0, 69.0, 86.0, 58.0, 29.0, 43.0, 31.0, 23.0, 26.0, 20.0, 16.0, 6.0, 9.0, 7.0, 6.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-5.662441253662109e-06, -5.500391125679016e-06, -5.338340997695923e-06, -5.17629086971283e-06, -5.014240741729736e-06, -4.852190613746643e-06, -4.69014048576355e-06, -4.5280903577804565e-06, -4.366040229797363e-06, -4.20399010181427e-06, -4.041939973831177e-06, -3.8798898458480835e-06, -3.7178397178649902e-06, -3.555789589881897e-06, -3.3937394618988037e-06, -3.2316893339157104e-06, -3.069639205932617e-06, -2.907589077949524e-06, -2.7455389499664307e-06, -2.5834888219833374e-06, -2.421438694000244e-06, -2.259388566017151e-06, -2.0973384380340576e-06, -1.9352883100509644e-06, -1.773238182067871e-06, -1.6111880540847778e-06, -1.4491379261016846e-06, -1.2870877981185913e-06, -1.125037670135498e-06, -9.629875421524048e-07, -8.009374141693115e-07, -6.388872861862183e-07, -4.76837158203125e-07, -3.1478703022003174e-07, -1.5273690223693848e-07, 9.313225746154785e-09, 1.7136335372924805e-07, 3.334134817123413e-07, 4.954636096954346e-07, 6.575137376785278e-07, 8.195638656616211e-07, 9.816139936447144e-07, 1.1436641216278076e-06, 1.3057142496109009e-06, 1.4677643775939941e-06, 1.6298145055770874e-06, 1.7918646335601807e-06, 1.953914761543274e-06, 2.115964889526367e-06, 2.2780150175094604e-06, 2.4400651454925537e-06, 2.602115273475647e-06, 2.7641654014587402e-06, 2.9262155294418335e-06, 3.0882656574249268e-06, 3.25031578540802e-06, 3.4123659133911133e-06, 3.5744160413742065e-06, 3.7364661693573e-06, 3.898516297340393e-06, 4.060566425323486e-06, 4.22261655330658e-06, 4.384666681289673e-06, 4.546716809272766e-06, 4.708766937255859e-06]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 7.0, 5.0, 3.0, 4.0, 9.0, 11.0, 15.0, 29.0, 64.0, 74.0, 101.0, 211.0, 415.0, 883.0, 2209.0, 6554.0, 28415.0, 197968.0, 627334.0, 151975.0, 22934.0, 5763.0, 1965.0, 741.0, 402.0, 196.0, 105.0, 50.0, 33.0, 27.0, 12.0, 7.0, 8.0, 8.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.018890380859375, -0.018357276916503906, -0.017824172973632812, -0.01729106903076172, -0.016757965087890625, -0.01622486114501953, -0.015691757202148438, -0.015158653259277344, -0.01462554931640625, -0.014092445373535156, -0.013559341430664062, -0.013026237487792969, -0.012493133544921875, -0.011960029602050781, -0.011426925659179688, -0.010893821716308594, -0.0103607177734375, -0.009827613830566406, -0.009294509887695312, -0.008761405944824219, -0.008228302001953125, -0.007695198059082031, -0.0071620941162109375, -0.006628990173339844, -0.00609588623046875, -0.005562782287597656, -0.0050296783447265625, -0.004496574401855469, -0.003963470458984375, -0.0034303665161132812, -0.0028972625732421875, -0.0023641586303710938, -0.0018310546875, -0.0012979507446289062, -0.0007648468017578125, -0.00023174285888671875, 0.000301361083984375, 0.0008344650268554688, 0.0013675689697265625, 0.0019006729125976562, 0.00243377685546875, 0.0029668807983398438, 0.0034999847412109375, 0.004033088684082031, 0.004566192626953125, 0.005099296569824219, 0.0056324005126953125, 0.006165504455566406, 0.0066986083984375, 0.007231712341308594, 0.0077648162841796875, 0.008297920227050781, 0.008831024169921875, 0.009364128112792969, 0.009897232055664062, 0.010430335998535156, 0.01096343994140625, 0.011496543884277344, 0.012029647827148438, 0.012562751770019531, 0.013095855712890625, 0.013628959655761719, 0.014162063598632812, 0.014695167541503906, 0.015228271484375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 9.0, 6.0, 10.0, 11.0, 26.0, 19.0, 35.0, 32.0, 35.0, 59.0, 88.0, 91.0, 75.0, 85.0, 78.0, 76.0, 61.0, 35.0, 36.0, 29.0, 28.0, 17.0, 10.0, 3.0, 7.0, 7.0, 5.0, 6.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.003871917724609375, -0.0037503838539123535, -0.003628849983215332, -0.0035073161125183105, -0.003385782241821289, -0.0032642483711242676, -0.003142714500427246, -0.0030211806297302246, -0.002899646759033203, -0.0027781128883361816, -0.00265657901763916, -0.0025350451469421387, -0.002413511276245117, -0.0022919774055480957, -0.0021704435348510742, -0.0020489096641540527, -0.0019273757934570312, -0.0018058419227600098, -0.0016843080520629883, -0.0015627741813659668, -0.0014412403106689453, -0.0013197064399719238, -0.0011981725692749023, -0.0010766386985778809, -0.0009551048278808594, -0.0008335709571838379, -0.0007120370864868164, -0.0005905032157897949, -0.00046896934509277344, -0.00034743547439575195, -0.00022590160369873047, -0.00010436773300170898, 1.71661376953125e-05, 0.00013870000839233398, 0.00026023387908935547, 0.00038176774978637695, 0.0005033016204833984, 0.0006248354911804199, 0.0007463693618774414, 0.0008679032325744629, 0.0009894371032714844, 0.0011109709739685059, 0.0012325048446655273, 0.0013540387153625488, 0.0014755725860595703, 0.0015971064567565918, 0.0017186403274536133, 0.0018401741981506348, 0.0019617080688476562, 0.0020832419395446777, 0.0022047758102416992, 0.0023263096809387207, 0.002447843551635742, 0.0025693774223327637, 0.002690911293029785, 0.0028124451637268066, 0.002933979034423828, 0.0030555129051208496, 0.003177046775817871, 0.0032985806465148926, 0.003420114517211914, 0.0035416483879089355, 0.003663182258605957, 0.0037847161293029785, 0.00390625]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 3.0, 9.0, 12.0, 22.0, 32.0, 79.0, 79.0, 133.0, 140.0, 159.0, 120.0, 88.0, 42.0, 38.0, 23.0, 13.0, 4.0, 8.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.20603322982788086, -0.2004377394914627, -0.19484224915504456, -0.1892467439174652, -0.18365125358104706, -0.1780557632446289, -0.17246027290821075, -0.1668647825717926, -0.16126927733421326, -0.1556737869977951, -0.15007829666137695, -0.1444827914237976, -0.13888730108737946, -0.1332918107509613, -0.12769632041454315, -0.122100830078125, -0.11650533974170685, -0.1109098494052887, -0.10531435161828995, -0.0997188612818718, -0.09412336349487305, -0.0885278731584549, -0.08293238282203674, -0.07733689248561859, -0.07174139469861984, -0.06614590436220169, -0.06055040657520294, -0.05495491623878479, -0.04935942217707634, -0.04376392811536789, -0.03816843777894974, -0.03257294371724129, -0.026977434754371643, -0.021381940692663193, -0.01578644849359989, -0.01019095629453659, -0.00459546223282814, 0.00100003182888031, 0.006595522165298462, 0.012191016227006912, 0.017786510288715363, 0.023382004350423813, 0.028977496549487114, 0.034572988748550415, 0.040168482810258865, 0.045763976871967316, 0.05135946720838547, 0.05695496127009392, 0.06255045533180237, 0.06814594566822052, 0.07374144345521927, 0.07933693379163742, 0.08493243157863617, 0.09052792191505432, 0.09612341225147247, 0.10171890258789062, 0.10731440037488937, 0.11290989071130753, 0.11850538849830627, 0.12410087883472443, 0.12969636917114258, 0.13529187440872192, 0.14088734984397888, 0.14648285508155823, 0.15207834541797638]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 6.0, 8.0, 9.0, 5.0, 4.0, 9.0, 14.0, 22.0, 14.0, 26.0, 34.0, 31.0, 47.0, 44.0, 49.0, 40.0, 44.0, 54.0, 62.0, 58.0, 57.0, 56.0, 36.0, 42.0, 32.0, 45.0, 24.0, 31.0, 34.0, 23.0, 17.0, 11.0, 7.0, 5.0, 6.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07813102751970291, -0.07540745288133621, -0.07268387824296951, -0.06996030360460281, -0.06723672896623611, -0.06451314687728882, -0.06178957596421242, -0.05906599760055542, -0.05634242296218872, -0.05361884832382202, -0.05089527368545532, -0.04817169904708862, -0.045448120683431625, -0.042724546045064926, -0.04000097140669823, -0.03727739304304123, -0.03455382212996483, -0.03183024749159813, -0.02910667099058628, -0.02638309635221958, -0.023659519851207733, -0.020935945212841034, -0.018212370574474335, -0.015488794073462486, -0.012765219435095787, -0.010041643865406513, -0.007318068761378527, -0.00459449365735054, -0.0018709180876612663, 0.0008526574820280075, 0.0035762321203947067, 0.006299808621406555, 0.009023383259773254, 0.011746958829462528, 0.014470534399151802, 0.0171941090375185, 0.01991768553853035, 0.02264126017689705, 0.025364834815263748, 0.028088411316275597, 0.030811985954642296, 0.033535562455654144, 0.036259137094020844, 0.03898271173238754, 0.04170628637075424, 0.04442986100912094, 0.04715343564748764, 0.04987701401114464, 0.05260058864951134, 0.055324163287878036, 0.058047737926244736, 0.06077131628990173, 0.06349489092826843, 0.06621846556663513, 0.06894204020500183, 0.07166561484336853, 0.07438918948173523, 0.07711276412010193, 0.07983633875846863, 0.08255991339683533, 0.08528348803520203, 0.08800706267356873, 0.09073063731193542, 0.09345421940088272, 0.09617779403924942]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 5.0, 12.0, 10.0, 16.0, 29.0, 44.0, 65.0, 98.0, 170.0, 314.0, 517.0, 985.0, 2021.0, 4517.0, 11774.0, 38137.0, 199954.0, 669989.0, 84590.0, 21635.0, 7411.0, 3122.0, 1439.0, 790.0, 406.0, 185.0, 121.0, 75.0, 56.0, 21.0, 13.0, 15.0, 13.0, 6.0, 6.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0867919921875, -0.08271217346191406, -0.07863235473632812, -0.07455253601074219, -0.07047271728515625, -0.06639289855957031, -0.062313079833984375, -0.05823326110839844, -0.0541534423828125, -0.05007362365722656, -0.045993804931640625, -0.04191398620605469, -0.03783416748046875, -0.03375434875488281, -0.029674530029296875, -0.025594711303710938, -0.021514892578125, -0.017435073852539062, -0.013355255126953125, -0.009275436401367188, -0.00519561767578125, -0.0011157989501953125, 0.002964019775390625, 0.0070438385009765625, 0.0111236572265625, 0.015203475952148438, 0.019283294677734375, 0.023363113403320312, 0.02744293212890625, 0.03152275085449219, 0.035602569580078125, 0.03968238830566406, 0.04376220703125, 0.04784202575683594, 0.051921844482421875, 0.05600166320800781, 0.06008148193359375, 0.06416130065917969, 0.06824111938476562, 0.07232093811035156, 0.0764007568359375, 0.08048057556152344, 0.08456039428710938, 0.08864021301269531, 0.09272003173828125, 0.09679985046386719, 0.10087966918945312, 0.10495948791503906, 0.109039306640625, 0.11311912536621094, 0.11719894409179688, 0.12127876281738281, 0.12535858154296875, 0.1294384002685547, 0.13351821899414062, 0.13759803771972656, 0.1416778564453125, 0.14575767517089844, 0.14983749389648438, 0.1539173126220703, 0.15799713134765625, 0.1620769500732422, 0.16615676879882812, 0.17023658752441406, 0.17431640625]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 9.0, 7.0, 3.0, 10.0, 8.0, 8.0, 18.0, 21.0, 19.0, 30.0, 35.0, 40.0, 44.0, 44.0, 47.0, 53.0, 54.0, 77.0, 45.0, 62.0, 49.0, 43.0, 58.0, 38.0, 24.0, 24.0, 38.0, 26.0, 25.0, 15.0, 9.0, 7.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1494140625, -0.1441936492919922, -0.13897323608398438, -0.13375282287597656, -0.12853240966796875, -0.12331199645996094, -0.11809158325195312, -0.11287117004394531, -0.1076507568359375, -0.10243034362792969, -0.09720993041992188, -0.09198951721191406, -0.08676910400390625, -0.08154869079589844, -0.07632827758789062, -0.07110786437988281, -0.065887451171875, -0.06066703796386719, -0.055446624755859375, -0.05022621154785156, -0.04500579833984375, -0.03978538513183594, -0.034564971923828125, -0.029344558715820312, -0.0241241455078125, -0.018903732299804688, -0.013683319091796875, -0.008462905883789062, -0.00324249267578125, 0.0019779205322265625, 0.007198333740234375, 0.012418746948242188, 0.01763916015625, 0.022859573364257812, 0.028079986572265625, 0.03330039978027344, 0.03852081298828125, 0.04374122619628906, 0.048961639404296875, 0.05418205261230469, 0.0594024658203125, 0.06462287902832031, 0.06984329223632812, 0.07506370544433594, 0.08028411865234375, 0.08550453186035156, 0.09072494506835938, 0.09594535827636719, 0.101165771484375, 0.10638618469238281, 0.11160659790039062, 0.11682701110839844, 0.12204742431640625, 0.12726783752441406, 0.13248825073242188, 0.1377086639404297, 0.1429290771484375, 0.1481494903564453, 0.15336990356445312, 0.15859031677246094, 0.16381072998046875, 0.16903114318847656, 0.17425155639648438, 0.1794719696044922, 0.1846923828125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 4.0, 5.0, 5.0, 17.0, 27.0, 30.0, 58.0, 76.0, 121.0, 210.0, 530.0, 3093.0, 95841.0, 935362.0, 11314.0, 1109.0, 306.0, 143.0, 95.0, 48.0, 47.0, 27.0, 18.0, 30.0, 11.0, 11.0, 5.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47314453125, -0.4600868225097656, -0.44702911376953125, -0.4339714050292969, -0.4209136962890625, -0.4078559875488281, -0.39479827880859375, -0.3817405700683594, -0.368682861328125, -0.3556251525878906, -0.34256744384765625, -0.3295097351074219, -0.3164520263671875, -0.3033943176269531, -0.29033660888671875, -0.2772789001464844, -0.26422119140625, -0.2511634826660156, -0.23810577392578125, -0.22504806518554688, -0.2119903564453125, -0.19893264770507812, -0.18587493896484375, -0.17281723022460938, -0.159759521484375, -0.14670181274414062, -0.13364410400390625, -0.12058639526367188, -0.1075286865234375, -0.09447097778320312, -0.08141326904296875, -0.06835556030273438, -0.0552978515625, -0.042240142822265625, -0.02918243408203125, -0.016124725341796875, -0.0030670166015625, 0.009990692138671875, 0.02304840087890625, 0.036106109619140625, 0.049163818359375, 0.062221527099609375, 0.07527923583984375, 0.08833694458007812, 0.1013946533203125, 0.11445236206054688, 0.12751007080078125, 0.14056777954101562, 0.15362548828125, 0.16668319702148438, 0.17974090576171875, 0.19279861450195312, 0.2058563232421875, 0.21891403198242188, 0.23197174072265625, 0.24502944946289062, 0.258087158203125, 0.2711448669433594, 0.28420257568359375, 0.2972602844238281, 0.3103179931640625, 0.3233757019042969, 0.33643341064453125, 0.3494911193847656, 0.362548828125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 4.0, 7.0, 7.0, 3.0, 9.0, 11.0, 17.0, 25.0, 43.0, 37.0, 54.0, 53.0, 57.0, 63.0, 65.0, 53.0, 72.0, 80.0, 52.0, 47.0, 51.0, 40.0, 36.0, 27.0, 19.0, 20.0, 18.0, 15.0, 10.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.264404296875, -0.2571239471435547, -0.24984359741210938, -0.24256324768066406, -0.23528289794921875, -0.22800254821777344, -0.22072219848632812, -0.2134418487548828, -0.2061614990234375, -0.1988811492919922, -0.19160079956054688, -0.18432044982910156, -0.17704010009765625, -0.16975975036621094, -0.16247940063476562, -0.1551990509033203, -0.147918701171875, -0.1406383514404297, -0.13335800170898438, -0.12607765197753906, -0.11879730224609375, -0.11151695251464844, -0.10423660278320312, -0.09695625305175781, -0.0896759033203125, -0.08239555358886719, -0.07511520385742188, -0.06783485412597656, -0.06055450439453125, -0.05327415466308594, -0.045993804931640625, -0.03871345520019531, -0.03143310546875, -0.024152755737304688, -0.016872406005859375, -0.009592056274414062, -0.00231170654296875, 0.0049686431884765625, 0.012248992919921875, 0.019529342651367188, 0.0268096923828125, 0.03409004211425781, 0.041370391845703125, 0.04865074157714844, 0.05593109130859375, 0.06321144104003906, 0.07049179077148438, 0.07777214050292969, 0.085052490234375, 0.09233283996582031, 0.09961318969726562, 0.10689353942871094, 0.11417388916015625, 0.12145423889160156, 0.12873458862304688, 0.1360149383544922, 0.1432952880859375, 0.1505756378173828, 0.15785598754882812, 0.16513633728027344, 0.17241668701171875, 0.17969703674316406, 0.18697738647460938, 0.1942577362060547, 0.2015380859375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 7.0, 10.0, 10.0, 17.0, 24.0, 33.0, 55.0, 78.0, 133.0, 247.0, 449.0, 918.0, 2384.0, 7469.0, 42421.0, 621680.0, 336352.0, 26908.0, 5720.0, 1900.0, 809.0, 386.0, 191.0, 112.0, 70.0, 49.0, 40.0, 22.0, 13.0, 9.0, 12.0, 6.0, 1.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0457763671875, -0.044599294662475586, -0.04342222213745117, -0.04224514961242676, -0.041068077087402344, -0.03989100456237793, -0.038713932037353516, -0.0375368595123291, -0.03635978698730469, -0.03518271446228027, -0.03400564193725586, -0.032828569412231445, -0.03165149688720703, -0.030474424362182617, -0.029297351837158203, -0.02812027931213379, -0.026943206787109375, -0.02576613426208496, -0.024589061737060547, -0.023411989212036133, -0.02223491668701172, -0.021057844161987305, -0.01988077163696289, -0.018703699111938477, -0.017526626586914062, -0.01634955406188965, -0.015172481536865234, -0.01399540901184082, -0.012818336486816406, -0.011641263961791992, -0.010464191436767578, -0.009287118911743164, -0.00811004638671875, -0.006932973861694336, -0.005755901336669922, -0.004578828811645508, -0.0034017562866210938, -0.0022246837615966797, -0.0010476112365722656, 0.00012946128845214844, 0.0013065338134765625, 0.0024836063385009766, 0.0036606788635253906, 0.004837751388549805, 0.006014823913574219, 0.007191896438598633, 0.008368968963623047, 0.009546041488647461, 0.010723114013671875, 0.011900186538696289, 0.013077259063720703, 0.014254331588745117, 0.015431404113769531, 0.016608476638793945, 0.01778554916381836, 0.018962621688842773, 0.020139694213867188, 0.0213167667388916, 0.022493839263916016, 0.02367091178894043, 0.024847984313964844, 0.026025056838989258, 0.027202129364013672, 0.028379201889038086, 0.0295562744140625]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 5.0, 14.0, 9.0, 14.0, 22.0, 44.0, 94.0, 115.0, 149.0, 152.0, 150.0, 77.0, 49.0, 43.0, 16.0, 20.0, 6.0, 4.0, 4.0, 8.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.68899917602539e-06, -7.442198693752289e-06, -7.195398211479187e-06, -6.948597729206085e-06, -6.701797246932983e-06, -6.454996764659882e-06, -6.20819628238678e-06, -5.961395800113678e-06, -5.714595317840576e-06, -5.467794835567474e-06, -5.2209943532943726e-06, -4.974193871021271e-06, -4.727393388748169e-06, -4.480592906475067e-06, -4.233792424201965e-06, -3.9869919419288635e-06, -3.7401914596557617e-06, -3.49339097738266e-06, -3.246590495109558e-06, -2.9997900128364563e-06, -2.7529895305633545e-06, -2.5061890482902527e-06, -2.259388566017151e-06, -2.012588083744049e-06, -1.7657876014709473e-06, -1.5189871191978455e-06, -1.2721866369247437e-06, -1.0253861546516418e-06, -7.7858567237854e-07, -5.317851901054382e-07, -2.849847078323364e-07, -3.818422555923462e-08, 2.086162567138672e-07, 4.55416738986969e-07, 7.022172212600708e-07, 9.490177035331726e-07, 1.1958181858062744e-06, 1.4426186680793762e-06, 1.689419150352478e-06, 1.93621963262558e-06, 2.1830201148986816e-06, 2.4298205971717834e-06, 2.6766210794448853e-06, 2.923421561717987e-06, 3.170222043991089e-06, 3.4170225262641907e-06, 3.6638230085372925e-06, 3.910623490810394e-06, 4.157423973083496e-06, 4.404224455356598e-06, 4.6510249376297e-06, 4.8978254199028015e-06, 5.144625902175903e-06, 5.391426384449005e-06, 5.638226866722107e-06, 5.885027348995209e-06, 6.1318278312683105e-06, 6.378628313541412e-06, 6.625428795814514e-06, 6.872229278087616e-06, 7.119029760360718e-06, 7.36583024263382e-06, 7.612630724906921e-06, 7.859431207180023e-06, 8.106231689453125e-06]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 6.0, 10.0, 17.0, 16.0, 28.0, 39.0, 98.0, 156.0, 286.0, 619.0, 1754.0, 6793.0, 67260.0, 905192.0, 56972.0, 6346.0, 1686.0, 645.0, 296.0, 142.0, 75.0, 44.0, 25.0, 19.0, 6.0, 4.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.05230712890625, -0.050253868103027344, -0.04820060729980469, -0.04614734649658203, -0.044094085693359375, -0.04204082489013672, -0.03998756408691406, -0.037934303283691406, -0.03588104248046875, -0.033827781677246094, -0.03177452087402344, -0.02972126007080078, -0.027667999267578125, -0.02561473846435547, -0.023561477661132812, -0.021508216857910156, -0.0194549560546875, -0.017401695251464844, -0.015348434448242188, -0.013295173645019531, -0.011241912841796875, -0.009188652038574219, -0.0071353912353515625, -0.005082130432128906, -0.00302886962890625, -0.0009756088256835938, 0.0010776519775390625, 0.0031309127807617188, 0.005184173583984375, 0.007237434387207031, 0.009290695190429688, 0.011343955993652344, 0.013397216796875, 0.015450477600097656, 0.017503738403320312, 0.01955699920654297, 0.021610260009765625, 0.02366352081298828, 0.025716781616210938, 0.027770042419433594, 0.02982330322265625, 0.031876564025878906, 0.03392982482910156, 0.03598308563232422, 0.038036346435546875, 0.04008960723876953, 0.04214286804199219, 0.044196128845214844, 0.0462493896484375, 0.048302650451660156, 0.05035591125488281, 0.05240917205810547, 0.054462432861328125, 0.05651569366455078, 0.05856895446777344, 0.060622215270996094, 0.06267547607421875, 0.0647287368774414, 0.06678199768066406, 0.06883525848388672, 0.07088851928710938, 0.07294178009033203, 0.07499504089355469, 0.07704830169677734, 0.0791015625]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 1.0, 6.0, 5.0, 6.0, 13.0, 11.0, 9.0, 15.0, 26.0, 30.0, 33.0, 63.0, 83.0, 94.0, 122.0, 100.0, 103.0, 76.0, 46.0, 46.0, 28.0, 20.0, 17.0, 11.0, 8.0, 3.0, 3.0, 5.0, 2.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01136016845703125, -0.01098942756652832, -0.01061868667602539, -0.010247945785522461, -0.009877204895019531, -0.009506464004516602, -0.009135723114013672, -0.008764982223510742, -0.008394241333007812, -0.008023500442504883, -0.007652759552001953, -0.0072820186614990234, -0.006911277770996094, -0.006540536880493164, -0.006169795989990234, -0.005799055099487305, -0.005428314208984375, -0.005057573318481445, -0.004686832427978516, -0.004316091537475586, -0.003945350646972656, -0.0035746097564697266, -0.003203868865966797, -0.002833127975463867, -0.0024623870849609375, -0.002091646194458008, -0.0017209053039550781, -0.0013501644134521484, -0.0009794235229492188, -0.0006086826324462891, -0.00023794174194335938, 0.0001327991485595703, 0.0005035400390625, 0.0008742809295654297, 0.0012450218200683594, 0.001615762710571289, 0.0019865036010742188, 0.0023572444915771484, 0.002727985382080078, 0.003098726272583008, 0.0034694671630859375, 0.003840208053588867, 0.004210948944091797, 0.0045816898345947266, 0.004952430725097656, 0.005323171615600586, 0.005693912506103516, 0.006064653396606445, 0.006435394287109375, 0.006806135177612305, 0.007176876068115234, 0.007547616958618164, 0.007918357849121094, 0.008289098739624023, 0.008659839630126953, 0.009030580520629883, 0.009401321411132812, 0.009772062301635742, 0.010142803192138672, 0.010513544082641602, 0.010884284973144531, 0.011255025863647461, 0.01162576675415039, 0.01199650764465332, 0.01236724853515625]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 7.0, 6.0, 12.0, 27.0, 58.0, 90.0, 126.0, 164.0, 186.0, 114.0, 74.0, 62.0, 33.0, 19.0, 10.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.4505625069141388, -0.43900638818740845, -0.4274502396583557, -0.41589412093162537, -0.404338002204895, -0.3927818536758423, -0.38122573494911194, -0.3696696162223816, -0.35811346769332886, -0.3465573489665985, -0.3350012004375458, -0.32344508171081543, -0.3118889331817627, -0.30033281445503235, -0.288776695728302, -0.27722054719924927, -0.2656644284725189, -0.2541083097457886, -0.24255216121673584, -0.2309960424900055, -0.21943990886211395, -0.2078837752342224, -0.19632765650749207, -0.18477152287960052, -0.17321538925170898, -0.16165925562381744, -0.1501031219959259, -0.13854700326919556, -0.12699086964130402, -0.11543473601341248, -0.10387860983610153, -0.09232248365879059, -0.08076637983322144, -0.0692102462053299, -0.05765412002801895, -0.04609799012541771, -0.03454186022281647, -0.022985730320215225, -0.011429600417613983, 0.00012652575969696045, 0.011682659387588501, 0.023238789290189743, 0.034794919192790985, 0.04635104909539223, 0.05790717899799347, 0.06946331262588501, 0.08101943880319595, 0.0925755649805069, 0.10413169860839844, 0.11568783223628998, 0.12724396586418152, 0.13880008459091187, 0.1503562182188034, 0.16191235184669495, 0.1734684705734253, 0.18502460420131683, 0.19658073782920837, 0.20813687145709991, 0.21969300508499146, 0.2312491238117218, 0.24280525743961334, 0.2543613910675049, 0.26591750979423523, 0.2774736285209656, 0.2890297770500183]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 3.0, 1.0, 4.0, 8.0, 7.0, 9.0, 3.0, 6.0, 9.0, 19.0, 10.0, 14.0, 12.0, 33.0, 26.0, 28.0, 34.0, 23.0, 29.0, 30.0, 40.0, 34.0, 45.0, 40.0, 37.0, 49.0, 43.0, 44.0, 39.0, 42.0, 32.0, 28.0, 26.0, 34.0, 24.0, 23.0, 19.0, 17.0, 18.0, 12.0, 10.0, 8.0, 14.0, 7.0, 4.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.23896682262420654, -0.2311481088399887, -0.22332940995693207, -0.21551069617271423, -0.2076919972896576, -0.19987328350543976, -0.19205456972122192, -0.18423587083816528, -0.17641717195510864, -0.1685984581708908, -0.16077975928783417, -0.15296104550361633, -0.1451423466205597, -0.13732363283634186, -0.12950491905212402, -0.12168622016906738, -0.11386750638484955, -0.10604880005121231, -0.09823009371757507, -0.09041137993335724, -0.0825926810503006, -0.07477396726608276, -0.06695526093244553, -0.05913655459880829, -0.05131784826517105, -0.043499141931533813, -0.035680435597896576, -0.02786172553896904, -0.020043019205331802, -0.012224312871694565, -0.004405602812767029, 0.0034131035208702087, 0.011231809854507446, 0.019050516188144684, 0.02686922438442707, 0.03468793258070946, 0.042506638914346695, 0.05032534524798393, 0.05814405530691147, 0.0659627616405487, 0.07378146797418594, 0.08160017430782318, 0.08941888064146042, 0.09723758697509766, 0.10505630075931549, 0.11287499964237213, 0.12069371342658997, 0.1285124123096466, 0.13633112609386444, 0.14414983987808228, 0.15196853876113892, 0.15978725254535675, 0.1676059514284134, 0.17542466521263123, 0.18324336409568787, 0.1910620778799057, 0.19888079166412354, 0.20669950544834137, 0.214518204331398, 0.22233691811561584, 0.23015561699867249, 0.23797433078289032, 0.24579304456710815, 0.2536117434501648, 0.26143044233322144]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 0.0, 1.0, 1.0, 4.0, 10.0, 4.0, 9.0, 7.0, 21.0, 22.0, 26.0, 41.0, 53.0, 81.0, 99.0, 141.0, 207.0, 293.0, 385.0, 652.0, 950.0, 1511.0, 2585.0, 4842.0, 9592.0, 23540.0, 85643.0, 697571.0, 2606771.0, 633952.0, 81207.0, 22507.0, 9680.0, 4669.0, 2689.0, 1523.0, 953.0, 643.0, 422.0, 262.0, 198.0, 134.0, 100.0, 64.0, 53.0, 41.0, 38.0, 28.0, 14.0, 11.0, 12.0, 5.0, 7.0, 7.0, 5.0, 4.0, 1.0, 3.0], "bins": [-0.120361328125, -0.11687088012695312, -0.11338043212890625, -0.10988998413085938, -0.1063995361328125, -0.10290908813476562, -0.09941864013671875, -0.09592819213867188, -0.092437744140625, -0.08894729614257812, -0.08545684814453125, -0.08196640014648438, -0.0784759521484375, -0.07498550415039062, -0.07149505615234375, -0.06800460815429688, -0.06451416015625, -0.061023712158203125, -0.05753326416015625, -0.054042816162109375, -0.0505523681640625, -0.047061920166015625, -0.04357147216796875, -0.040081024169921875, -0.036590576171875, -0.033100128173828125, -0.02960968017578125, -0.026119232177734375, -0.0226287841796875, -0.019138336181640625, -0.01564788818359375, -0.012157440185546875, -0.0086669921875, -0.005176544189453125, -0.00168609619140625, 0.001804351806640625, 0.0052947998046875, 0.008785247802734375, 0.01227569580078125, 0.015766143798828125, 0.019256591796875, 0.022747039794921875, 0.02623748779296875, 0.029727935791015625, 0.0332183837890625, 0.036708831787109375, 0.04019927978515625, 0.043689727783203125, 0.04718017578125, 0.050670623779296875, 0.05416107177734375, 0.057651519775390625, 0.0611419677734375, 0.06463241577148438, 0.06812286376953125, 0.07161331176757812, 0.075103759765625, 0.07859420776367188, 0.08208465576171875, 0.08557510375976562, 0.0890655517578125, 0.09255599975585938, 0.09604644775390625, 0.09953689575195312, 0.10302734375]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 6.0, 5.0, 9.0, 4.0, 7.0, 19.0, 19.0, 26.0, 34.0, 31.0, 35.0, 42.0, 47.0, 57.0, 57.0, 46.0, 69.0, 68.0, 62.0, 51.0, 46.0, 46.0, 45.0, 26.0, 22.0, 35.0, 20.0, 14.0, 21.0, 15.0, 9.0, 10.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0888671875, -0.08586597442626953, -0.08286476135253906, -0.0798635482788086, -0.07686233520507812, -0.07386112213134766, -0.07085990905761719, -0.06785869598388672, -0.06485748291015625, -0.06185626983642578, -0.05885505676269531, -0.055853843688964844, -0.052852630615234375, -0.049851417541503906, -0.04685020446777344, -0.04384899139404297, -0.0408477783203125, -0.03784656524658203, -0.03484535217285156, -0.031844139099121094, -0.028842926025390625, -0.025841712951660156, -0.022840499877929688, -0.01983928680419922, -0.01683807373046875, -0.013836860656738281, -0.010835647583007812, -0.007834434509277344, -0.004833221435546875, -0.0018320083618164062, 0.0011692047119140625, 0.004170417785644531, 0.007171630859375, 0.010172843933105469, 0.013174057006835938, 0.016175270080566406, 0.019176483154296875, 0.022177696228027344, 0.025178909301757812, 0.02818012237548828, 0.03118133544921875, 0.03418254852294922, 0.03718376159667969, 0.040184974670410156, 0.043186187744140625, 0.046187400817871094, 0.04918861389160156, 0.05218982696533203, 0.0551910400390625, 0.05819225311279297, 0.06119346618652344, 0.0641946792602539, 0.06719589233398438, 0.07019710540771484, 0.07319831848144531, 0.07619953155517578, 0.07920074462890625, 0.08220195770263672, 0.08520317077636719, 0.08820438385009766, 0.09120559692382812, 0.0942068099975586, 0.09720802307128906, 0.10020923614501953, 0.10321044921875]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 8.0, 14.0, 12.0, 24.0, 43.0, 95.0, 208.0, 693.0, 4499.0, 153897.0, 4005177.0, 27040.0, 1826.0, 411.0, 168.0, 74.0, 35.0, 20.0, 12.0, 9.0, 8.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4326171875, -0.4183387756347656, -0.40406036376953125, -0.3897819519042969, -0.3755035400390625, -0.3612251281738281, -0.34694671630859375, -0.3326683044433594, -0.318389892578125, -0.3041114807128906, -0.28983306884765625, -0.2755546569824219, -0.2612762451171875, -0.24699783325195312, -0.23271942138671875, -0.21844100952148438, -0.20416259765625, -0.18988418579101562, -0.17560577392578125, -0.16132736206054688, -0.1470489501953125, -0.13277053833007812, -0.11849212646484375, -0.10421371459960938, -0.089935302734375, -0.07565689086914062, -0.06137847900390625, -0.047100067138671875, -0.0328216552734375, -0.018543243408203125, -0.00426483154296875, 0.010013580322265625, 0.0242919921875, 0.038570404052734375, 0.05284881591796875, 0.06712722778320312, 0.0814056396484375, 0.09568405151367188, 0.10996246337890625, 0.12424087524414062, 0.138519287109375, 0.15279769897460938, 0.16707611083984375, 0.18135452270507812, 0.1956329345703125, 0.20991134643554688, 0.22418975830078125, 0.23846817016601562, 0.25274658203125, 0.2670249938964844, 0.28130340576171875, 0.2955818176269531, 0.3098602294921875, 0.3241386413574219, 0.33841705322265625, 0.3526954650878906, 0.366973876953125, 0.3812522888183594, 0.39553070068359375, 0.4098091125488281, 0.4240875244140625, 0.4383659362792969, 0.45264434814453125, 0.4669227600097656, 0.481201171875]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 7.0, 4.0, 2.0, 8.0, 7.0, 6.0, 20.0, 22.0, 22.0, 30.0, 33.0, 59.0, 88.0, 114.0, 215.0, 336.0, 609.0, 725.0, 625.0, 411.0, 264.0, 149.0, 87.0, 60.0, 39.0, 42.0, 26.0, 15.0, 11.0, 13.0, 4.0, 4.0, 10.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.039306640625, -0.03788423538208008, -0.036461830139160156, -0.035039424896240234, -0.03361701965332031, -0.03219461441040039, -0.03077220916748047, -0.029349803924560547, -0.027927398681640625, -0.026504993438720703, -0.02508258819580078, -0.02366018295288086, -0.022237777709960938, -0.020815372467041016, -0.019392967224121094, -0.017970561981201172, -0.01654815673828125, -0.015125751495361328, -0.013703346252441406, -0.012280941009521484, -0.010858535766601562, -0.00943613052368164, -0.008013725280761719, -0.006591320037841797, -0.005168914794921875, -0.003746509552001953, -0.0023241043090820312, -0.0009016990661621094, 0.0005207061767578125, 0.0019431114196777344, 0.0033655166625976562, 0.004787921905517578, 0.0062103271484375, 0.007632732391357422, 0.009055137634277344, 0.010477542877197266, 0.011899948120117188, 0.01332235336303711, 0.014744758605957031, 0.016167163848876953, 0.017589569091796875, 0.019011974334716797, 0.02043437957763672, 0.02185678482055664, 0.023279190063476562, 0.024701595306396484, 0.026124000549316406, 0.027546405792236328, 0.02896881103515625, 0.030391216278076172, 0.031813621520996094, 0.033236026763916016, 0.03465843200683594, 0.03608083724975586, 0.03750324249267578, 0.0389256477355957, 0.040348052978515625, 0.04177045822143555, 0.04319286346435547, 0.04461526870727539, 0.04603767395019531, 0.047460079193115234, 0.048882484436035156, 0.05030488967895508, 0.051727294921875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 4.0, 10.0, 12.0, 22.0, 32.0, 44.0, 61.0, 73.0, 109.0, 113.0, 97.0, 100.0, 95.0, 78.0, 36.0, 43.0, 25.0, 20.0, 10.0, 12.0, 10.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22854658961296082, -0.22285278141498566, -0.2171589583158493, -0.21146515011787415, -0.205771341919899, -0.20007753372192383, -0.19438371062278748, -0.18868990242481232, -0.18299609422683716, -0.177302286028862, -0.17160846292972565, -0.1659146547317505, -0.16022084653377533, -0.15452703833580017, -0.14883321523666382, -0.14313940703868866, -0.1374455988407135, -0.13175179064273834, -0.126057967543602, -0.12036415934562683, -0.11467035114765167, -0.10897653549909592, -0.10328271985054016, -0.097588911652565, -0.09189508855342865, -0.0862012729048729, -0.08050746470689774, -0.07481364905834198, -0.06911984086036682, -0.06342602521181107, -0.05773221328854561, -0.05203840136528015, -0.04634459316730499, -0.040650781244039536, -0.03495696932077408, -0.029263155534863472, -0.023569343611598015, -0.017875531688332558, -0.012181717902421951, -0.006487905979156494, -0.000794094055891037, 0.0048997183330357075, 0.010593530721962452, 0.016287343576550484, 0.02198115549981594, 0.027674967423081398, 0.033368781208992004, 0.03906259313225746, 0.04475640505552292, 0.050450216978788376, 0.05614402890205383, 0.06183784455060959, 0.06753165274858475, 0.0732254683971405, 0.07891927659511566, 0.08461309224367142, 0.09030690789222717, 0.09600072354078293, 0.10169453173875809, 0.10738834738731384, 0.113082155585289, 0.11877597123384476, 0.12446978688240051, 0.13016359508037567, 0.13585740327835083]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 7.0, 3.0, 6.0, 8.0, 4.0, 6.0, 18.0, 19.0, 19.0, 23.0, 33.0, 22.0, 27.0, 26.0, 45.0, 34.0, 43.0, 47.0, 37.0, 49.0, 53.0, 45.0, 48.0, 41.0, 40.0, 38.0, 34.0, 30.0, 37.0, 30.0, 17.0, 23.0, 21.0, 20.0, 14.0, 8.0, 16.0, 6.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10078470408916473, -0.09767913073301315, -0.09457355737686157, -0.09146799147129059, -0.08836241811513901, -0.08525684475898743, -0.08215127885341644, -0.07904570549726486, -0.07594013214111328, -0.0728345587849617, -0.06972898542881012, -0.06662341952323914, -0.06351784616708755, -0.060412272810935974, -0.05730670318007469, -0.05420113354921341, -0.05109556019306183, -0.04798998683691025, -0.044884417206048965, -0.04177884757518768, -0.0386732742190361, -0.03556770086288452, -0.03246213123202324, -0.029356559738516808, -0.026250988245010376, -0.023145416751503944, -0.020039845257997513, -0.01693427376449108, -0.01382870227098465, -0.010723130777478218, -0.0076175592839717865, -0.004511987790465355, -0.0014064162969589233, 0.0016991551965475082, 0.00480472669005394, 0.007910298183560371, 0.011015869677066803, 0.014121441170573235, 0.017227012664079666, 0.020332584157586098, 0.02343815565109253, 0.02654372714459896, 0.029649298638105392, 0.032754868268966675, 0.035860441625118256, 0.038966014981269836, 0.04207158461213112, 0.0451771542429924, 0.04828272759914398, 0.05138830095529556, 0.054493870586156845, 0.05759944021701813, 0.06070501357316971, 0.06381058692932129, 0.06691615283489227, 0.07002172619104385, 0.07312729954719543, 0.07623287290334702, 0.0793384462594986, 0.08244401216506958, 0.08554958552122116, 0.08865515887737274, 0.09176072478294373, 0.0948662981390953, 0.09797187149524689]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 6.0, 8.0, 7.0, 9.0, 16.0, 24.0, 44.0, 39.0, 72.0, 93.0, 157.0, 248.0, 455.0, 774.0, 1298.0, 2438.0, 4528.0, 9428.0, 20521.0, 60095.0, 279263.0, 498608.0, 112020.0, 31798.0, 12993.0, 6254.0, 3240.0, 1727.0, 939.0, 547.0, 293.0, 214.0, 134.0, 88.0, 58.0, 33.0, 33.0, 20.0, 12.0, 11.0, 9.0, 0.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03985595703125, -0.038619041442871094, -0.03738212585449219, -0.03614521026611328, -0.034908294677734375, -0.03367137908935547, -0.03243446350097656, -0.031197547912597656, -0.02996063232421875, -0.028723716735839844, -0.027486801147460938, -0.02624988555908203, -0.025012969970703125, -0.02377605438232422, -0.022539138793945312, -0.021302223205566406, -0.0200653076171875, -0.018828392028808594, -0.017591476440429688, -0.01635456085205078, -0.015117645263671875, -0.013880729675292969, -0.012643814086914062, -0.011406898498535156, -0.01016998291015625, -0.008933067321777344, -0.0076961517333984375, -0.006459236145019531, -0.005222320556640625, -0.003985404968261719, -0.0027484893798828125, -0.0015115737915039062, -0.000274658203125, 0.0009622573852539062, 0.0021991729736328125, 0.0034360885620117188, 0.004673004150390625, 0.005909919738769531, 0.0071468353271484375, 0.008383750915527344, 0.00962066650390625, 0.010857582092285156, 0.012094497680664062, 0.013331413269042969, 0.014568328857421875, 0.01580524444580078, 0.017042160034179688, 0.018279075622558594, 0.0195159912109375, 0.020752906799316406, 0.021989822387695312, 0.02322673797607422, 0.024463653564453125, 0.02570056915283203, 0.026937484741210938, 0.028174400329589844, 0.02941131591796875, 0.030648231506347656, 0.03188514709472656, 0.03312206268310547, 0.034358978271484375, 0.03559589385986328, 0.03683280944824219, 0.038069725036621094, 0.039306640625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 5.0, 5.0, 4.0, 9.0, 7.0, 9.0, 16.0, 16.0, 17.0, 15.0, 19.0, 33.0, 31.0, 26.0, 30.0, 39.0, 27.0, 49.0, 66.0, 52.0, 47.0, 56.0, 52.0, 32.0, 48.0, 43.0, 32.0, 34.0, 33.0, 28.0, 19.0, 17.0, 25.0, 12.0, 19.0, 9.0, 8.0, 7.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.058837890625, -0.056914329528808594, -0.05499076843261719, -0.05306720733642578, -0.051143646240234375, -0.04922008514404297, -0.04729652404785156, -0.045372962951660156, -0.04344940185546875, -0.041525840759277344, -0.03960227966308594, -0.03767871856689453, -0.035755157470703125, -0.03383159637451172, -0.03190803527832031, -0.029984474182128906, -0.0280609130859375, -0.026137351989746094, -0.024213790893554688, -0.02229022979736328, -0.020366668701171875, -0.01844310760498047, -0.016519546508789062, -0.014595985412597656, -0.01267242431640625, -0.010748863220214844, -0.008825302124023438, -0.006901741027832031, -0.004978179931640625, -0.0030546188354492188, -0.0011310577392578125, 0.0007925033569335938, 0.002716064453125, 0.004639625549316406, 0.0065631866455078125, 0.008486747741699219, 0.010410308837890625, 0.012333869934082031, 0.014257431030273438, 0.016180992126464844, 0.01810455322265625, 0.020028114318847656, 0.021951675415039062, 0.02387523651123047, 0.025798797607421875, 0.02772235870361328, 0.029645919799804688, 0.031569480895996094, 0.0334930419921875, 0.035416603088378906, 0.03734016418457031, 0.03926372528076172, 0.041187286376953125, 0.04311084747314453, 0.04503440856933594, 0.046957969665527344, 0.04888153076171875, 0.050805091857910156, 0.05272865295410156, 0.05465221405029297, 0.056575775146484375, 0.05849933624267578, 0.06042289733886719, 0.062346458435058594, 0.06427001953125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 6.0, 6.0, 4.0, 12.0, 10.0, 17.0, 22.0, 31.0, 40.0, 57.0, 91.0, 209.0, 439.0, 1299.0, 4339.0, 18015.0, 129246.0, 744998.0, 125895.0, 17380.0, 4195.0, 1287.0, 470.0, 188.0, 107.0, 54.0, 34.0, 29.0, 13.0, 10.0, 12.0, 8.0, 4.0, 5.0, 8.0, 3.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046356201171875, -0.04472923278808594, -0.043102264404296875, -0.04147529602050781, -0.03984832763671875, -0.03822135925292969, -0.036594390869140625, -0.03496742248535156, -0.0333404541015625, -0.03171348571777344, -0.030086517333984375, -0.028459548950195312, -0.02683258056640625, -0.025205612182617188, -0.023578643798828125, -0.021951675415039062, -0.02032470703125, -0.018697738647460938, -0.017070770263671875, -0.015443801879882812, -0.01381683349609375, -0.012189865112304688, -0.010562896728515625, -0.008935928344726562, -0.0073089599609375, -0.0056819915771484375, -0.004055023193359375, -0.0024280548095703125, -0.00080108642578125, 0.0008258819580078125, 0.002452850341796875, 0.0040798187255859375, 0.005706787109375, 0.0073337554931640625, 0.008960723876953125, 0.010587692260742188, 0.01221466064453125, 0.013841629028320312, 0.015468597412109375, 0.017095565795898438, 0.0187225341796875, 0.020349502563476562, 0.021976470947265625, 0.023603439331054688, 0.02523040771484375, 0.026857376098632812, 0.028484344482421875, 0.030111312866210938, 0.03173828125, 0.03336524963378906, 0.034992218017578125, 0.03661918640136719, 0.03824615478515625, 0.03987312316894531, 0.041500091552734375, 0.04312705993652344, 0.0447540283203125, 0.04638099670410156, 0.048007965087890625, 0.04963493347167969, 0.05126190185546875, 0.05288887023925781, 0.054515838623046875, 0.05614280700683594, 0.057769775390625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 6.0, 5.0, 13.0, 7.0, 7.0, 13.0, 15.0, 13.0, 12.0, 22.0, 24.0, 18.0, 38.0, 36.0, 44.0, 41.0, 48.0, 58.0, 28.0, 43.0, 46.0, 58.0, 49.0, 46.0, 39.0, 48.0, 35.0, 32.0, 29.0, 23.0, 15.0, 18.0, 19.0, 7.0, 12.0, 10.0, 6.0, 4.0, 8.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.12200927734375, -0.11800289154052734, -0.11399650573730469, -0.10999011993408203, -0.10598373413085938, -0.10197734832763672, -0.09797096252441406, -0.0939645767211914, -0.08995819091796875, -0.0859518051147461, -0.08194541931152344, -0.07793903350830078, -0.07393264770507812, -0.06992626190185547, -0.06591987609863281, -0.061913490295410156, -0.0579071044921875, -0.053900718688964844, -0.04989433288574219, -0.04588794708251953, -0.041881561279296875, -0.03787517547607422, -0.03386878967285156, -0.029862403869628906, -0.02585601806640625, -0.021849632263183594, -0.017843246459960938, -0.013836860656738281, -0.009830474853515625, -0.005824089050292969, -0.0018177032470703125, 0.0021886825561523438, 0.006195068359375, 0.010201454162597656, 0.014207839965820312, 0.01821422576904297, 0.022220611572265625, 0.02622699737548828, 0.030233383178710938, 0.034239768981933594, 0.03824615478515625, 0.042252540588378906, 0.04625892639160156, 0.05026531219482422, 0.054271697998046875, 0.05827808380126953, 0.06228446960449219, 0.06629085540771484, 0.0702972412109375, 0.07430362701416016, 0.07831001281738281, 0.08231639862060547, 0.08632278442382812, 0.09032917022705078, 0.09433555603027344, 0.0983419418334961, 0.10234832763671875, 0.1063547134399414, 0.11036109924316406, 0.11436748504638672, 0.11837387084960938, 0.12238025665283203, 0.1263866424560547, 0.13039302825927734, 0.1343994140625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 6.0, 2.0, 11.0, 8.0, 10.0, 14.0, 9.0, 26.0, 35.0, 49.0, 68.0, 114.0, 142.0, 241.0, 376.0, 622.0, 1032.0, 1910.0, 3602.0, 8001.0, 22183.0, 105460.0, 628460.0, 219045.0, 35580.0, 11047.0, 4774.0, 2402.0, 1274.0, 688.0, 486.0, 270.0, 186.0, 125.0, 85.0, 53.0, 39.0, 17.0, 21.0, 25.0, 10.0, 12.0, 12.0, 11.0, 5.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.016357421875, -0.01588571071624756, -0.015413999557495117, -0.014942288398742676, -0.014470577239990234, -0.013998866081237793, -0.013527154922485352, -0.01305544376373291, -0.012583732604980469, -0.012112021446228027, -0.011640310287475586, -0.011168599128723145, -0.010696887969970703, -0.010225176811218262, -0.00975346565246582, -0.009281754493713379, -0.008810043334960938, -0.008338332176208496, -0.007866621017456055, -0.007394909858703613, -0.006923198699951172, -0.0064514875411987305, -0.005979776382446289, -0.005508065223693848, -0.005036354064941406, -0.004564642906188965, -0.0040929317474365234, -0.003621220588684082, -0.0031495094299316406, -0.0026777982711791992, -0.002206087112426758, -0.0017343759536743164, -0.001262664794921875, -0.0007909536361694336, -0.0003192424774169922, 0.00015246868133544922, 0.0006241798400878906, 0.001095890998840332, 0.0015676021575927734, 0.002039313316345215, 0.0025110244750976562, 0.0029827356338500977, 0.003454446792602539, 0.0039261579513549805, 0.004397869110107422, 0.004869580268859863, 0.005341291427612305, 0.005813002586364746, 0.0062847137451171875, 0.006756424903869629, 0.00722813606262207, 0.007699847221374512, 0.008171558380126953, 0.008643269538879395, 0.009114980697631836, 0.009586691856384277, 0.010058403015136719, 0.01053011417388916, 0.011001825332641602, 0.011473536491394043, 0.011945247650146484, 0.012416958808898926, 0.012888669967651367, 0.013360381126403809, 0.01383209228515625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 4.0, 16.0, 8.0, 19.0, 26.0, 45.0, 43.0, 90.0, 89.0, 124.0, 108.0, 124.0, 90.0, 70.0, 48.0, 33.0, 19.0, 10.0, 12.0, 9.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.510185241699219e-06, -7.243826985359192e-06, -6.977468729019165e-06, -6.711110472679138e-06, -6.444752216339111e-06, -6.1783939599990845e-06, -5.912035703659058e-06, -5.645677447319031e-06, -5.379319190979004e-06, -5.112960934638977e-06, -4.84660267829895e-06, -4.580244421958923e-06, -4.3138861656188965e-06, -4.04752790927887e-06, -3.7811696529388428e-06, -3.514811396598816e-06, -3.248453140258789e-06, -2.982094883918762e-06, -2.7157366275787354e-06, -2.4493783712387085e-06, -2.1830201148986816e-06, -1.9166618585586548e-06, -1.650303602218628e-06, -1.383945345878601e-06, -1.1175870895385742e-06, -8.512288331985474e-07, -5.848705768585205e-07, -3.1851232051849365e-07, -5.21540641784668e-08, 2.1420419216156006e-07, 4.805624485015869e-07, 7.469207048416138e-07, 1.0132789611816406e-06, 1.2796372175216675e-06, 1.5459954738616943e-06, 1.8123537302017212e-06, 2.078711986541748e-06, 2.345070242881775e-06, 2.6114284992218018e-06, 2.8777867555618286e-06, 3.1441450119018555e-06, 3.4105032682418823e-06, 3.676861524581909e-06, 3.943219780921936e-06, 4.209578037261963e-06, 4.47593629360199e-06, 4.742294549942017e-06, 5.0086528062820435e-06, 5.27501106262207e-06, 5.541369318962097e-06, 5.807727575302124e-06, 6.074085831642151e-06, 6.340444087982178e-06, 6.606802344322205e-06, 6.8731606006622314e-06, 7.139518857002258e-06, 7.405877113342285e-06, 7.672235369682312e-06, 7.938593626022339e-06, 8.204951882362366e-06, 8.471310138702393e-06, 8.73766839504242e-06, 9.004026651382446e-06, 9.270384907722473e-06, 9.5367431640625e-06]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 6.0, 7.0, 6.0, 6.0, 14.0, 19.0, 26.0, 51.0, 71.0, 134.0, 218.0, 479.0, 968.0, 2269.0, 5625.0, 19753.0, 169328.0, 739909.0, 88020.0, 13751.0, 4472.0, 1768.0, 777.0, 382.0, 191.0, 112.0, 71.0, 42.0, 28.0, 16.0, 10.0, 5.0, 7.0, 3.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0249481201171875, -0.024126768112182617, -0.023305416107177734, -0.02248406410217285, -0.02166271209716797, -0.020841360092163086, -0.020020008087158203, -0.01919865608215332, -0.018377304077148438, -0.017555952072143555, -0.016734600067138672, -0.01591324806213379, -0.015091896057128906, -0.014270544052124023, -0.01344919204711914, -0.012627840042114258, -0.011806488037109375, -0.010985136032104492, -0.01016378402709961, -0.009342432022094727, -0.008521080017089844, -0.007699728012084961, -0.006878376007080078, -0.006057024002075195, -0.0052356719970703125, -0.00441431999206543, -0.003592967987060547, -0.002771615982055664, -0.0019502639770507812, -0.0011289119720458984, -0.0003075599670410156, 0.0005137920379638672, 0.00133514404296875, 0.002156496047973633, 0.0029778480529785156, 0.0037992000579833984, 0.004620552062988281, 0.005441904067993164, 0.006263256072998047, 0.00708460807800293, 0.007905960083007812, 0.008727312088012695, 0.009548664093017578, 0.010370016098022461, 0.011191368103027344, 0.012012720108032227, 0.01283407211303711, 0.013655424118041992, 0.014476776123046875, 0.015298128128051758, 0.01611948013305664, 0.016940832138061523, 0.017762184143066406, 0.01858353614807129, 0.019404888153076172, 0.020226240158081055, 0.021047592163085938, 0.02186894416809082, 0.022690296173095703, 0.023511648178100586, 0.02433300018310547, 0.02515435218811035, 0.025975704193115234, 0.026797056198120117, 0.027618408203125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 2.0, 8.0, 7.0, 11.0, 16.0, 24.0, 33.0, 72.0, 92.0, 148.0, 185.0, 126.0, 98.0, 62.0, 48.0, 20.0, 15.0, 10.0, 5.0, 2.0, 7.0, 2.0, 4.0, 0.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00662994384765625, -0.0064321160316467285, -0.006234288215637207, -0.0060364603996276855, -0.005838632583618164, -0.005640804767608643, -0.005442976951599121, -0.0052451491355896, -0.005047321319580078, -0.004849493503570557, -0.004651665687561035, -0.004453837871551514, -0.004256010055541992, -0.004058182239532471, -0.0038603544235229492, -0.0036625266075134277, -0.0034646987915039062, -0.0032668709754943848, -0.0030690431594848633, -0.002871215343475342, -0.0026733875274658203, -0.002475559711456299, -0.0022777318954467773, -0.002079904079437256, -0.0018820762634277344, -0.0016842484474182129, -0.0014864206314086914, -0.00128859281539917, -0.0010907649993896484, -0.000892937183380127, -0.0006951093673706055, -0.000497281551361084, -0.0002994537353515625, -0.00010162591934204102, 9.620189666748047e-05, 0.00029402971267700195, 0.0004918575286865234, 0.0006896853446960449, 0.0008875131607055664, 0.0010853409767150879, 0.0012831687927246094, 0.0014809966087341309, 0.0016788244247436523, 0.0018766522407531738, 0.0020744800567626953, 0.002272307872772217, 0.0024701356887817383, 0.0026679635047912598, 0.0028657913208007812, 0.0030636191368103027, 0.0032614469528198242, 0.0034592747688293457, 0.003657102584838867, 0.0038549304008483887, 0.00405275821685791, 0.004250586032867432, 0.004448413848876953, 0.004646241664886475, 0.004844069480895996, 0.005041897296905518, 0.005239725112915039, 0.0054375529289245605, 0.005635380744934082, 0.0058332085609436035, 0.006031036376953125]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 9.0, 10.0, 15.0, 51.0, 60.0, 99.0, 140.0, 152.0, 132.0, 134.0, 74.0, 56.0, 32.0, 18.0, 12.0, 7.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2007479965686798, -0.19636370241641998, -0.19197940826416016, -0.18759509921073914, -0.1832108050584793, -0.17882651090621948, -0.17444221675395966, -0.17005792260169983, -0.16567362844944, -0.16128933429718018, -0.15690504014492035, -0.15252074599266052, -0.1481364369392395, -0.14375214278697968, -0.13936784863471985, -0.13498355448246002, -0.1305992603302002, -0.12621496617794037, -0.12183066457509995, -0.11744637042284012, -0.11306207627058029, -0.10867777466773987, -0.10429348051548004, -0.09990918636322021, -0.0955248773097992, -0.09114058315753937, -0.08675628155469894, -0.08237198740243912, -0.07798769325017929, -0.07360339164733887, -0.06921909749507904, -0.06483480334281921, -0.060450516641139984, -0.05606621876358986, -0.05168192461133003, -0.04729762673377991, -0.04291333258152008, -0.038529034703969955, -0.03414473682641983, -0.029760440811514854, -0.02537614479660988, -0.020991848781704903, -0.016607552766799927, -0.012223254889249802, -0.007838958874344826, -0.00345466285943985, 0.0009296350181102753, 0.005313931033015251, 0.009698227047920227, 0.014082523062825203, 0.01846681907773018, 0.022851116955280304, 0.02723541297018528, 0.031619708985090256, 0.03600400686264038, 0.04038830101490021, 0.04477259889245033, 0.04915689677000046, 0.053541190922260284, 0.05792548879981041, 0.062309786677360535, 0.06669408082962036, 0.07107837498188019, 0.07546267658472061, 0.07984697073698044]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 2.0, 5.0, 2.0, 6.0, 6.0, 9.0, 14.0, 10.0, 21.0, 21.0, 28.0, 24.0, 35.0, 36.0, 40.0, 41.0, 39.0, 49.0, 49.0, 58.0, 61.0, 41.0, 49.0, 44.0, 41.0, 40.0, 30.0, 42.0, 30.0, 23.0, 23.0, 23.0, 14.0, 16.0, 10.0, 10.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06404274702072144, -0.062102433294057846, -0.06016211956739426, -0.05822180584073067, -0.05628149211406708, -0.05434117838740349, -0.0524008646607399, -0.05046054720878601, -0.04852023720741272, -0.04657992348074913, -0.04463960975408554, -0.04269929602742195, -0.04075898230075836, -0.03881866857409477, -0.03687835484743118, -0.034938037395477295, -0.032997723668813705, -0.031057409942150116, -0.029117096215486526, -0.027176782488822937, -0.025236468762159348, -0.023296155035495758, -0.02135583944618702, -0.01941552571952343, -0.01747521199285984, -0.015534898266196251, -0.013594584539532661, -0.011654269881546497, -0.009713956154882908, -0.007773642428219318, -0.005833327770233154, -0.003893014043569565, -0.0019527003169059753, -1.238635741174221e-05, 0.001927927602082491, 0.0038682417944073677, 0.005808555521070957, 0.007748869247734547, 0.00968918390572071, 0.0116294976323843, 0.01356981135904789, 0.01551012508571148, 0.01745043881237507, 0.019390754401683807, 0.021331068128347397, 0.023271381855010986, 0.025211695581674576, 0.027152009308338165, 0.029092323035001755, 0.031032636761665344, 0.032972950488328934, 0.03491326421499252, 0.03685357794165611, 0.0387938916683197, 0.04073420912027359, 0.04267451912164688, 0.04461483657360077, 0.04655515030026436, 0.04849546402692795, 0.05043577775359154, 0.05237609148025513, 0.054316405206918716, 0.056256718933582306, 0.058197036385536194, 0.060137346386909485]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 5.0, 2.0, 6.0, 9.0, 9.0, 17.0, 7.0, 33.0, 45.0, 33.0, 67.0, 73.0, 120.0, 185.0, 272.0, 364.0, 586.0, 874.0, 1475.0, 2388.0, 4032.0, 7352.0, 13613.0, 29518.0, 87082.0, 331149.0, 393576.0, 106481.0, 34402.0, 15107.0, 8017.0, 4457.0, 2571.0, 1554.0, 1006.0, 647.0, 440.0, 296.0, 209.0, 146.0, 91.0, 63.0, 45.0, 37.0, 25.0, 23.0, 25.0, 8.0, 8.0, 5.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05548095703125, -0.05363655090332031, -0.051792144775390625, -0.04994773864746094, -0.04810333251953125, -0.04625892639160156, -0.044414520263671875, -0.04257011413574219, -0.0407257080078125, -0.03888130187988281, -0.037036895751953125, -0.03519248962402344, -0.03334808349609375, -0.03150367736816406, -0.029659271240234375, -0.027814865112304688, -0.025970458984375, -0.024126052856445312, -0.022281646728515625, -0.020437240600585938, -0.01859283447265625, -0.016748428344726562, -0.014904022216796875, -0.013059616088867188, -0.0112152099609375, -0.009370803833007812, -0.007526397705078125, -0.0056819915771484375, -0.00383758544921875, -0.0019931793212890625, -0.000148773193359375, 0.0016956329345703125, 0.0035400390625, 0.0053844451904296875, 0.007228851318359375, 0.009073257446289062, 0.01091766357421875, 0.012762069702148438, 0.014606475830078125, 0.016450881958007812, 0.0182952880859375, 0.020139694213867188, 0.021984100341796875, 0.023828506469726562, 0.02567291259765625, 0.027517318725585938, 0.029361724853515625, 0.031206130981445312, 0.033050537109375, 0.03489494323730469, 0.036739349365234375, 0.03858375549316406, 0.04042816162109375, 0.04227256774902344, 0.044116973876953125, 0.04596138000488281, 0.0478057861328125, 0.04965019226074219, 0.051494598388671875, 0.05333900451660156, 0.05518341064453125, 0.05702781677246094, 0.058872222900390625, 0.06071662902832031, 0.06256103515625]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 5.0, 5.0, 6.0, 4.0, 10.0, 14.0, 14.0, 17.0, 28.0, 24.0, 30.0, 24.0, 42.0, 35.0, 45.0, 44.0, 51.0, 72.0, 45.0, 49.0, 47.0, 47.0, 46.0, 48.0, 30.0, 37.0, 36.0, 26.0, 18.0, 15.0, 32.0, 14.0, 16.0, 9.0, 7.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.15087890625, -0.1466541290283203, -0.14242935180664062, -0.13820457458496094, -0.13397979736328125, -0.12975502014160156, -0.12553024291992188, -0.12130546569824219, -0.1170806884765625, -0.11285591125488281, -0.10863113403320312, -0.10440635681152344, -0.10018157958984375, -0.09595680236816406, -0.09173202514648438, -0.08750724792480469, -0.083282470703125, -0.07905769348144531, -0.07483291625976562, -0.07060813903808594, -0.06638336181640625, -0.06215858459472656, -0.057933807373046875, -0.05370903015136719, -0.0494842529296875, -0.04525947570800781, -0.041034698486328125, -0.03680992126464844, -0.03258514404296875, -0.028360366821289062, -0.024135589599609375, -0.019910812377929688, -0.01568603515625, -0.011461257934570312, -0.007236480712890625, -0.0030117034912109375, 0.00121307373046875, 0.0054378509521484375, 0.009662628173828125, 0.013887405395507812, 0.0181121826171875, 0.022336959838867188, 0.026561737060546875, 0.030786514282226562, 0.03501129150390625, 0.03923606872558594, 0.043460845947265625, 0.04768562316894531, 0.051910400390625, 0.05613517761230469, 0.060359954833984375, 0.06458473205566406, 0.06880950927734375, 0.07303428649902344, 0.07725906372070312, 0.08148384094238281, 0.0857086181640625, 0.08993339538574219, 0.09415817260742188, 0.09838294982910156, 0.10260772705078125, 0.10683250427246094, 0.11105728149414062, 0.11528205871582031, 0.1195068359375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 1.0, 3.0, 4.0, 10.0, 15.0, 12.0, 22.0, 22.0, 29.0, 44.0, 41.0, 97.0, 107.0, 213.0, 441.0, 1249.0, 5551.0, 37811.0, 715767.0, 263285.0, 18900.0, 3208.0, 797.0, 357.0, 173.0, 107.0, 93.0, 53.0, 42.0, 24.0, 22.0, 16.0, 9.0, 4.0, 6.0, 5.0, 4.0, 2.0, 8.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.1610107421875, -0.1562519073486328, -0.15149307250976562, -0.14673423767089844, -0.14197540283203125, -0.13721656799316406, -0.13245773315429688, -0.1276988983154297, -0.1229400634765625, -0.11818122863769531, -0.11342239379882812, -0.10866355895996094, -0.10390472412109375, -0.09914588928222656, -0.09438705444335938, -0.08962821960449219, -0.084869384765625, -0.08011054992675781, -0.07535171508789062, -0.07059288024902344, -0.06583404541015625, -0.06107521057128906, -0.056316375732421875, -0.05155754089355469, -0.0467987060546875, -0.04203987121582031, -0.037281036376953125, -0.03252220153808594, -0.02776336669921875, -0.023004531860351562, -0.018245697021484375, -0.013486862182617188, -0.00872802734375, -0.0039691925048828125, 0.000789642333984375, 0.0055484771728515625, 0.01030731201171875, 0.015066146850585938, 0.019824981689453125, 0.024583816528320312, 0.0293426513671875, 0.03410148620605469, 0.038860321044921875, 0.04361915588378906, 0.04837799072265625, 0.05313682556152344, 0.057895660400390625, 0.06265449523925781, 0.067413330078125, 0.07217216491699219, 0.07693099975585938, 0.08168983459472656, 0.08644866943359375, 0.09120750427246094, 0.09596633911132812, 0.10072517395019531, 0.1054840087890625, 0.11024284362792969, 0.11500167846679688, 0.11976051330566406, 0.12451934814453125, 0.12927818298339844, 0.13403701782226562, 0.1387958526611328, 0.1435546875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 4.0, 7.0, 4.0, 6.0, 9.0, 8.0, 11.0, 15.0, 16.0, 19.0, 33.0, 24.0, 41.0, 32.0, 28.0, 42.0, 35.0, 40.0, 46.0, 55.0, 53.0, 56.0, 43.0, 49.0, 30.0, 44.0, 21.0, 29.0, 27.0, 30.0, 28.0, 23.0, 16.0, 13.0, 14.0, 9.0, 3.0, 9.0, 11.0, 6.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1373291015625, -0.1331806182861328, -0.12903213500976562, -0.12488365173339844, -0.12073516845703125, -0.11658668518066406, -0.11243820190429688, -0.10828971862792969, -0.1041412353515625, -0.09999275207519531, -0.09584426879882812, -0.09169578552246094, -0.08754730224609375, -0.08339881896972656, -0.07925033569335938, -0.07510185241699219, -0.070953369140625, -0.06680488586425781, -0.06265640258789062, -0.05850791931152344, -0.05435943603515625, -0.05021095275878906, -0.046062469482421875, -0.04191398620605469, -0.0377655029296875, -0.03361701965332031, -0.029468536376953125, -0.025320053100585938, -0.02117156982421875, -0.017023086547851562, -0.012874603271484375, -0.008726119995117188, -0.00457763671875, -0.0004291534423828125, 0.003719329833984375, 0.007867813110351562, 0.01201629638671875, 0.016164779663085938, 0.020313262939453125, 0.024461746215820312, 0.0286102294921875, 0.03275871276855469, 0.036907196044921875, 0.04105567932128906, 0.04520416259765625, 0.04935264587402344, 0.053501129150390625, 0.05764961242675781, 0.061798095703125, 0.06594657897949219, 0.07009506225585938, 0.07424354553222656, 0.07839202880859375, 0.08254051208496094, 0.08668899536132812, 0.09083747863769531, 0.0949859619140625, 0.09913444519042969, 0.10328292846679688, 0.10743141174316406, 0.11157989501953125, 0.11572837829589844, 0.11987686157226562, 0.12402534484863281, 0.128173828125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 4.0, 11.0, 12.0, 22.0, 23.0, 33.0, 54.0, 87.0, 228.0, 548.0, 2004.0, 14981.0, 418281.0, 589725.0, 19070.0, 2377.0, 591.0, 227.0, 102.0, 57.0, 43.0, 23.0, 16.0, 11.0, 8.0, 3.0, 6.0, 0.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0438232421875, -0.04236459732055664, -0.04090595245361328, -0.03944730758666992, -0.03798866271972656, -0.0365300178527832, -0.035071372985839844, -0.033612728118896484, -0.032154083251953125, -0.030695438385009766, -0.029236793518066406, -0.027778148651123047, -0.026319503784179688, -0.024860858917236328, -0.02340221405029297, -0.02194356918334961, -0.02048492431640625, -0.01902627944946289, -0.01756763458251953, -0.016108989715576172, -0.014650344848632812, -0.013191699981689453, -0.011733055114746094, -0.010274410247802734, -0.008815765380859375, -0.007357120513916016, -0.005898475646972656, -0.004439830780029297, -0.0029811859130859375, -0.0015225410461425781, -6.389617919921875e-05, 0.0013947486877441406, 0.0028533935546875, 0.004312038421630859, 0.005770683288574219, 0.007229328155517578, 0.008687973022460938, 0.010146617889404297, 0.011605262756347656, 0.013063907623291016, 0.014522552490234375, 0.015981197357177734, 0.017439842224121094, 0.018898487091064453, 0.020357131958007812, 0.021815776824951172, 0.02327442169189453, 0.02473306655883789, 0.02619171142578125, 0.02765035629272461, 0.02910900115966797, 0.030567646026611328, 0.03202629089355469, 0.03348493576049805, 0.034943580627441406, 0.036402225494384766, 0.037860870361328125, 0.039319515228271484, 0.040778160095214844, 0.0422368049621582, 0.04369544982910156, 0.04515409469604492, 0.04661273956298828, 0.04807138442993164, 0.049530029296875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 7.0, 9.0, 7.0, 13.0, 23.0, 9.0, 27.0, 44.0, 36.0, 50.0, 90.0, 79.0, 101.0, 119.0, 78.0, 101.0, 44.0, 41.0, 32.0, 27.0, 17.0, 15.0, 12.0, 8.0, 5.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.516674041748047e-06, -3.3760443329811096e-06, -3.2354146242141724e-06, -3.094784915447235e-06, -2.954155206680298e-06, -2.8135254979133606e-06, -2.6728957891464233e-06, -2.532266080379486e-06, -2.391636371612549e-06, -2.2510066628456116e-06, -2.1103769540786743e-06, -1.969747245311737e-06, -1.8291175365447998e-06, -1.6884878277778625e-06, -1.5478581190109253e-06, -1.407228410243988e-06, -1.2665987014770508e-06, -1.1259689927101135e-06, -9.853392839431763e-07, -8.44709575176239e-07, -7.040798664093018e-07, -5.634501576423645e-07, -4.2282044887542725e-07, -2.8219074010849e-07, -1.4156103134155273e-07, -9.313225746154785e-10, 1.3969838619232178e-07, 2.8032809495925903e-07, 4.209578037261963e-07, 5.615875124931335e-07, 7.022172212600708e-07, 8.428469300270081e-07, 9.834766387939453e-07, 1.1241063475608826e-06, 1.2647360563278198e-06, 1.405365765094757e-06, 1.5459954738616943e-06, 1.6866251826286316e-06, 1.8272548913955688e-06, 1.967884600162506e-06, 2.1085143089294434e-06, 2.2491440176963806e-06, 2.389773726463318e-06, 2.530403435230255e-06, 2.6710331439971924e-06, 2.8116628527641296e-06, 2.952292561531067e-06, 3.092922270298004e-06, 3.2335519790649414e-06, 3.3741816878318787e-06, 3.514811396598816e-06, 3.655441105365753e-06, 3.7960708141326904e-06, 3.936700522899628e-06, 4.077330231666565e-06, 4.217959940433502e-06, 4.3585896492004395e-06, 4.499219357967377e-06, 4.639849066734314e-06, 4.780478775501251e-06, 4.9211084842681885e-06, 5.061738193035126e-06, 5.202367901802063e-06, 5.342997610569e-06, 5.4836273193359375e-06]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 8.0, 6.0, 7.0, 4.0, 13.0, 19.0, 21.0, 17.0, 44.0, 128.0, 275.0, 872.0, 2779.0, 13770.0, 474735.0, 536802.0, 14894.0, 2765.0, 837.0, 297.0, 122.0, 48.0, 29.0, 14.0, 15.0, 10.0, 5.0, 4.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.057586669921875, -0.05572986602783203, -0.05387306213378906, -0.052016258239746094, -0.050159454345703125, -0.048302650451660156, -0.04644584655761719, -0.04458904266357422, -0.04273223876953125, -0.04087543487548828, -0.03901863098144531, -0.037161827087402344, -0.035305023193359375, -0.033448219299316406, -0.03159141540527344, -0.02973461151123047, -0.0278778076171875, -0.02602100372314453, -0.024164199829101562, -0.022307395935058594, -0.020450592041015625, -0.018593788146972656, -0.016736984252929688, -0.014880180358886719, -0.01302337646484375, -0.011166572570800781, -0.009309768676757812, -0.007452964782714844, -0.005596160888671875, -0.0037393569946289062, -0.0018825531005859375, -2.574920654296875e-05, 0.0018310546875, 0.0036878585815429688, 0.0055446624755859375, 0.007401466369628906, 0.009258270263671875, 0.011115074157714844, 0.012971878051757812, 0.014828681945800781, 0.01668548583984375, 0.01854228973388672, 0.020399093627929688, 0.022255897521972656, 0.024112701416015625, 0.025969505310058594, 0.027826309204101562, 0.02968311309814453, 0.0315399169921875, 0.03339672088623047, 0.03525352478027344, 0.037110328674316406, 0.038967132568359375, 0.040823936462402344, 0.04268074035644531, 0.04453754425048828, 0.04639434814453125, 0.04825115203857422, 0.05010795593261719, 0.051964759826660156, 0.053821563720703125, 0.055678367614746094, 0.05753517150878906, 0.05939197540283203, 0.061248779296875]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 6.0, 4.0, 5.0, 13.0, 15.0, 14.0, 27.0, 49.0, 60.0, 72.0, 118.0, 140.0, 143.0, 87.0, 79.0, 51.0, 39.0, 15.0, 17.0, 10.0, 2.0, 1.0, 3.0, 6.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0170440673828125, -0.01652050018310547, -0.015996932983398438, -0.015473365783691406, -0.014949798583984375, -0.014426231384277344, -0.013902664184570312, -0.013379096984863281, -0.01285552978515625, -0.012331962585449219, -0.011808395385742188, -0.011284828186035156, -0.010761260986328125, -0.010237693786621094, -0.009714126586914062, -0.009190559387207031, -0.0086669921875, -0.008143424987792969, -0.0076198577880859375, -0.007096290588378906, -0.006572723388671875, -0.006049156188964844, -0.0055255889892578125, -0.005002021789550781, -0.00447845458984375, -0.003954887390136719, -0.0034313201904296875, -0.0029077529907226562, -0.002384185791015625, -0.0018606185913085938, -0.0013370513916015625, -0.0008134841918945312, -0.0002899169921875, 0.00023365020751953125, 0.0007572174072265625, 0.0012807846069335938, 0.001804351806640625, 0.0023279190063476562, 0.0028514862060546875, 0.0033750534057617188, 0.00389862060546875, 0.004422187805175781, 0.0049457550048828125, 0.005469322204589844, 0.005992889404296875, 0.006516456604003906, 0.0070400238037109375, 0.007563591003417969, 0.008087158203125, 0.008610725402832031, 0.009134292602539062, 0.009657859802246094, 0.010181427001953125, 0.010704994201660156, 0.011228561401367188, 0.011752128601074219, 0.01227569580078125, 0.012799263000488281, 0.013322830200195312, 0.013846397399902344, 0.014369964599609375, 0.014893531799316406, 0.015417098999023438, 0.01594066619873047, 0.0164642333984375]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 27.0, 108.0, 352.0, 328.0, 146.0, 38.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2014520168304443, -1.1774336099624634, -1.1534150838851929, -1.129396677017212, -1.1053781509399414, -1.0813597440719604, -1.0573413372039795, -1.033322811126709, -1.009304404258728, -0.9852859377861023, -0.9612674713134766, -0.9372490644454956, -0.9132305979728699, -0.8892121315002441, -0.8651936650276184, -0.8411751985549927, -0.8171567916870117, -0.793138325214386, -0.7691198587417603, -0.7451014518737793, -0.7210829854011536, -0.6970645189285278, -0.6730460524559021, -0.6490275859832764, -0.6250091195106506, -0.6009906530380249, -0.5769721865653992, -0.5529537796974182, -0.5289353132247925, -0.5049168467521667, -0.480898380279541, -0.45687994360923767, -0.4328615367412567, -0.408843070268631, -0.38482463359832764, -0.3608061671257019, -0.33678773045539856, -0.3127692639827728, -0.2887508273124695, -0.26473236083984375, -0.2407139092683792, -0.21669545769691467, -0.19267700612545013, -0.1686585545539856, -0.14464008808135986, -0.12062164396047592, -0.09660318493843079, -0.07258473336696625, -0.04856628179550171, -0.02454782836139202, -0.0005293749272823334, 0.023489080369472504, 0.04750753194093704, 0.07152598351240158, 0.09554444253444672, 0.11956289410591125, 0.1435813456773758, 0.16759979724884033, 0.19161824882030487, 0.2156367003917694, 0.23965516686439514, 0.2636736035346985, 0.2876920700073242, 0.31171053647994995, 0.3357289731502533]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 5.0, 6.0, 4.0, 5.0, 15.0, 9.0, 14.0, 18.0, 29.0, 22.0, 27.0, 22.0, 30.0, 30.0, 41.0, 53.0, 41.0, 49.0, 42.0, 49.0, 54.0, 48.0, 44.0, 44.0, 42.0, 37.0, 33.0, 24.0, 29.0, 32.0, 27.0, 18.0, 18.0, 10.0, 12.0, 8.0, 7.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.23862014710903168, -0.23129092156887054, -0.2239616960287094, -0.21663247048854828, -0.20930324494838715, -0.20197400450706482, -0.1946447789669037, -0.18731555342674255, -0.17998632788658142, -0.1726571023464203, -0.16532787680625916, -0.15799865126609802, -0.1506694257259369, -0.14334020018577576, -0.13601097464561462, -0.1286817342042923, -0.12135251611471176, -0.11402329057455063, -0.1066940650343895, -0.09936483204364777, -0.09203560650348663, -0.0847063809633255, -0.07737715542316437, -0.07004792988300323, -0.0627187043428421, -0.05538947880268097, -0.04806024953722954, -0.040731023997068405, -0.033401794731616974, -0.02607256919145584, -0.018743343651294708, -0.011414114385843277, -0.004084885120391846, 0.003244341816753149, 0.010573568753898144, 0.01790279522538185, 0.025232022628188133, 0.032561250030994415, 0.03989047557115555, 0.04721970483660698, 0.05454893037676811, 0.061878155916929245, 0.06920738518238068, 0.07653661072254181, 0.08386583626270294, 0.09119506180286407, 0.09852428734302521, 0.10585352033376694, 0.11318274587392807, 0.1205119714140892, 0.12784120440483093, 0.13517042994499207, 0.1424996554851532, 0.14982888102531433, 0.15715810656547546, 0.1644873321056366, 0.17181655764579773, 0.17914578318595886, 0.18647500872612, 0.19380423426628113, 0.20113345980644226, 0.2084626853466034, 0.21579191088676453, 0.22312115132808685, 0.23045037686824799]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 11.0, 9.0, 13.0, 15.0, 23.0, 31.0, 27.0, 60.0, 93.0, 129.0, 245.0, 458.0, 932.0, 2012.0, 4507.0, 12198.0, 54653.0, 1149307.0, 2792097.0, 146474.0, 19365.0, 6480.0, 2542.0, 1209.0, 558.0, 298.0, 167.0, 108.0, 63.0, 49.0, 34.0, 23.0, 19.0, 16.0, 10.0, 8.0, 9.0, 4.0, 4.0, 4.0, 6.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1455078125, -0.1406879425048828, -0.13586807250976562, -0.13104820251464844, -0.12622833251953125, -0.12140846252441406, -0.11658859252929688, -0.11176872253417969, -0.1069488525390625, -0.10212898254394531, -0.09730911254882812, -0.09248924255371094, -0.08766937255859375, -0.08284950256347656, -0.07802963256835938, -0.07320976257324219, -0.068389892578125, -0.06357002258300781, -0.058750152587890625, -0.05393028259277344, -0.04911041259765625, -0.04429054260253906, -0.039470672607421875, -0.03465080261230469, -0.0298309326171875, -0.025011062622070312, -0.020191192626953125, -0.015371322631835938, -0.01055145263671875, -0.0057315826416015625, -0.000911712646484375, 0.0039081573486328125, 0.00872802734375, 0.013547897338867188, 0.018367767333984375, 0.023187637329101562, 0.02800750732421875, 0.03282737731933594, 0.037647247314453125, 0.04246711730957031, 0.0472869873046875, 0.05210685729980469, 0.056926727294921875, 0.06174659729003906, 0.06656646728515625, 0.07138633728027344, 0.07620620727539062, 0.08102607727050781, 0.085845947265625, 0.09066581726074219, 0.09548568725585938, 0.10030555725097656, 0.10512542724609375, 0.10994529724121094, 0.11476516723632812, 0.11958503723144531, 0.1244049072265625, 0.1292247772216797, 0.13404464721679688, 0.13886451721191406, 0.14368438720703125, 0.14850425720214844, 0.15332412719726562, 0.1581439971923828, 0.1629638671875]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 3.0, 7.0, 6.0, 8.0, 8.0, 4.0, 6.0, 14.0, 18.0, 21.0, 22.0, 28.0, 24.0, 20.0, 42.0, 48.0, 36.0, 55.0, 46.0, 52.0, 55.0, 56.0, 44.0, 40.0, 43.0, 43.0, 37.0, 24.0, 30.0, 31.0, 20.0, 23.0, 19.0, 24.0, 13.0, 8.0, 7.0, 9.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06585693359375, -0.06384086608886719, -0.061824798583984375, -0.05980873107910156, -0.05779266357421875, -0.05577659606933594, -0.053760528564453125, -0.05174446105957031, -0.0497283935546875, -0.04771232604980469, -0.045696258544921875, -0.04368019104003906, -0.04166412353515625, -0.03964805603027344, -0.037631988525390625, -0.03561592102050781, -0.033599853515625, -0.03158378601074219, -0.029567718505859375, -0.027551651000976562, -0.02553558349609375, -0.023519515991210938, -0.021503448486328125, -0.019487380981445312, -0.0174713134765625, -0.015455245971679688, -0.013439178466796875, -0.011423110961914062, -0.00940704345703125, -0.0073909759521484375, -0.005374908447265625, -0.0033588409423828125, -0.0013427734375, 0.0006732940673828125, 0.002689361572265625, 0.0047054290771484375, 0.00672149658203125, 0.008737564086914062, 0.010753631591796875, 0.012769699096679688, 0.0147857666015625, 0.016801834106445312, 0.018817901611328125, 0.020833969116210938, 0.02285003662109375, 0.024866104125976562, 0.026882171630859375, 0.028898239135742188, 0.030914306640625, 0.03293037414550781, 0.034946441650390625, 0.03696250915527344, 0.03897857666015625, 0.04099464416503906, 0.043010711669921875, 0.04502677917480469, 0.0470428466796875, 0.04905891418457031, 0.051074981689453125, 0.05309104919433594, 0.05510711669921875, 0.05712318420410156, 0.059139251708984375, 0.06115531921386719, 0.06317138671875]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 8.0, 7.0, 14.0, 18.0, 24.0, 50.0, 59.0, 111.0, 209.0, 498.0, 1689.0, 8866.0, 110193.0, 3951781.0, 109228.0, 8790.0, 1731.0, 505.0, 206.0, 94.0, 65.0, 46.0, 25.0, 21.0, 9.0, 10.0, 4.0, 9.0, 0.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.295166015625, -0.2854881286621094, -0.27581024169921875, -0.2661323547363281, -0.2564544677734375, -0.24677658081054688, -0.23709869384765625, -0.22742080688476562, -0.217742919921875, -0.20806503295898438, -0.19838714599609375, -0.18870925903320312, -0.1790313720703125, -0.16935348510742188, -0.15967559814453125, -0.14999771118164062, -0.14031982421875, -0.13064193725585938, -0.12096405029296875, -0.11128616333007812, -0.1016082763671875, -0.09193038940429688, -0.08225250244140625, -0.07257461547851562, -0.062896728515625, -0.053218841552734375, -0.04354095458984375, -0.033863067626953125, -0.0241851806640625, -0.014507293701171875, -0.00482940673828125, 0.004848480224609375, 0.0145263671875, 0.024204254150390625, 0.03388214111328125, 0.043560028076171875, 0.0532379150390625, 0.06291580200195312, 0.07259368896484375, 0.08227157592773438, 0.091949462890625, 0.10162734985351562, 0.11130523681640625, 0.12098312377929688, 0.1306610107421875, 0.14033889770507812, 0.15001678466796875, 0.15969467163085938, 0.16937255859375, 0.17905044555664062, 0.18872833251953125, 0.19840621948242188, 0.2080841064453125, 0.21776199340820312, 0.22743988037109375, 0.23711776733398438, 0.246795654296875, 0.2564735412597656, 0.26615142822265625, 0.2758293151855469, 0.2855072021484375, 0.2951850891113281, 0.30486297607421875, 0.3145408630371094, 0.32421875]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 6.0, 6.0, 7.0, 8.0, 14.0, 23.0, 15.0, 34.0, 39.0, 48.0, 84.0, 120.0, 198.0, 348.0, 526.0, 732.0, 648.0, 422.0, 275.0, 158.0, 81.0, 77.0, 55.0, 40.0, 27.0, 18.0, 13.0, 13.0, 7.0, 11.0, 7.0, 8.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.052947998046875, -0.05154561996459961, -0.05014324188232422, -0.04874086380004883, -0.04733848571777344, -0.04593610763549805, -0.044533729553222656, -0.043131351470947266, -0.041728973388671875, -0.040326595306396484, -0.038924217224121094, -0.0375218391418457, -0.03611946105957031, -0.03471708297729492, -0.03331470489501953, -0.03191232681274414, -0.03050994873046875, -0.02910757064819336, -0.02770519256591797, -0.026302814483642578, -0.024900436401367188, -0.023498058319091797, -0.022095680236816406, -0.020693302154541016, -0.019290924072265625, -0.017888545989990234, -0.016486167907714844, -0.015083789825439453, -0.013681411743164062, -0.012279033660888672, -0.010876655578613281, -0.00947427749633789, -0.0080718994140625, -0.006669521331787109, -0.005267143249511719, -0.003864765167236328, -0.0024623870849609375, -0.0010600090026855469, 0.00034236907958984375, 0.0017447471618652344, 0.003147125244140625, 0.004549503326416016, 0.005951881408691406, 0.007354259490966797, 0.008756637573242188, 0.010159015655517578, 0.011561393737792969, 0.01296377182006836, 0.01436614990234375, 0.01576852798461914, 0.01717090606689453, 0.018573284149169922, 0.019975662231445312, 0.021378040313720703, 0.022780418395996094, 0.024182796478271484, 0.025585174560546875, 0.026987552642822266, 0.028389930725097656, 0.029792308807373047, 0.031194686889648438, 0.03259706497192383, 0.03399944305419922, 0.03540182113647461, 0.03680419921875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 4.0, 1.0, 5.0, 10.0, 7.0, 9.0, 7.0, 13.0, 15.0, 22.0, 26.0, 32.0, 34.0, 41.0, 50.0, 55.0, 48.0, 56.0, 64.0, 69.0, 51.0, 54.0, 54.0, 43.0, 36.0, 49.0, 27.0, 19.0, 20.0, 17.0, 8.0, 10.0, 8.0, 5.0, 11.0, 5.0, 2.0, 4.0, 2.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.1027679517865181, -0.09981711208820343, -0.09686627238988876, -0.0939154252409935, -0.09096458554267883, -0.08801374584436417, -0.0850629061460495, -0.08211205899715424, -0.07916121929883957, -0.0762103796005249, -0.07325953990221024, -0.07030869275331497, -0.0673578530550003, -0.06440701335668564, -0.06145617365837097, -0.058505330234766006, -0.05555449053645134, -0.05260365083813667, -0.04965280741453171, -0.04670196771621704, -0.043751124292612076, -0.04080028459429741, -0.037849441170692444, -0.03489860147237778, -0.03194776177406311, -0.028996920213103294, -0.02604607865214348, -0.02309523895382881, -0.020144395530223846, -0.01719355583190918, -0.014242714270949364, -0.011291872709989548, -0.008341029286384583, -0.0053901877254247665, -0.002439346630126238, 0.0005114944651722908, 0.0034623360261321068, 0.006413177587091923, 0.009364018216729164, 0.01231485977768898, 0.015265701338648796, 0.018216542899608612, 0.021167384460568428, 0.024118226021528244, 0.02706906571984291, 0.030019909143447876, 0.03297074884176254, 0.03592158854007721, 0.038872431963682175, 0.04182327166199684, 0.04477411508560181, 0.04772495478391647, 0.05067579820752144, 0.053626637905836105, 0.05657748132944107, 0.05952832102775574, 0.062479160726070404, 0.06543000042438507, 0.06838084012269974, 0.071331687271595, 0.07428252696990967, 0.07723336666822433, 0.080184206366539, 0.08313505351543427, 0.08608589321374893]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 4.0, 3.0, 14.0, 7.0, 12.0, 7.0, 17.0, 20.0, 11.0, 26.0, 31.0, 22.0, 26.0, 33.0, 33.0, 38.0, 44.0, 44.0, 54.0, 54.0, 41.0, 44.0, 40.0, 46.0, 46.0, 35.0, 42.0, 27.0, 34.0, 19.0, 20.0, 14.0, 11.0, 19.0, 20.0, 12.0, 10.0, 10.0, 5.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.085527203977108, -0.08281069993972778, -0.08009420335292816, -0.07737770676612854, -0.07466120272874832, -0.0719446986913681, -0.06922820210456848, -0.06651170551776886, -0.06379520148038864, -0.06107870116829872, -0.0583622008562088, -0.05564570054411888, -0.05292920023202896, -0.05021269991993904, -0.04749619960784912, -0.0447796992957592, -0.04206319898366928, -0.03934669867157936, -0.03663019835948944, -0.03391369804739952, -0.0311971977353096, -0.02848069742321968, -0.02576419711112976, -0.02304769679903984, -0.02033119648694992, -0.01761469617486, -0.01489819586277008, -0.01218169555068016, -0.00946519523859024, -0.0067486949265003204, -0.0040321946144104, -0.0013156943023204803, 0.0014008134603500366, 0.004117313772439957, 0.006833814084529877, 0.009550314396619797, 0.012266814708709717, 0.014983315020799637, 0.017699815332889557, 0.020416315644979477, 0.023132815957069397, 0.025849316269159317, 0.028565816581249237, 0.03128231689333916, 0.03399881720542908, 0.036715317517519, 0.03943181782960892, 0.04214831814169884, 0.04486481845378876, 0.04758131876587868, 0.0502978190779686, 0.05301431939005852, 0.05573081970214844, 0.05844732001423836, 0.06116382032632828, 0.0638803243637085, 0.06659682095050812, 0.06931331753730774, 0.07202982157468796, 0.07474632561206818, 0.0774628221988678, 0.08017931878566742, 0.08289582282304764, 0.08561232686042786, 0.08832882344722748]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 10.0, 15.0, 10.0, 23.0, 34.0, 35.0, 61.0, 107.0, 153.0, 246.0, 392.0, 724.0, 1259.0, 2242.0, 4099.0, 8658.0, 23162.0, 127062.0, 655597.0, 176433.0, 28087.0, 9813.0, 4582.0, 2463.0, 1313.0, 757.0, 436.0, 303.0, 173.0, 103.0, 78.0, 43.0, 23.0, 30.0, 10.0, 8.0, 8.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03851318359375, -0.037210941314697266, -0.03590869903564453, -0.0346064567565918, -0.03330421447753906, -0.03200197219848633, -0.030699729919433594, -0.02939748764038086, -0.028095245361328125, -0.02679300308227539, -0.025490760803222656, -0.024188518524169922, -0.022886276245117188, -0.021584033966064453, -0.02028179168701172, -0.018979549407958984, -0.01767730712890625, -0.016375064849853516, -0.015072822570800781, -0.013770580291748047, -0.012468338012695312, -0.011166095733642578, -0.009863853454589844, -0.00856161117553711, -0.007259368896484375, -0.005957126617431641, -0.004654884338378906, -0.003352642059326172, -0.0020503997802734375, -0.0007481575012207031, 0.0005540847778320312, 0.0018563270568847656, 0.0031585693359375, 0.004460811614990234, 0.005763053894042969, 0.007065296173095703, 0.008367538452148438, 0.009669780731201172, 0.010972023010253906, 0.01227426528930664, 0.013576507568359375, 0.01487874984741211, 0.016180992126464844, 0.017483234405517578, 0.018785476684570312, 0.020087718963623047, 0.02138996124267578, 0.022692203521728516, 0.02399444580078125, 0.025296688079833984, 0.02659893035888672, 0.027901172637939453, 0.029203414916992188, 0.030505657196044922, 0.031807899475097656, 0.03311014175415039, 0.034412384033203125, 0.03571462631225586, 0.037016868591308594, 0.03831911087036133, 0.03962135314941406, 0.0409235954284668, 0.04222583770751953, 0.043528079986572266, 0.044830322265625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 6.0, 3.0, 8.0, 2.0, 11.0, 9.0, 17.0, 14.0, 21.0, 29.0, 26.0, 29.0, 40.0, 33.0, 39.0, 54.0, 39.0, 45.0, 62.0, 52.0, 63.0, 45.0, 40.0, 49.0, 41.0, 39.0, 26.0, 23.0, 31.0, 26.0, 13.0, 15.0, 11.0, 16.0, 11.0, 9.0, 6.0, 6.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06646728515625, -0.0644845962524414, -0.06250190734863281, -0.06051921844482422, -0.058536529541015625, -0.05655384063720703, -0.05457115173339844, -0.052588462829589844, -0.05060577392578125, -0.048623085021972656, -0.04664039611816406, -0.04465770721435547, -0.042675018310546875, -0.04069232940673828, -0.03870964050292969, -0.036726951599121094, -0.0347442626953125, -0.032761573791503906, -0.030778884887695312, -0.02879619598388672, -0.026813507080078125, -0.02483081817626953, -0.022848129272460938, -0.020865440368652344, -0.01888275146484375, -0.016900062561035156, -0.014917373657226562, -0.012934684753417969, -0.010951995849609375, -0.008969306945800781, -0.0069866180419921875, -0.005003929138183594, -0.003021240234375, -0.0010385513305664062, 0.0009441375732421875, 0.0029268264770507812, 0.004909515380859375, 0.006892204284667969, 0.008874893188476562, 0.010857582092285156, 0.01284027099609375, 0.014822959899902344, 0.016805648803710938, 0.01878833770751953, 0.020771026611328125, 0.02275371551513672, 0.024736404418945312, 0.026719093322753906, 0.0287017822265625, 0.030684471130371094, 0.03266716003417969, 0.03464984893798828, 0.036632537841796875, 0.03861522674560547, 0.04059791564941406, 0.042580604553222656, 0.04456329345703125, 0.046545982360839844, 0.04852867126464844, 0.05051136016845703, 0.052494049072265625, 0.05447673797607422, 0.05645942687988281, 0.058442115783691406, 0.0604248046875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 4.0, 2.0, 7.0, 7.0, 10.0, 11.0, 14.0, 18.0, 28.0, 33.0, 56.0, 99.0, 198.0, 379.0, 821.0, 2308.0, 7341.0, 33551.0, 333778.0, 594582.0, 59167.0, 10872.0, 3152.0, 1111.0, 464.0, 228.0, 92.0, 74.0, 49.0, 26.0, 20.0, 16.0, 7.0, 7.0, 8.0, 5.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037200927734375, -0.035924434661865234, -0.03464794158935547, -0.0333714485168457, -0.03209495544433594, -0.030818462371826172, -0.029541969299316406, -0.02826547622680664, -0.026988983154296875, -0.02571249008178711, -0.024435997009277344, -0.023159503936767578, -0.021883010864257812, -0.020606517791748047, -0.01933002471923828, -0.018053531646728516, -0.01677703857421875, -0.015500545501708984, -0.014224052429199219, -0.012947559356689453, -0.011671066284179688, -0.010394573211669922, -0.009118080139160156, -0.00784158706665039, -0.006565093994140625, -0.005288600921630859, -0.004012107849121094, -0.002735614776611328, -0.0014591217041015625, -0.00018262863159179688, 0.0010938644409179688, 0.0023703575134277344, 0.0036468505859375, 0.004923343658447266, 0.006199836730957031, 0.007476329803466797, 0.008752822875976562, 0.010029315948486328, 0.011305809020996094, 0.01258230209350586, 0.013858795166015625, 0.01513528823852539, 0.016411781311035156, 0.017688274383544922, 0.018964767456054688, 0.020241260528564453, 0.02151775360107422, 0.022794246673583984, 0.02407073974609375, 0.025347232818603516, 0.02662372589111328, 0.027900218963623047, 0.029176712036132812, 0.030453205108642578, 0.031729698181152344, 0.03300619125366211, 0.034282684326171875, 0.03555917739868164, 0.036835670471191406, 0.03811216354370117, 0.03938865661621094, 0.0406651496887207, 0.04194164276123047, 0.043218135833740234, 0.04449462890625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 3.0, 5.0, 10.0, 7.0, 15.0, 23.0, 15.0, 21.0, 26.0, 26.0, 32.0, 31.0, 39.0, 34.0, 28.0, 47.0, 54.0, 37.0, 45.0, 52.0, 34.0, 50.0, 41.0, 62.0, 31.0, 26.0, 28.0, 28.0, 19.0, 14.0, 27.0, 21.0, 15.0, 9.0, 8.0, 8.0, 4.0, 5.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.137451171875, -0.13332176208496094, -0.12919235229492188, -0.1250629425048828, -0.12093353271484375, -0.11680412292480469, -0.11267471313476562, -0.10854530334472656, -0.1044158935546875, -0.10028648376464844, -0.09615707397460938, -0.09202766418457031, -0.08789825439453125, -0.08376884460449219, -0.07963943481445312, -0.07551002502441406, -0.071380615234375, -0.06725120544433594, -0.06312179565429688, -0.05899238586425781, -0.05486297607421875, -0.05073356628417969, -0.046604156494140625, -0.04247474670410156, -0.0383453369140625, -0.03421592712402344, -0.030086517333984375, -0.025957107543945312, -0.02182769775390625, -0.017698287963867188, -0.013568878173828125, -0.009439468383789062, -0.00531005859375, -0.0011806488037109375, 0.002948760986328125, 0.0070781707763671875, 0.01120758056640625, 0.015336990356445312, 0.019466400146484375, 0.023595809936523438, 0.0277252197265625, 0.03185462951660156, 0.035984039306640625, 0.04011344909667969, 0.04424285888671875, 0.04837226867675781, 0.052501678466796875, 0.05663108825683594, 0.060760498046875, 0.06488990783691406, 0.06901931762695312, 0.07314872741699219, 0.07727813720703125, 0.08140754699707031, 0.08553695678710938, 0.08966636657714844, 0.0937957763671875, 0.09792518615722656, 0.10205459594726562, 0.10618400573730469, 0.11031341552734375, 0.11444282531738281, 0.11857223510742188, 0.12270164489746094, 0.1268310546875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 7.0, 6.0, 7.0, 22.0, 40.0, 50.0, 85.0, 143.0, 368.0, 873.0, 2530.0, 11345.0, 136673.0, 811649.0, 73422.0, 8055.0, 1962.0, 688.0, 295.0, 149.0, 71.0, 45.0, 20.0, 16.0, 9.0, 7.0, 6.0, 2.0, 3.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0173187255859375, -0.01663684844970703, -0.015954971313476562, -0.015273094177246094, -0.014591217041015625, -0.013909339904785156, -0.013227462768554688, -0.012545585632324219, -0.01186370849609375, -0.011181831359863281, -0.010499954223632812, -0.009818077087402344, -0.009136199951171875, -0.008454322814941406, -0.0077724456787109375, -0.007090568542480469, -0.00640869140625, -0.005726814270019531, -0.0050449371337890625, -0.004363059997558594, -0.003681182861328125, -0.0029993057250976562, -0.0023174285888671875, -0.0016355514526367188, -0.00095367431640625, -0.00027179718017578125, 0.0004100799560546875, 0.0010919570922851562, 0.001773834228515625, 0.0024557113647460938, 0.0031375885009765625, 0.0038194656372070312, 0.0045013427734375, 0.005183219909667969, 0.0058650970458984375, 0.006546974182128906, 0.007228851318359375, 0.007910728454589844, 0.008592605590820312, 0.009274482727050781, 0.00995635986328125, 0.010638236999511719, 0.011320114135742188, 0.012001991271972656, 0.012683868408203125, 0.013365745544433594, 0.014047622680664062, 0.014729499816894531, 0.015411376953125, 0.01609325408935547, 0.016775131225585938, 0.017457008361816406, 0.018138885498046875, 0.018820762634277344, 0.019502639770507812, 0.02018451690673828, 0.02086639404296875, 0.02154827117919922, 0.022230148315429688, 0.022912025451660156, 0.023593902587890625, 0.024275779724121094, 0.024957656860351562, 0.02563953399658203, 0.0263214111328125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 6.0, 8.0, 18.0, 22.0, 37.0, 51.0, 71.0, 118.0, 135.0, 145.0, 110.0, 112.0, 67.0, 43.0, 18.0, 14.0, 11.0, 2.0, 5.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.59634780883789e-06, -9.299255907535553e-06, -9.002164006233215e-06, -8.705072104930878e-06, -8.40798020362854e-06, -8.110888302326202e-06, -7.813796401023865e-06, -7.516704499721527e-06, -7.2196125984191895e-06, -6.922520697116852e-06, -6.625428795814514e-06, -6.3283368945121765e-06, -6.031244993209839e-06, -5.734153091907501e-06, -5.4370611906051636e-06, -5.139969289302826e-06, -4.842877388000488e-06, -4.545785486698151e-06, -4.248693585395813e-06, -3.951601684093475e-06, -3.6545097827911377e-06, -3.3574178814888e-06, -3.0603259801864624e-06, -2.7632340788841248e-06, -2.466142177581787e-06, -2.1690502762794495e-06, -1.8719583749771118e-06, -1.5748664736747742e-06, -1.2777745723724365e-06, -9.806826710700989e-07, -6.835907697677612e-07, -3.864988684654236e-07, -8.940696716308594e-08, 2.076849341392517e-07, 5.047768354415894e-07, 8.01868736743927e-07, 1.0989606380462646e-06, 1.3960525393486023e-06, 1.69314444065094e-06, 1.9902363419532776e-06, 2.2873282432556152e-06, 2.584420144557953e-06, 2.8815120458602905e-06, 3.178603947162628e-06, 3.475695848464966e-06, 3.7727877497673035e-06, 4.069879651069641e-06, 4.366971552371979e-06, 4.664063453674316e-06, 4.961155354976654e-06, 5.258247256278992e-06, 5.555339157581329e-06, 5.852431058883667e-06, 6.149522960186005e-06, 6.446614861488342e-06, 6.74370676279068e-06, 7.040798664093018e-06, 7.337890565395355e-06, 7.634982466697693e-06, 7.93207436800003e-06, 8.229166269302368e-06, 8.526258170604706e-06, 8.823350071907043e-06, 9.120441973209381e-06, 9.417533874511719e-06]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 6.0, 3.0, 7.0, 5.0, 13.0, 7.0, 27.0, 26.0, 36.0, 49.0, 68.0, 95.0, 132.0, 197.0, 288.0, 444.0, 621.0, 1023.0, 1838.0, 3003.0, 5599.0, 11208.0, 23930.0, 55666.0, 134985.0, 275806.0, 281411.0, 141066.0, 59268.0, 25609.0, 11906.0, 5947.0, 3194.0, 1860.0, 1099.0, 667.0, 456.0, 296.0, 182.0, 137.0, 102.0, 73.0, 54.0, 40.0, 32.0, 17.0, 20.0, 17.0, 12.0, 6.0, 4.0, 2.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.00681304931640625, -0.0066002607345581055, -0.006387472152709961, -0.006174683570861816, -0.005961894989013672, -0.005749106407165527, -0.005536317825317383, -0.005323529243469238, -0.005110740661621094, -0.004897952079772949, -0.004685163497924805, -0.00447237491607666, -0.004259586334228516, -0.004046797752380371, -0.0038340091705322266, -0.003621220588684082, -0.0034084320068359375, -0.003195643424987793, -0.0029828548431396484, -0.002770066261291504, -0.0025572776794433594, -0.002344489097595215, -0.0021317005157470703, -0.0019189119338989258, -0.0017061233520507812, -0.0014933347702026367, -0.0012805461883544922, -0.0010677576065063477, -0.0008549690246582031, -0.0006421804428100586, -0.00042939186096191406, -0.00021660327911376953, -3.814697265625e-06, 0.00020897388458251953, 0.00042176246643066406, 0.0006345510482788086, 0.0008473396301269531, 0.0010601282119750977, 0.0012729167938232422, 0.0014857053756713867, 0.0016984939575195312, 0.0019112825393676758, 0.0021240711212158203, 0.002336859703063965, 0.0025496482849121094, 0.002762436866760254, 0.0029752254486083984, 0.003188014030456543, 0.0034008026123046875, 0.003613591194152832, 0.0038263797760009766, 0.004039168357849121, 0.004251956939697266, 0.00446474552154541, 0.004677534103393555, 0.004890322685241699, 0.005103111267089844, 0.005315899848937988, 0.005528688430786133, 0.005741477012634277, 0.005954265594482422, 0.006167054176330566, 0.006379842758178711, 0.0065926313400268555, 0.006805419921875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 1.0, 4.0, 1.0, 4.0, 2.0, 2.0, 3.0, 15.0, 6.0, 11.0, 13.0, 16.0, 23.0, 18.0, 27.0, 36.0, 51.0, 58.0, 57.0, 65.0, 50.0, 56.0, 57.0, 60.0, 61.0, 44.0, 43.0, 52.0, 30.0, 19.0, 24.0, 19.0, 16.0, 12.0, 6.0, 12.0, 6.0, 6.0, 8.0, 0.0, 4.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.002399444580078125, -0.002327144145965576, -0.0022548437118530273, -0.0021825432777404785, -0.0021102428436279297, -0.002037942409515381, -0.001965641975402832, -0.0018933415412902832, -0.0018210411071777344, -0.0017487406730651855, -0.0016764402389526367, -0.0016041398048400879, -0.001531839370727539, -0.0014595389366149902, -0.0013872385025024414, -0.0013149380683898926, -0.0012426376342773438, -0.001170337200164795, -0.001098036766052246, -0.0010257363319396973, -0.0009534358978271484, -0.0008811354637145996, -0.0008088350296020508, -0.000736534595489502, -0.0006642341613769531, -0.0005919337272644043, -0.0005196332931518555, -0.00044733285903930664, -0.0003750324249267578, -0.000302731990814209, -0.00023043155670166016, -0.00015813112258911133, -8.58306884765625e-05, -1.3530254364013672e-05, 5.8770179748535156e-05, 0.00013107061386108398, 0.0002033710479736328, 0.00027567148208618164, 0.00034797191619873047, 0.0004202723503112793, 0.0004925727844238281, 0.000564873218536377, 0.0006371736526489258, 0.0007094740867614746, 0.0007817745208740234, 0.0008540749549865723, 0.0009263753890991211, 0.00099867582321167, 0.0010709762573242188, 0.0011432766914367676, 0.0012155771255493164, 0.0012878775596618652, 0.001360177993774414, 0.0014324784278869629, 0.0015047788619995117, 0.0015770792961120605, 0.0016493797302246094, 0.0017216801643371582, 0.001793980598449707, 0.0018662810325622559, 0.0019385814666748047, 0.0020108819007873535, 0.0020831823348999023, 0.002155482769012451, 0.002227783203125]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 3.0, 1.0, 4.0, 5.0, 2.0, 2.0, 5.0, 6.0, 7.0, 5.0, 19.0, 18.0, 23.0, 22.0, 35.0, 29.0, 31.0, 43.0, 56.0, 50.0, 49.0, 63.0, 52.0, 59.0, 50.0, 41.0, 39.0, 46.0, 40.0, 30.0, 33.0, 17.0, 21.0, 13.0, 15.0, 7.0, 4.0, 13.0, 8.0, 8.0, 5.0, 7.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.05102512985467911, -0.04939844086766243, -0.04777175560593605, -0.04614506661891937, -0.044518377631902695, -0.042891692370176315, -0.04126500338315964, -0.03963831812143326, -0.03801162913441658, -0.0363849401473999, -0.03475825488567352, -0.033131565898656845, -0.03150487691164017, -0.029878191649913788, -0.02825150266289711, -0.02662481553852558, -0.024998126551508904, -0.023371439427137375, -0.021744750440120697, -0.02011806331574917, -0.01849137619137764, -0.016864687204360962, -0.015238000079989433, -0.013611312955617905, -0.011984624899923801, -0.010357936844229698, -0.00873124971985817, -0.007104561664164066, -0.00547787407413125, -0.0038511864840984344, -0.002224498428404331, -0.0005978113040328026, 0.0010288767516613007, 0.0026555643416941166, 0.0042822519317269325, 0.005908939987421036, 0.007535627577453852, 0.009162315167486668, 0.010789003223180771, 0.0124156903475523, 0.014042378403246403, 0.015669066458940506, 0.017295753583312035, 0.018922440707683563, 0.02054912969470024, 0.02217581681907177, 0.0238025039434433, 0.025429192930459976, 0.027055880054831505, 0.028682567179203033, 0.03030925616621971, 0.03193594515323639, 0.03356263041496277, 0.035189319401979446, 0.036816008388996124, 0.038442693650722504, 0.04006938263773918, 0.04169607162475586, 0.04332275688648224, 0.04494944587349892, 0.046576134860515594, 0.048202820122241974, 0.04982950910925865, 0.05145619809627533, 0.05308288335800171]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 8.0, 8.0, 6.0, 6.0, 18.0, 11.0, 19.0, 15.0, 30.0, 22.0, 22.0, 37.0, 29.0, 40.0, 45.0, 53.0, 41.0, 61.0, 52.0, 45.0, 42.0, 46.0, 46.0, 45.0, 34.0, 34.0, 36.0, 20.0, 15.0, 19.0, 23.0, 17.0, 13.0, 16.0, 12.0, 6.0, 7.0, 1.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05878680944442749, -0.0570182241499424, -0.055249642580747604, -0.05348105728626251, -0.05171247199177742, -0.04994388669729233, -0.048175305128097534, -0.04640671983361244, -0.04463813453912735, -0.04286954924464226, -0.041100967675447464, -0.03933238238096237, -0.03756379708647728, -0.03579521179199219, -0.034026630222797394, -0.0322580449283123, -0.030489463359117508, -0.028720879927277565, -0.026952294632792473, -0.02518371120095253, -0.023415125906467438, -0.021646542474627495, -0.019877959042787552, -0.01810937374830246, -0.016340790316462517, -0.0145722059533, -0.012803621590137482, -0.011035038158297539, -0.009266453795135021, -0.007497869431972504, -0.005729286000132561, -0.003960701636970043, -0.0021921172738075256, -0.00042353314347565174, 0.0013450509868562222, 0.0031136348843574524, 0.00488221924751997, 0.0066508036106824875, 0.00841938704252243, 0.010187971405684948, 0.011956555768847466, 0.013725140132009983, 0.0154937244951725, 0.017262307927012444, 0.019030891358852386, 0.02079947665333748, 0.02256806008517742, 0.024336643517017365, 0.026105228811502457, 0.0278738122433424, 0.029642397537827492, 0.031410980969667435, 0.03317956626415253, 0.03494814783334732, 0.03671673312783241, 0.038485318422317505, 0.0402538999915123, 0.04202248528599739, 0.043791066855192184, 0.04555965214967728, 0.04732823744416237, 0.04909682273864746, 0.050865404307842255, 0.05263398960232735, 0.05440257489681244]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 8.0, 6.0, 11.0, 12.0, 23.0, 35.0, 61.0, 78.0, 109.0, 227.0, 404.0, 620.0, 1148.0, 2323.0, 4282.0, 8485.0, 19840.0, 54875.0, 206434.0, 473940.0, 188463.0, 51387.0, 18733.0, 8186.0, 4183.0, 1999.0, 1127.0, 644.0, 369.0, 203.0, 126.0, 73.0, 48.0, 31.0, 19.0, 21.0, 12.0, 5.0, 6.0, 1.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09771728515625, -0.09451007843017578, -0.09130287170410156, -0.08809566497802734, -0.08488845825195312, -0.0816812515258789, -0.07847404479980469, -0.07526683807373047, -0.07205963134765625, -0.06885242462158203, -0.06564521789550781, -0.062438011169433594, -0.059230804443359375, -0.056023597717285156, -0.05281639099121094, -0.04960918426513672, -0.0464019775390625, -0.04319477081298828, -0.03998756408691406, -0.036780357360839844, -0.033573150634765625, -0.030365943908691406, -0.027158737182617188, -0.02395153045654297, -0.02074432373046875, -0.01753711700439453, -0.014329910278320312, -0.011122703552246094, -0.007915496826171875, -0.004708290100097656, -0.0015010833740234375, 0.0017061233520507812, 0.004913330078125, 0.008120536804199219, 0.011327743530273438, 0.014534950256347656, 0.017742156982421875, 0.020949363708496094, 0.024156570434570312, 0.02736377716064453, 0.03057098388671875, 0.03377819061279297, 0.03698539733886719, 0.040192604064941406, 0.043399810791015625, 0.046607017517089844, 0.04981422424316406, 0.05302143096923828, 0.0562286376953125, 0.05943584442138672, 0.06264305114746094, 0.06585025787353516, 0.06905746459960938, 0.0722646713256836, 0.07547187805175781, 0.07867908477783203, 0.08188629150390625, 0.08509349822998047, 0.08830070495605469, 0.0915079116821289, 0.09471511840820312, 0.09792232513427734, 0.10112953186035156, 0.10433673858642578, 0.1075439453125]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 5.0, 5.0, 4.0, 3.0, 9.0, 16.0, 14.0, 22.0, 18.0, 28.0, 20.0, 29.0, 33.0, 40.0, 49.0, 38.0, 58.0, 55.0, 63.0, 53.0, 55.0, 48.0, 39.0, 45.0, 34.0, 41.0, 31.0, 27.0, 27.0, 19.0, 11.0, 16.0, 14.0, 13.0, 6.0, 8.0, 5.0, 0.0, 4.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.117431640625, -0.11417102813720703, -0.11091041564941406, -0.1076498031616211, -0.10438919067382812, -0.10112857818603516, -0.09786796569824219, -0.09460735321044922, -0.09134674072265625, -0.08808612823486328, -0.08482551574707031, -0.08156490325927734, -0.07830429077148438, -0.0750436782836914, -0.07178306579589844, -0.06852245330810547, -0.0652618408203125, -0.06200122833251953, -0.05874061584472656, -0.055480003356933594, -0.052219390869140625, -0.048958778381347656, -0.04569816589355469, -0.04243755340576172, -0.03917694091796875, -0.03591632843017578, -0.03265571594238281, -0.029395103454589844, -0.026134490966796875, -0.022873878479003906, -0.019613265991210938, -0.01635265350341797, -0.013092041015625, -0.009831428527832031, -0.0065708160400390625, -0.0033102035522460938, -4.9591064453125e-05, 0.0032110214233398438, 0.0064716339111328125, 0.009732246398925781, 0.01299285888671875, 0.01625347137451172, 0.019514083862304688, 0.022774696350097656, 0.026035308837890625, 0.029295921325683594, 0.03255653381347656, 0.03581714630126953, 0.0390777587890625, 0.04233837127685547, 0.04559898376464844, 0.048859596252441406, 0.052120208740234375, 0.055380821228027344, 0.05864143371582031, 0.06190204620361328, 0.06516265869140625, 0.06842327117919922, 0.07168388366699219, 0.07494449615478516, 0.07820510864257812, 0.0814657211303711, 0.08472633361816406, 0.08798694610595703, 0.09124755859375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 2.0, 6.0, 4.0, 11.0, 15.0, 22.0, 25.0, 37.0, 57.0, 84.0, 120.0, 202.0, 318.0, 634.0, 1332.0, 3177.0, 8166.0, 24798.0, 94689.0, 428919.0, 371525.0, 79452.0, 21892.0, 7447.0, 2932.0, 1221.0, 598.0, 317.0, 186.0, 139.0, 82.0, 39.0, 28.0, 17.0, 21.0, 18.0, 8.0, 8.0, 3.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1328125, -0.12865447998046875, -0.1244964599609375, -0.12033843994140625, -0.116180419921875, -0.11202239990234375, -0.1078643798828125, -0.10370635986328125, -0.09954833984375, -0.09539031982421875, -0.0912322998046875, -0.08707427978515625, -0.082916259765625, -0.07875823974609375, -0.0746002197265625, -0.07044219970703125, -0.0662841796875, -0.06212615966796875, -0.0579681396484375, -0.05381011962890625, -0.049652099609375, -0.04549407958984375, -0.0413360595703125, -0.03717803955078125, -0.03302001953125, -0.02886199951171875, -0.0247039794921875, -0.02054595947265625, -0.016387939453125, -0.01222991943359375, -0.0080718994140625, -0.00391387939453125, 0.000244140625, 0.00440216064453125, 0.0085601806640625, 0.01271820068359375, 0.016876220703125, 0.02103424072265625, 0.0251922607421875, 0.02935028076171875, 0.03350830078125, 0.03766632080078125, 0.0418243408203125, 0.04598236083984375, 0.050140380859375, 0.05429840087890625, 0.0584564208984375, 0.06261444091796875, 0.0667724609375, 0.07093048095703125, 0.0750885009765625, 0.07924652099609375, 0.083404541015625, 0.08756256103515625, 0.0917205810546875, 0.09587860107421875, 0.10003662109375, 0.10419464111328125, 0.1083526611328125, 0.11251068115234375, 0.116668701171875, 0.12082672119140625, 0.1249847412109375, 0.12914276123046875, 0.13330078125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 3.0, 3.0, 5.0, 8.0, 10.0, 21.0, 27.0, 12.0, 16.0, 36.0, 30.0, 30.0, 58.0, 45.0, 49.0, 56.0, 54.0, 67.0, 48.0, 66.0, 58.0, 46.0, 42.0, 42.0, 32.0, 41.0, 21.0, 17.0, 14.0, 3.0, 7.0, 5.0, 9.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1131591796875, -0.10931205749511719, -0.10546493530273438, -0.10161781311035156, -0.09777069091796875, -0.09392356872558594, -0.09007644653320312, -0.08622932434082031, -0.0823822021484375, -0.07853507995605469, -0.07468795776367188, -0.07084083557128906, -0.06699371337890625, -0.06314659118652344, -0.059299468994140625, -0.05545234680175781, -0.051605224609375, -0.04775810241699219, -0.043910980224609375, -0.04006385803222656, -0.03621673583984375, -0.03236961364746094, -0.028522491455078125, -0.024675369262695312, -0.0208282470703125, -0.016981124877929688, -0.013134002685546875, -0.009286880493164062, -0.00543975830078125, -0.0015926361083984375, 0.002254486083984375, 0.0061016082763671875, 0.00994873046875, 0.013795852661132812, 0.017642974853515625, 0.021490097045898438, 0.02533721923828125, 0.029184341430664062, 0.033031463623046875, 0.03687858581542969, 0.0407257080078125, 0.04457283020019531, 0.048419952392578125, 0.05226707458496094, 0.05611419677734375, 0.05996131896972656, 0.06380844116210938, 0.06765556335449219, 0.071502685546875, 0.07534980773925781, 0.07919692993164062, 0.08304405212402344, 0.08689117431640625, 0.09073829650878906, 0.09458541870117188, 0.09843254089355469, 0.1022796630859375, 0.10612678527832031, 0.10997390747070312, 0.11382102966308594, 0.11766815185546875, 0.12151527404785156, 0.12536239624023438, 0.1292095184326172, 0.133056640625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 5.0, 5.0, 5.0, 2.0, 7.0, 7.0, 21.0, 26.0, 33.0, 60.0, 116.0, 165.0, 300.0, 528.0, 887.0, 1702.0, 3426.0, 7415.0, 18074.0, 53113.0, 177722.0, 450940.0, 225855.0, 68437.0, 22479.0, 8723.0, 4045.0, 1962.0, 1071.0, 569.0, 318.0, 201.0, 141.0, 67.0, 49.0, 25.0, 15.0, 15.0, 10.0, 5.0, 7.0, 5.0, 1.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.018463134765625, -0.01789689064025879, -0.017330646514892578, -0.016764402389526367, -0.016198158264160156, -0.015631914138793945, -0.015065670013427734, -0.014499425888061523, -0.013933181762695312, -0.013366937637329102, -0.01280069351196289, -0.01223444938659668, -0.011668205261230469, -0.011101961135864258, -0.010535717010498047, -0.009969472885131836, -0.009403228759765625, -0.008836984634399414, -0.008270740509033203, -0.007704496383666992, -0.007138252258300781, -0.00657200813293457, -0.006005764007568359, -0.0054395198822021484, -0.0048732757568359375, -0.0043070316314697266, -0.0037407875061035156, -0.0031745433807373047, -0.0026082992553710938, -0.002042055130004883, -0.0014758110046386719, -0.0009095668792724609, -0.00034332275390625, 0.00022292137145996094, 0.0007891654968261719, 0.0013554096221923828, 0.0019216537475585938, 0.0024878978729248047, 0.0030541419982910156, 0.0036203861236572266, 0.0041866302490234375, 0.0047528743743896484, 0.005319118499755859, 0.00588536262512207, 0.006451606750488281, 0.007017850875854492, 0.007584095001220703, 0.008150339126586914, 0.008716583251953125, 0.009282827377319336, 0.009849071502685547, 0.010415315628051758, 0.010981559753417969, 0.01154780387878418, 0.01211404800415039, 0.012680292129516602, 0.013246536254882812, 0.013812780380249023, 0.014379024505615234, 0.014945268630981445, 0.015511512756347656, 0.016077756881713867, 0.016644001007080078, 0.01721024513244629, 0.0177764892578125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 7.0, 5.0, 6.0, 9.0, 5.0, 18.0, 19.0, 19.0, 36.0, 46.0, 54.0, 66.0, 76.0, 78.0, 95.0, 100.0, 61.0, 50.0, 57.0, 34.0, 30.0, 29.0, 23.0, 18.0, 17.0, 6.0, 7.0, 10.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6954879760742188e-06, -3.579072654247284e-06, -3.462657332420349e-06, -3.3462420105934143e-06, -3.2298266887664795e-06, -3.1134113669395447e-06, -2.99699604511261e-06, -2.880580723285675e-06, -2.7641654014587402e-06, -2.6477500796318054e-06, -2.5313347578048706e-06, -2.414919435977936e-06, -2.298504114151001e-06, -2.182088792324066e-06, -2.0656734704971313e-06, -1.9492581486701965e-06, -1.8328428268432617e-06, -1.716427505016327e-06, -1.600012183189392e-06, -1.4835968613624573e-06, -1.3671815395355225e-06, -1.2507662177085876e-06, -1.1343508958816528e-06, -1.017935574054718e-06, -9.015202522277832e-07, -7.851049304008484e-07, -6.686896085739136e-07, -5.522742867469788e-07, -4.3585896492004395e-07, -3.1944364309310913e-07, -2.0302832126617432e-07, -8.66129994392395e-08, 2.9802322387695312e-08, 1.4621764421463013e-07, 2.6263296604156494e-07, 3.7904828786849976e-07, 4.954636096954346e-07, 6.118789315223694e-07, 7.282942533493042e-07, 8.44709575176239e-07, 9.611248970031738e-07, 1.0775402188301086e-06, 1.1939555406570435e-06, 1.3103708624839783e-06, 1.426786184310913e-06, 1.543201506137848e-06, 1.6596168279647827e-06, 1.7760321497917175e-06, 1.8924474716186523e-06, 2.008862793445587e-06, 2.125278115272522e-06, 2.2416934370994568e-06, 2.3581087589263916e-06, 2.4745240807533264e-06, 2.5909394025802612e-06, 2.707354724407196e-06, 2.823770046234131e-06, 2.9401853680610657e-06, 3.0566006898880005e-06, 3.1730160117149353e-06, 3.28943133354187e-06, 3.405846655368805e-06, 3.5222619771957397e-06, 3.6386772990226746e-06, 3.7550926208496094e-06]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 9.0, 6.0, 10.0, 16.0, 12.0, 30.0, 46.0, 55.0, 66.0, 113.0, 173.0, 245.0, 355.0, 583.0, 830.0, 1291.0, 2104.0, 3457.0, 5889.0, 10642.0, 21665.0, 48487.0, 127491.0, 373708.0, 267867.0, 102218.0, 40126.0, 18191.0, 9284.0, 5222.0, 2958.0, 1880.0, 1200.0, 807.0, 470.0, 313.0, 227.0, 144.0, 119.0, 61.0, 47.0, 37.0, 28.0, 18.0, 12.0, 6.0, 13.0, 6.0, 10.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.0181732177734375, -0.017603397369384766, -0.01703357696533203, -0.016463756561279297, -0.015893936157226562, -0.015324115753173828, -0.014754295349121094, -0.01418447494506836, -0.013614654541015625, -0.01304483413696289, -0.012475013732910156, -0.011905193328857422, -0.011335372924804688, -0.010765552520751953, -0.010195732116699219, -0.009625911712646484, -0.00905609130859375, -0.008486270904541016, -0.007916450500488281, -0.007346630096435547, -0.0067768096923828125, -0.006206989288330078, -0.005637168884277344, -0.005067348480224609, -0.004497528076171875, -0.003927707672119141, -0.0033578872680664062, -0.002788066864013672, -0.0022182464599609375, -0.0016484260559082031, -0.0010786056518554688, -0.0005087852478027344, 6.103515625e-05, 0.0006308555603027344, 0.0012006759643554688, 0.0017704963684082031, 0.0023403167724609375, 0.002910137176513672, 0.0034799575805664062, 0.004049777984619141, 0.004619598388671875, 0.005189418792724609, 0.005759239196777344, 0.006329059600830078, 0.0068988800048828125, 0.007468700408935547, 0.008038520812988281, 0.008608341217041016, 0.00917816162109375, 0.009747982025146484, 0.010317802429199219, 0.010887622833251953, 0.011457443237304688, 0.012027263641357422, 0.012597084045410156, 0.01316690444946289, 0.013736724853515625, 0.01430654525756836, 0.014876365661621094, 0.015446186065673828, 0.016016006469726562, 0.016585826873779297, 0.01715564727783203, 0.017725467681884766, 0.0182952880859375]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 9.0, 6.0, 11.0, 13.0, 12.0, 22.0, 29.0, 53.0, 56.0, 82.0, 101.0, 206.0, 102.0, 85.0, 64.0, 42.0, 37.0, 25.0, 11.0, 8.0, 6.0, 3.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014404296875, -0.013816356658935547, -0.013228416442871094, -0.01264047622680664, -0.012052536010742188, -0.011464595794677734, -0.010876655578613281, -0.010288715362548828, -0.009700775146484375, -0.009112834930419922, -0.008524894714355469, -0.007936954498291016, -0.0073490142822265625, -0.006761074066162109, -0.006173133850097656, -0.005585193634033203, -0.00499725341796875, -0.004409313201904297, -0.0038213729858398438, -0.0032334327697753906, -0.0026454925537109375, -0.0020575523376464844, -0.0014696121215820312, -0.0008816719055175781, -0.000293731689453125, 0.0002942085266113281, 0.0008821487426757812, 0.0014700889587402344, 0.0020580291748046875, 0.0026459693908691406, 0.0032339096069335938, 0.003821849822998047, 0.0044097900390625, 0.004997730255126953, 0.005585670471191406, 0.006173610687255859, 0.0067615509033203125, 0.007349491119384766, 0.007937431335449219, 0.008525371551513672, 0.009113311767578125, 0.009701251983642578, 0.010289192199707031, 0.010877132415771484, 0.011465072631835938, 0.01205301284790039, 0.012640953063964844, 0.013228893280029297, 0.01381683349609375, 0.014404773712158203, 0.014992713928222656, 0.01558065414428711, 0.016168594360351562, 0.016756534576416016, 0.01734447479248047, 0.017932415008544922, 0.018520355224609375, 0.019108295440673828, 0.01969623565673828, 0.020284175872802734, 0.020872116088867188, 0.02146005630493164, 0.022047996520996094, 0.022635936737060547, 0.023223876953125]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 3.0, 7.0, 9.0, 8.0, 24.0, 33.0, 50.0, 62.0, 119.0, 136.0, 141.0, 119.0, 104.0, 61.0, 53.0, 32.0, 16.0, 7.0, 13.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.36785775423049927, -0.359567791223526, -0.35127779841423035, -0.3429878354072571, -0.3346978425979614, -0.32640787959098816, -0.3181179165840149, -0.30982792377471924, -0.30153796076774597, -0.2932479977607727, -0.28495800495147705, -0.2766680419445038, -0.2683780789375305, -0.26008808612823486, -0.2517981231212616, -0.24350814521312714, -0.23521816730499268, -0.22692818939685822, -0.21863821148872375, -0.2103482484817505, -0.20205827057361603, -0.19376829266548157, -0.1854783296585083, -0.17718835175037384, -0.16889837384223938, -0.16060839593410492, -0.15231841802597046, -0.1440284550189972, -0.13573847711086273, -0.12744849920272827, -0.11915852874517441, -0.11086855828762054, -0.10257861018180847, -0.09428863227367401, -0.08599866181612015, -0.07770869135856628, -0.06941871345043182, -0.06112873926758766, -0.0528387650847435, -0.04454879090189934, -0.036258816719055176, -0.027968842536211014, -0.019678868353366852, -0.01138889417052269, -0.003098919987678528, 0.005191054195165634, 0.013481028378009796, 0.021771002560853958, 0.03006097674369812, 0.03835095092654228, 0.046640925109386444, 0.054930899292230606, 0.06322087347507477, 0.07151085138320923, 0.07980082184076309, 0.08809079229831696, 0.09638077020645142, 0.10467074811458588, 0.11296071857213974, 0.1212506890296936, 0.12954066693782806, 0.13783064484596252, 0.1461206078529358, 0.15441058576107025, 0.1627005636692047]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 5.0, 3.0, 5.0, 9.0, 9.0, 11.0, 15.0, 8.0, 20.0, 27.0, 13.0, 23.0, 37.0, 29.0, 40.0, 38.0, 33.0, 46.0, 47.0, 36.0, 49.0, 39.0, 43.0, 43.0, 64.0, 48.0, 24.0, 42.0, 22.0, 23.0, 28.0, 18.0, 17.0, 17.0, 11.0, 13.0, 14.0, 7.0, 6.0, 4.0, 4.0, 5.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17499539256095886, -0.16934356093406677, -0.16369174420833588, -0.1580399125814438, -0.1523880958557129, -0.1467362642288208, -0.1410844326019287, -0.13543261587619781, -0.12978079915046692, -0.12412897497415543, -0.11847715079784393, -0.11282531917095184, -0.10717350244522095, -0.10152167081832886, -0.09586984664201736, -0.09021802246570587, -0.08456619083881378, -0.07891436666250229, -0.0732625424861908, -0.0676107108592987, -0.06195889040827751, -0.05630706623196602, -0.05065523833036423, -0.045003414154052734, -0.03935158997774124, -0.03369976580142975, -0.028047939762473106, -0.022396113723516464, -0.01674428954720497, -0.011092465370893478, -0.005440637469291687, 0.0002111867070198059, 0.005863025784492493, 0.01151485089212656, 0.017166675999760628, 0.02281850203871727, 0.028470326215028763, 0.034122150391340256, 0.03977397829294205, 0.04542580246925354, 0.05107762664556503, 0.056729450821876526, 0.06238127499818802, 0.06803309917449951, 0.0736849308013916, 0.0793367475271225, 0.08498857915401459, 0.09064040333032608, 0.09629222750663757, 0.10194405168294907, 0.10759587585926056, 0.11324770748615265, 0.11889952421188354, 0.12455135583877563, 0.13020318746566772, 0.13585500419139862, 0.14150682091712952, 0.1471586525440216, 0.1528104692697525, 0.1584623008966446, 0.1641141176223755, 0.16976594924926758, 0.17541778087615967, 0.18106959760189056, 0.18672142922878265]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 2.0, 10.0, 3.0, 6.0, 16.0, 23.0, 23.0, 41.0, 46.0, 65.0, 74.0, 97.0, 135.0, 177.0, 219.0, 327.0, 366.0, 636.0, 946.0, 1544.0, 5191.0, 1035301.0, 1867.0, 960.0, 709.0, 434.0, 356.0, 252.0, 192.0, 160.0, 99.0, 86.0, 55.0, 52.0, 36.0, 22.0, 20.0, 10.0, 15.0, 8.0, 9.0, 2.0, 2.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.23735788464546204, -0.23019158840179443, -0.22302527725696564, -0.21585898101329803, -0.20869266986846924, -0.20152637362480164, -0.19436007738113403, -0.18719376623630524, -0.18002746999263763, -0.17286117374897003, -0.16569486260414124, -0.15852856636047363, -0.15136225521564484, -0.14419595897197723, -0.13702964782714844, -0.12986335158348083, -0.12269704788923264, -0.11553074419498444, -0.10836444050073624, -0.10119813680648804, -0.09403184056282043, -0.08686553686857224, -0.07969923317432404, -0.07253293693065643, -0.06536662578582764, -0.05820032209157944, -0.051034022122621536, -0.04386771842837334, -0.036701418459415436, -0.029535114765167236, -0.022368811070919037, -0.015202511101961136, -0.008036211133003235, -0.0008699088357388973, 0.00629639346152544, 0.013462696224451065, 0.020628998056054115, 0.027795299887657166, 0.034961603581905365, 0.042127903550863266, 0.049294207245111465, 0.056460510939359665, 0.06362681090831757, 0.07079311460256577, 0.07795941829681396, 0.08512571454048157, 0.09229202568531036, 0.09945832192897797, 0.10662462562322617, 0.11379092931747437, 0.12095723301172256, 0.12812353670597076, 0.13528983294963837, 0.14245614409446716, 0.14962244033813477, 0.15678873658180237, 0.16395504772663116, 0.17112134397029877, 0.17828765511512756, 0.18545395135879517, 0.19262026250362396, 0.19978655874729156, 0.20695286989212036, 0.21411916613578796, 0.22128546237945557]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 11.0, 35.0, 81.0, 164.0, 351.0, 715.0, 2182.0, 51463196.0, 2178.0, 719.0, 375.0, 181.0, 77.0, 36.0, 10.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.037178039550781, -14.60129451751709, -14.165410995483398, -13.729527473449707, -13.293643951416016, -12.857759475708008, -12.421875953674316, -11.985992431640625, -11.550108909606934, -11.114225387573242, -10.67834186553955, -10.24245834350586, -9.806573867797852, -9.370691299438477, -8.934806823730469, -8.498923301696777, -8.063039779663086, -7.6271562576293945, -7.191272735595703, -6.7553887367248535, -6.319505214691162, -5.883621692657471, -5.447737693786621, -5.01185417175293, -4.575970649719238, -4.140087127685547, -3.7042033672332764, -3.268319606781006, -2.8324360847473145, -2.396552562713623, -1.9606688022613525, -1.524785041809082, -1.0889015197753906, -0.6530178785324097, -0.2171342372894287, 0.21874940395355225, 0.6546330451965332, 1.0905165672302246, 1.5264003276824951, 1.9622840881347656, 2.398167610168457, 2.8340511322021484, 3.269934892654419, 3.7058186531066895, 4.141702175140381, 4.577585697174072, 5.013469696044922, 5.449353218078613, 5.885236740112305, 6.321120262145996, 6.7570037841796875, 7.192887783050537, 7.6287713050842285, 8.064655303955078, 8.50053882598877, 8.936422348022461, 9.372305870056152, 9.808189392089844, 10.244072914123535, 10.679956436157227, 11.115840911865234, 11.55172348022461, 11.987607955932617, 12.423491477966309, 12.859375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 6.0, 11.0, 17.0, 15.0, 28.0, 23.0, 67.0, 86.0, 124.0, 189.0, 339.0, 450.0, 812.0, 1119.0, 1941.0, 3300.0, 5780.0, 10671.0, 20078.0, 39358.0, 77760.0, 152343.0, 293168.0, 526494.0, 3530526.0, 820511.0, 382079.0, 205652.0, 105403.0, 53032.0, 27279.0, 14125.0, 7610.0, 4362.0, 2522.0, 1457.0, 967.0, 629.0, 357.0, 273.0, 166.0, 95.0, 63.0, 48.0, 29.0, 26.0, 20.0, 11.0, 4.0, 3.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3759765625, -0.3644866943359375, -0.352996826171875, -0.3415069580078125, -0.33001708984375, -0.3185272216796875, -0.307037353515625, -0.2955474853515625, -0.2840576171875, -0.2725677490234375, -0.261077880859375, -0.2495880126953125, -0.23809814453125, -0.2266082763671875, -0.215118408203125, -0.2036285400390625, -0.192138671875, -0.1806488037109375, -0.169158935546875, -0.1576690673828125, -0.14617919921875, -0.1346893310546875, -0.123199462890625, -0.1117095947265625, -0.1002197265625, -0.0887298583984375, -0.077239990234375, -0.0657501220703125, -0.05426025390625, -0.0427703857421875, -0.031280517578125, -0.0197906494140625, -0.00830078125, 0.0031890869140625, 0.014678955078125, 0.0261688232421875, 0.03765869140625, 0.0491485595703125, 0.060638427734375, 0.0721282958984375, 0.0836181640625, 0.0951080322265625, 0.106597900390625, 0.1180877685546875, 0.12957763671875, 0.1410675048828125, 0.152557373046875, 0.1640472412109375, 0.175537109375, 0.1870269775390625, 0.198516845703125, 0.2100067138671875, 0.22149658203125, 0.2329864501953125, 0.244476318359375, 0.2559661865234375, 0.2674560546875, 0.2789459228515625, 0.290435791015625, 0.3019256591796875, 0.31341552734375, 0.3249053955078125, 0.336395263671875, 0.3478851318359375, 0.359375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 4.0, 7.0, 5.0, 12.0, 15.0, 19.0, 17.0, 15.0, 23.0, 22.0, 26.0, 35.0, 33.0, 29.0, 33.0, 33.0, 45.0, 55.0, 142.0, 681.0, 298.0, 55.0, 64.0, 39.0, 46.0, 38.0, 50.0, 23.0, 30.0, 30.0, 11.0, 20.0, 19.0, 7.0, 14.0, 6.0, 7.0, 3.0, 2.0, 5.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.091796875, -2.0279693603515625, -1.964141845703125, -1.9003143310546875, -1.83648681640625, -1.7726593017578125, -1.708831787109375, -1.6450042724609375, -1.5811767578125, -1.5173492431640625, -1.453521728515625, -1.3896942138671875, -1.32586669921875, -1.2620391845703125, -1.198211669921875, -1.1343841552734375, -1.070556640625, -1.0067291259765625, -0.942901611328125, -0.8790740966796875, -0.81524658203125, -0.7514190673828125, -0.687591552734375, -0.6237640380859375, -0.5599365234375, -0.4961090087890625, -0.432281494140625, -0.3684539794921875, -0.30462646484375, -0.2407989501953125, -0.176971435546875, -0.1131439208984375, -0.04931640625, 0.0145111083984375, 0.078338623046875, 0.1421661376953125, 0.20599365234375, 0.2698211669921875, 0.333648681640625, 0.3974761962890625, 0.4613037109375, 0.5251312255859375, 0.588958740234375, 0.6527862548828125, 0.71661376953125, 0.7804412841796875, 0.844268798828125, 0.9080963134765625, 0.971923828125, 1.0357513427734375, 1.099578857421875, 1.1634063720703125, 1.22723388671875, 1.2910614013671875, 1.354888916015625, 1.4187164306640625, 1.4825439453125, 1.5463714599609375, 1.610198974609375, 1.6740264892578125, 1.73785400390625, 1.8016815185546875, 1.865509033203125, 1.9293365478515625, 1.9931640625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 8.0, 5.0, 8.0, 9.0, 24.0, 33.0, 62.0, 94.0, 152.0, 220.0, 407.0, 553.0, 937.0, 1504.0, 2424.0, 3930.0, 6448.0, 10332.0, 17564.0, 29004.0, 48549.0, 78882.0, 125231.0, 195277.0, 285537.0, 386234.0, 2747942.0, 1255965.0, 361722.0, 264218.0, 177348.0, 113117.0, 69998.0, 42484.0, 26041.0, 15348.0, 9438.0, 5562.0, 3427.0, 2020.0, 1271.0, 780.0, 486.0, 310.0, 201.0, 118.0, 92.0, 52.0, 30.0, 15.0, 11.0, 13.0, 6.0, 4.0], "bins": [-0.230224609375, -0.2239837646484375, -0.217742919921875, -0.2115020751953125, -0.20526123046875, -0.1990203857421875, -0.192779541015625, -0.1865386962890625, -0.1802978515625, -0.1740570068359375, -0.167816162109375, -0.1615753173828125, -0.15533447265625, -0.1490936279296875, -0.142852783203125, -0.1366119384765625, -0.13037109375, -0.1241302490234375, -0.117889404296875, -0.1116485595703125, -0.10540771484375, -0.0991668701171875, -0.092926025390625, -0.0866851806640625, -0.0804443359375, -0.0742034912109375, -0.067962646484375, -0.0617218017578125, -0.05548095703125, -0.0492401123046875, -0.042999267578125, -0.0367584228515625, -0.030517578125, -0.0242767333984375, -0.018035888671875, -0.0117950439453125, -0.00555419921875, 0.0006866455078125, 0.006927490234375, 0.0131683349609375, 0.0194091796875, 0.0256500244140625, 0.031890869140625, 0.0381317138671875, 0.04437255859375, 0.0506134033203125, 0.056854248046875, 0.0630950927734375, 0.0693359375, 0.0755767822265625, 0.081817626953125, 0.0880584716796875, 0.09429931640625, 0.1005401611328125, 0.106781005859375, 0.1130218505859375, 0.1192626953125, 0.1255035400390625, 0.131744384765625, 0.1379852294921875, 0.14422607421875, 0.1504669189453125, 0.156707763671875, 0.1629486083984375, 0.169189453125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 6.0, 3.0, 1.0, 1.0, 5.0, 7.0, 10.0, 8.0, 10.0, 11.0, 11.0, 16.0, 13.0, 14.0, 18.0, 16.0, 22.0, 21.0, 20.0, 28.0, 18.0, 31.0, 30.0, 45.0, 33.0, 40.0, 386.0, 635.0, 113.0, 30.0, 42.0, 30.0, 34.0, 33.0, 30.0, 39.0, 24.0, 20.0, 22.0, 22.0, 21.0, 19.0, 15.0, 11.0, 14.0, 10.0, 5.0, 9.0, 10.0, 3.0, 4.0, 5.0, 5.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0], "bins": [-1.5595703125, -1.511199951171875, -1.46282958984375, -1.414459228515625, -1.3660888671875, -1.317718505859375, -1.26934814453125, -1.220977783203125, -1.172607421875, -1.124237060546875, -1.07586669921875, -1.027496337890625, -0.9791259765625, -0.930755615234375, -0.88238525390625, -0.834014892578125, -0.78564453125, -0.737274169921875, -0.68890380859375, -0.640533447265625, -0.5921630859375, -0.543792724609375, -0.49542236328125, -0.447052001953125, -0.398681640625, -0.350311279296875, -0.30194091796875, -0.253570556640625, -0.2052001953125, -0.156829833984375, -0.10845947265625, -0.060089111328125, -0.01171875, 0.036651611328125, 0.08502197265625, 0.133392333984375, 0.1817626953125, 0.230133056640625, 0.27850341796875, 0.326873779296875, 0.375244140625, 0.423614501953125, 0.47198486328125, 0.520355224609375, 0.5687255859375, 0.617095947265625, 0.66546630859375, 0.713836669921875, 0.76220703125, 0.810577392578125, 0.85894775390625, 0.907318115234375, 0.9556884765625, 1.004058837890625, 1.05242919921875, 1.100799560546875, 1.149169921875, 1.197540283203125, 1.24591064453125, 1.294281005859375, 1.3426513671875, 1.391021728515625, 1.43939208984375, 1.487762451171875, 1.5361328125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 4.0, 6.0, 2.0, 4.0, 9.0, 14.0, 14.0, 15.0, 18.0, 29.0, 30.0, 38.0, 45.0, 77.0, 72.0, 115.0, 163.0, 183.0, 263.0, 338.0, 514.0, 726.0, 992.0, 1683.0, 3165.0, 6413.0, 15056.0, 37747.0, 100554.0, 5125828.0, 840043.0, 94186.0, 34932.0, 13846.0, 6075.0, 3041.0, 1633.0, 1030.0, 688.0, 500.0, 361.0, 257.0, 183.0, 118.0, 126.0, 64.0, 48.0, 43.0, 31.0, 27.0, 17.0, 15.0, 25.0, 13.0, 10.0, 8.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0], "bins": [-0.7294921875, -0.7059326171875, -0.682373046875, -0.6588134765625, -0.63525390625, -0.6116943359375, -0.588134765625, -0.5645751953125, -0.541015625, -0.5174560546875, -0.493896484375, -0.4703369140625, -0.44677734375, -0.4232177734375, -0.399658203125, -0.3760986328125, -0.3525390625, -0.3289794921875, -0.305419921875, -0.2818603515625, -0.25830078125, -0.2347412109375, -0.211181640625, -0.1876220703125, -0.1640625, -0.1405029296875, -0.116943359375, -0.0933837890625, -0.06982421875, -0.0462646484375, -0.022705078125, 0.0008544921875, 0.0244140625, 0.0479736328125, 0.071533203125, 0.0950927734375, 0.11865234375, 0.1422119140625, 0.165771484375, 0.1893310546875, 0.212890625, 0.2364501953125, 0.260009765625, 0.2835693359375, 0.30712890625, 0.3306884765625, 0.354248046875, 0.3778076171875, 0.4013671875, 0.4249267578125, 0.448486328125, 0.4720458984375, 0.49560546875, 0.5191650390625, 0.542724609375, 0.5662841796875, 0.58984375, 0.6134033203125, 0.636962890625, 0.6605224609375, 0.68408203125, 0.7076416015625, 0.731201171875, 0.7547607421875, 0.7783203125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 8.0, 5.0, 7.0, 11.0, 11.0, 11.0, 16.0, 23.0, 23.0, 22.0, 27.0, 45.0, 29.0, 38.0, 50.0, 29.0, 47.0, 51.0, 349.0, 737.0, 80.0, 41.0, 34.0, 36.0, 43.0, 32.0, 30.0, 36.0, 34.0, 17.0, 20.0, 17.0, 15.0, 13.0, 4.0, 7.0, 6.0, 10.0, 2.0, 2.0, 6.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.126953125, -2.0609130859375, -1.994873046875, -1.9288330078125, -1.86279296875, -1.7967529296875, -1.730712890625, -1.6646728515625, -1.5986328125, -1.5325927734375, -1.466552734375, -1.4005126953125, -1.33447265625, -1.2684326171875, -1.202392578125, -1.1363525390625, -1.0703125, -1.0042724609375, -0.938232421875, -0.8721923828125, -0.80615234375, -0.7401123046875, -0.674072265625, -0.6080322265625, -0.5419921875, -0.4759521484375, -0.409912109375, -0.3438720703125, -0.27783203125, -0.2117919921875, -0.145751953125, -0.0797119140625, -0.013671875, 0.0523681640625, 0.118408203125, 0.1844482421875, 0.25048828125, 0.3165283203125, 0.382568359375, 0.4486083984375, 0.5146484375, 0.5806884765625, 0.646728515625, 0.7127685546875, 0.77880859375, 0.8448486328125, 0.910888671875, 0.9769287109375, 1.04296875, 1.1090087890625, 1.175048828125, 1.2410888671875, 1.30712890625, 1.3731689453125, 1.439208984375, 1.5052490234375, 1.5712890625, 1.6373291015625, 1.703369140625, 1.7694091796875, 1.83544921875, 1.9014892578125, 1.967529296875, 2.0335693359375, 2.099609375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 1.0, 4.0, 3.0, 5.0, 9.0, 13.0, 14.0, 29.0, 33.0, 38.0, 54.0, 79.0, 158.0, 243.0, 92.0, 69.0, 34.0, 29.0, 27.0, 17.0, 18.0, 10.0, 7.0, 4.0, 1.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.225685119628906, -18.520082473754883, -17.814477920532227, -17.108875274658203, -16.403270721435547, -15.697668075561523, -14.9920654296875, -14.28646183013916, -13.58085823059082, -12.87525463104248, -12.16965103149414, -11.464048385620117, -10.758444786071777, -10.052841186523438, -9.347238540649414, -8.641634941101074, -7.936031341552734, -7.2304277420043945, -6.524824619293213, -5.819221496582031, -5.113617897033691, -4.408014297485352, -3.70241117477417, -2.9968080520629883, -2.2912044525146484, -1.5856010913848877, -0.879997730255127, -0.1743943691253662, 0.5312089920043945, 1.2368123531341553, 1.942415714263916, 2.6480188369750977, 3.3536205291748047, 4.0592241287231445, 4.764827251434326, 5.470430374145508, 6.176033973693848, 6.8816375732421875, 7.587240695953369, 8.29284381866455, 8.99844741821289, 9.70405101776123, 10.40965461730957, 11.115257263183594, 11.820860862731934, 12.526464462280273, 13.232067108154297, 13.937670707702637, 14.643274307250977, 15.348877906799316, 16.054481506347656, 16.76008415222168, 17.465686798095703, 18.17129135131836, 18.876893997192383, 19.582496643066406, 20.288101196289062, 20.993703842163086, 21.699308395385742, 22.404911041259766, 23.110515594482422, 23.816118240356445, 24.52172088623047, 25.227325439453125, 25.93292808532715]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 2.0, 5.0, 6.0, 6.0, 11.0, 8.0, 11.0, 10.0, 22.0, 15.0, 20.0, 22.0, 31.0, 34.0, 42.0, 74.0, 123.0, 155.0, 87.0, 54.0, 37.0, 31.0, 34.0, 28.0, 15.0, 24.0, 15.0, 12.0, 8.0, 13.0, 5.0, 7.0, 5.0, 8.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-44.22477722167969, -42.76165008544922, -41.29852294921875, -39.83539581298828, -38.37226867675781, -36.909141540527344, -35.446014404296875, -33.982887268066406, -32.51976013183594, -31.05663299560547, -29.593505859375, -28.13037872314453, -26.667251586914062, -25.204124450683594, -23.740997314453125, -22.277870178222656, -20.814741134643555, -19.351613998413086, -17.888486862182617, -16.42535972595215, -14.96223258972168, -13.499105453491211, -12.035977363586426, -10.572850227355957, -9.109723091125488, -7.6465959548950195, -6.183468818664551, -4.720341205596924, -3.257214069366455, -1.7940869331359863, -0.3309593200683594, 1.1321678161621094, 2.595294952392578, 4.058422088623047, 5.521549224853516, 6.984676837921143, 8.447803497314453, 9.910930633544922, 11.374058723449707, 12.837185859680176, 14.300312995910645, 15.763440132141113, 17.2265682220459, 18.689695358276367, 20.152822494506836, 21.615949630737305, 23.079076766967773, 24.542203903198242, 26.00533103942871, 27.46845817565918, 28.93158531188965, 30.394712448120117, 31.857839584350586, 33.32096862792969, 34.784095764160156, 36.247222900390625, 37.710350036621094, 39.17347717285156, 40.63660430908203, 42.0997314453125, 43.56285858154297, 45.02598571777344, 46.489112854003906, 47.952239990234375, 49.415367126464844]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 9.0, 8.0, 16.0, 15.0, 18.0, 34.0, 50.0, 61.0, 110.0, 163.0, 269.0, 366.0, 661.0, 1119.0, 2171.0, 4570.0, 11810.0, 46200.0, 3299952.0, 769936.0, 36147.0, 10864.0, 4482.0, 2202.0, 1171.0, 651.0, 425.0, 262.0, 165.0, 111.0, 79.0, 55.0, 42.0, 30.0, 13.0, 20.0, 11.0, 7.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038787841796875, -0.03749227523803711, -0.03619670867919922, -0.03490114212036133, -0.03360557556152344, -0.03231000900268555, -0.031014442443847656, -0.029718875885009766, -0.028423309326171875, -0.027127742767333984, -0.025832176208496094, -0.024536609649658203, -0.023241043090820312, -0.021945476531982422, -0.02064990997314453, -0.01935434341430664, -0.01805877685546875, -0.01676321029663086, -0.015467643737792969, -0.014172077178955078, -0.012876510620117188, -0.011580944061279297, -0.010285377502441406, -0.008989810943603516, -0.007694244384765625, -0.006398677825927734, -0.005103111267089844, -0.003807544708251953, -0.0025119781494140625, -0.0012164115905761719, 7.915496826171875e-05, 0.0013747215270996094, 0.0026702880859375, 0.003965854644775391, 0.005261421203613281, 0.006556987762451172, 0.007852554321289062, 0.009148120880126953, 0.010443687438964844, 0.011739253997802734, 0.013034820556640625, 0.014330387115478516, 0.015625953674316406, 0.016921520233154297, 0.018217086791992188, 0.019512653350830078, 0.02080821990966797, 0.02210378646850586, 0.02339935302734375, 0.02469491958618164, 0.02599048614501953, 0.027286052703857422, 0.028581619262695312, 0.029877185821533203, 0.031172752380371094, 0.032468318939208984, 0.033763885498046875, 0.035059452056884766, 0.036355018615722656, 0.03765058517456055, 0.03894615173339844, 0.04024171829223633, 0.04153728485107422, 0.04283285140991211, 0.04412841796875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 1.0, 4.0, 4.0, 5.0, 6.0, 10.0, 11.0, 15.0, 19.0, 27.0, 32.0, 29.0, 40.0, 57.0, 394.0, 87.0, 55.0, 45.0, 27.0, 19.0, 22.0, 15.0, 15.0, 15.0, 6.0, 8.0, 7.0, 6.0, 2.0, 2.0, 5.0, 3.0, 5.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0204620361328125, -0.019802093505859375, -0.01914215087890625, -0.018482208251953125, -0.017822265625, -0.017162322998046875, -0.01650238037109375, -0.015842437744140625, -0.0151824951171875, -0.014522552490234375, -0.01386260986328125, -0.013202667236328125, -0.012542724609375, -0.011882781982421875, -0.01122283935546875, -0.010562896728515625, -0.0099029541015625, -0.009243011474609375, -0.00858306884765625, -0.007923126220703125, -0.00726318359375, -0.006603240966796875, -0.00594329833984375, -0.005283355712890625, -0.0046234130859375, -0.003963470458984375, -0.00330352783203125, -0.002643585205078125, -0.001983642578125, -0.001323699951171875, -0.00066375732421875, -3.814697265625e-06, 0.0006561279296875, 0.001316070556640625, 0.00197601318359375, 0.002635955810546875, 0.0032958984375, 0.003955841064453125, 0.00461578369140625, 0.005275726318359375, 0.0059356689453125, 0.006595611572265625, 0.00725555419921875, 0.007915496826171875, 0.008575439453125, 0.009235382080078125, 0.00989532470703125, 0.010555267333984375, 0.0112152099609375, 0.011875152587890625, 0.01253509521484375, 0.013195037841796875, 0.01385498046875, 0.014514923095703125, 0.01517486572265625, 0.015834808349609375, 0.0164947509765625, 0.017154693603515625, 0.01781463623046875, 0.018474578857421875, 0.019134521484375, 0.019794464111328125, 0.02045440673828125, 0.021114349365234375, 0.0217742919921875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 7.0, 5.0, 5.0, 10.0, 19.0, 31.0, 48.0, 80.0, 120.0, 214.0, 571.0, 1459.0, 4465.0, 18442.0, 125084.0, 3660554.0, 334354.0, 36554.0, 8262.0, 2415.0, 832.0, 314.0, 174.0, 72.0, 60.0, 36.0, 32.0, 29.0, 12.0, 11.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0594482421875, -0.05773353576660156, -0.056018829345703125, -0.05430412292480469, -0.05258941650390625, -0.05087471008300781, -0.049160003662109375, -0.04744529724121094, -0.0457305908203125, -0.04401588439941406, -0.042301177978515625, -0.04058647155761719, -0.03887176513671875, -0.03715705871582031, -0.035442352294921875, -0.03372764587402344, -0.032012939453125, -0.030298233032226562, -0.028583526611328125, -0.026868820190429688, -0.02515411376953125, -0.023439407348632812, -0.021724700927734375, -0.020009994506835938, -0.0182952880859375, -0.016580581665039062, -0.014865875244140625, -0.013151168823242188, -0.01143646240234375, -0.009721755981445312, -0.008007049560546875, -0.0062923431396484375, -0.00457763671875, -0.0028629302978515625, -0.001148223876953125, 0.0005664825439453125, 0.00228118896484375, 0.0039958953857421875, 0.005710601806640625, 0.0074253082275390625, 0.0091400146484375, 0.010854721069335938, 0.012569427490234375, 0.014284133911132812, 0.01599884033203125, 0.017713546752929688, 0.019428253173828125, 0.021142959594726562, 0.022857666015625, 0.024572372436523438, 0.026287078857421875, 0.028001785278320312, 0.02971649169921875, 0.03143119812011719, 0.033145904541015625, 0.03486061096191406, 0.0365753173828125, 0.03829002380371094, 0.040004730224609375, 0.04171943664550781, 0.04343414306640625, 0.04514884948730469, 0.046863555908203125, 0.04857826232910156, 0.05029296875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 4.0, 3.0, 7.0, 9.0, 7.0, 10.0, 17.0, 25.0, 27.0, 39.0, 68.0, 61.0, 119.0, 216.0, 537.0, 1313.0, 746.0, 312.0, 149.0, 108.0, 61.0, 49.0, 35.0, 20.0, 24.0, 27.0, 13.0, 14.0, 9.0, 15.0, 8.0, 5.0, 4.0, 10.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0191802978515625, -0.018611431121826172, -0.018042564392089844, -0.017473697662353516, -0.016904830932617188, -0.01633596420288086, -0.01576709747314453, -0.015198230743408203, -0.014629364013671875, -0.014060497283935547, -0.013491630554199219, -0.01292276382446289, -0.012353897094726562, -0.011785030364990234, -0.011216163635253906, -0.010647296905517578, -0.01007843017578125, -0.009509563446044922, -0.008940696716308594, -0.008371829986572266, -0.0078029632568359375, -0.007234096527099609, -0.006665229797363281, -0.006096363067626953, -0.005527496337890625, -0.004958629608154297, -0.004389762878417969, -0.0038208961486816406, -0.0032520294189453125, -0.0026831626892089844, -0.0021142959594726562, -0.0015454292297363281, -0.0009765625, -0.0004076957702636719, 0.00016117095947265625, 0.0007300376892089844, 0.0012989044189453125, 0.0018677711486816406, 0.0024366378784179688, 0.003005504608154297, 0.003574371337890625, 0.004143238067626953, 0.004712104797363281, 0.005280971527099609, 0.0058498382568359375, 0.006418704986572266, 0.006987571716308594, 0.007556438446044922, 0.00812530517578125, 0.008694171905517578, 0.009263038635253906, 0.009831905364990234, 0.010400772094726562, 0.01096963882446289, 0.011538505554199219, 0.012107372283935547, 0.012676239013671875, 0.013245105743408203, 0.013813972473144531, 0.01438283920288086, 0.014951705932617188, 0.015520572662353516, 0.016089439392089844, 0.016658306121826172, 0.0172271728515625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 5.0, 40.0, 402.0, 481.0, 61.0, 10.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06465546041727066, -0.05390220135450363, -0.0431489422917366, -0.032395679503679276, -0.021642420440912247, -0.010889161378145218, -0.00013589859008789062, 0.010617360472679138, 0.021370619535446167, 0.032123878598213196, 0.042877137660980225, 0.05363040044903755, 0.06438365578651428, 0.07513691484928131, 0.08589018136262894, 0.09664344042539597, 0.107396699488163, 0.11814995855093002, 0.12890322506427765, 0.13965648412704468, 0.1504097431898117, 0.16116300225257874, 0.17191626131534576, 0.1826695203781128, 0.19342277944087982, 0.20417603850364685, 0.21492929756641388, 0.2256825566291809, 0.23643581569194794, 0.24718907475471497, 0.2579423487186432, 0.268695592880249, 0.27944883704185486, 0.2902021110057831, 0.3009553551673889, 0.31170862913131714, 0.322461873292923, 0.3332151472568512, 0.34396839141845703, 0.35472166538238525, 0.3654749095439911, 0.3762281835079193, 0.38698142766952515, 0.39773470163345337, 0.4084879457950592, 0.4192412197589874, 0.42999446392059326, 0.4407477378845215, 0.4515010118484497, 0.46225428581237793, 0.47300752997398376, 0.483760803937912, 0.4945140480995178, 0.505267322063446, 0.5160205960273743, 0.5267738103866577, 0.5375270843505859, 0.5482803583145142, 0.5590336322784424, 0.5697868466377258, 0.580540120601654, 0.5912933945655823, 0.6020466685295105, 0.612799882888794, 0.6235531568527222]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 0.0, 1.0, 4.0, 11.0, 3.0, 3.0, 9.0, 13.0, 15.0, 12.0, 19.0, 21.0, 30.0, 25.0, 38.0, 41.0, 73.0, 52.0, 55.0, 52.0, 59.0, 51.0, 50.0, 48.0, 50.0, 51.0, 49.0, 31.0, 32.0, 25.0, 22.0, 19.0, 20.0, 5.0, 8.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.09513932466506958, -0.0924723893404007, -0.08980545401573181, -0.08713851869106293, -0.08447158336639404, -0.08180464804172516, -0.07913771271705627, -0.07647077739238739, -0.0738038420677185, -0.07113690674304962, -0.06846997141838074, -0.06580303609371185, -0.06313610076904297, -0.060469165444374084, -0.0578022301197052, -0.055135294795036316, -0.05246835947036743, -0.04980142414569855, -0.04713448882102966, -0.04446755349636078, -0.041800618171691895, -0.03913368284702301, -0.036466747522354126, -0.03379981219768524, -0.031132876873016357, -0.028465941548347473, -0.02579900622367859, -0.023132070899009705, -0.02046513557434082, -0.017798200249671936, -0.015131264925003052, -0.012464329600334167, -0.009797394275665283, -0.007130458950996399, -0.004463523626327515, -0.0017965883016586304, 0.0008703470230102539, 0.003537282347679138, 0.0062042176723480225, 0.008871152997016907, 0.011538088321685791, 0.014205023646354675, 0.01687195897102356, 0.019538894295692444, 0.022205829620361328, 0.024872764945030212, 0.027539700269699097, 0.03020663559436798, 0.032873570919036865, 0.03554050624370575, 0.038207441568374634, 0.04087437689304352, 0.0435413122177124, 0.04620824754238129, 0.04887518286705017, 0.051542118191719055, 0.05420905351638794, 0.056875988841056824, 0.05954292416572571, 0.06220985949039459, 0.06487679481506348, 0.06754373013973236, 0.07021066546440125, 0.07287760078907013, 0.07554453611373901]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 12.0, 13.0, 9.0, 14.0, 27.0, 46.0, 45.0, 75.0, 121.0, 153.0, 244.0, 383.0, 519.0, 765.0, 1279.0, 2027.0, 3212.0, 5691.0, 9989.0, 19980.0, 44920.0, 144195.0, 661855.0, 85401.0, 32294.0, 15261.0, 7942.0, 4417.0, 2774.0, 1731.0, 1101.0, 656.0, 455.0, 349.0, 199.0, 131.0, 86.0, 66.0, 34.0, 26.0, 19.0, 9.0, 8.0, 8.0, 7.0, 1.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0438232421875, -0.04250764846801758, -0.041192054748535156, -0.039876461029052734, -0.03856086730957031, -0.03724527359008789, -0.03592967987060547, -0.03461408615112305, -0.033298492431640625, -0.0319828987121582, -0.03066730499267578, -0.02935171127319336, -0.028036117553710938, -0.026720523834228516, -0.025404930114746094, -0.024089336395263672, -0.02277374267578125, -0.021458148956298828, -0.020142555236816406, -0.018826961517333984, -0.017511367797851562, -0.01619577407836914, -0.014880180358886719, -0.013564586639404297, -0.012248992919921875, -0.010933399200439453, -0.009617805480957031, -0.00830221176147461, -0.0069866180419921875, -0.005671024322509766, -0.004355430603027344, -0.003039836883544922, -0.0017242431640625, -0.0004086494445800781, 0.0009069442749023438, 0.0022225379943847656, 0.0035381317138671875, 0.004853725433349609, 0.006169319152832031, 0.007484912872314453, 0.008800506591796875, 0.010116100311279297, 0.011431694030761719, 0.01274728775024414, 0.014062881469726562, 0.015378475189208984, 0.016694068908691406, 0.018009662628173828, 0.01932525634765625, 0.020640850067138672, 0.021956443786621094, 0.023272037506103516, 0.024587631225585938, 0.02590322494506836, 0.02721881866455078, 0.028534412384033203, 0.029850006103515625, 0.031165599822998047, 0.03248119354248047, 0.03379678726196289, 0.03511238098144531, 0.036427974700927734, 0.037743568420410156, 0.03905916213989258, 0.040374755859375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 4.0, 4.0, 3.0, 2.0, 6.0, 6.0, 6.0, 12.0, 15.0, 22.0, 27.0, 22.0, 33.0, 42.0, 55.0, 252.0, 220.0, 67.0, 41.0, 29.0, 24.0, 18.0, 24.0, 9.0, 19.0, 7.0, 5.0, 9.0, 1.0, 5.0, 3.0, 3.0, 7.0, 4.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020751953125, -0.020085811614990234, -0.01941967010498047, -0.018753528594970703, -0.018087387084960938, -0.017421245574951172, -0.016755104064941406, -0.01608896255493164, -0.015422821044921875, -0.01475667953491211, -0.014090538024902344, -0.013424396514892578, -0.012758255004882812, -0.012092113494873047, -0.011425971984863281, -0.010759830474853516, -0.01009368896484375, -0.009427547454833984, -0.008761405944824219, -0.008095264434814453, -0.0074291229248046875, -0.006762981414794922, -0.006096839904785156, -0.005430698394775391, -0.004764556884765625, -0.004098415374755859, -0.0034322738647460938, -0.002766132354736328, -0.0020999908447265625, -0.0014338493347167969, -0.0007677078247070312, -0.00010156631469726562, 0.0005645751953125, 0.0012307167053222656, 0.0018968582153320312, 0.002562999725341797, 0.0032291412353515625, 0.003895282745361328, 0.004561424255371094, 0.005227565765380859, 0.005893707275390625, 0.006559848785400391, 0.007225990295410156, 0.007892131805419922, 0.008558273315429688, 0.009224414825439453, 0.009890556335449219, 0.010556697845458984, 0.01122283935546875, 0.011888980865478516, 0.012555122375488281, 0.013221263885498047, 0.013887405395507812, 0.014553546905517578, 0.015219688415527344, 0.01588582992553711, 0.016551971435546875, 0.01721811294555664, 0.017884254455566406, 0.018550395965576172, 0.019216537475585938, 0.019882678985595703, 0.02054882049560547, 0.021214962005615234, 0.021881103515625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 1.0, 7.0, 9.0, 12.0, 16.0, 16.0, 24.0, 36.0, 59.0, 89.0, 97.0, 139.0, 231.0, 418.0, 776.0, 1721.0, 5350.0, 22662.0, 150600.0, 694923.0, 141035.0, 21619.0, 5060.0, 1751.0, 759.0, 397.0, 242.0, 137.0, 103.0, 77.0, 49.0, 38.0, 35.0, 21.0, 12.0, 16.0, 9.0, 6.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.057464599609375, -0.05574846267700195, -0.054032325744628906, -0.05231618881225586, -0.05060005187988281, -0.048883914947509766, -0.04716777801513672, -0.04545164108276367, -0.043735504150390625, -0.04201936721801758, -0.04030323028564453, -0.038587093353271484, -0.03687095642089844, -0.03515481948852539, -0.033438682556152344, -0.0317225456237793, -0.03000640869140625, -0.028290271759033203, -0.026574134826660156, -0.02485799789428711, -0.023141860961914062, -0.021425724029541016, -0.01970958709716797, -0.017993450164794922, -0.016277313232421875, -0.014561176300048828, -0.012845039367675781, -0.011128902435302734, -0.009412765502929688, -0.007696628570556641, -0.005980491638183594, -0.004264354705810547, -0.0025482177734375, -0.0008320808410644531, 0.0008840560913085938, 0.0026001930236816406, 0.0043163299560546875, 0.006032466888427734, 0.007748603820800781, 0.009464740753173828, 0.011180877685546875, 0.012897014617919922, 0.014613151550292969, 0.016329288482666016, 0.018045425415039062, 0.01976156234741211, 0.021477699279785156, 0.023193836212158203, 0.02490997314453125, 0.026626110076904297, 0.028342247009277344, 0.03005838394165039, 0.03177452087402344, 0.033490657806396484, 0.03520679473876953, 0.03692293167114258, 0.038639068603515625, 0.04035520553588867, 0.04207134246826172, 0.043787479400634766, 0.04550361633300781, 0.04721975326538086, 0.048935890197753906, 0.05065202713012695, 0.0523681640625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 9.0, 6.0, 10.0, 12.0, 8.0, 16.0, 15.0, 26.0, 25.0, 35.0, 23.0, 41.0, 40.0, 40.0, 48.0, 36.0, 50.0, 56.0, 42.0, 41.0, 57.0, 45.0, 33.0, 32.0, 33.0, 28.0, 29.0, 21.0, 31.0, 21.0, 21.0, 19.0, 13.0, 17.0, 6.0, 8.0, 5.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.08544921875, -0.08315610885620117, -0.08086299896240234, -0.07856988906860352, -0.07627677917480469, -0.07398366928100586, -0.07169055938720703, -0.0693974494934082, -0.06710433959960938, -0.06481122970581055, -0.06251811981201172, -0.06022500991821289, -0.05793190002441406, -0.055638790130615234, -0.053345680236816406, -0.05105257034301758, -0.04875946044921875, -0.04646635055541992, -0.044173240661621094, -0.041880130767822266, -0.03958702087402344, -0.03729391098022461, -0.03500080108642578, -0.03270769119262695, -0.030414581298828125, -0.028121471405029297, -0.02582836151123047, -0.02353525161743164, -0.021242141723632812, -0.018949031829833984, -0.016655921936035156, -0.014362812042236328, -0.0120697021484375, -0.009776592254638672, -0.007483482360839844, -0.005190372467041016, -0.0028972625732421875, -0.0006041526794433594, 0.0016889572143554688, 0.003982067108154297, 0.006275177001953125, 0.008568286895751953, 0.010861396789550781, 0.01315450668334961, 0.015447616577148438, 0.017740726470947266, 0.020033836364746094, 0.022326946258544922, 0.02462005615234375, 0.026913166046142578, 0.029206275939941406, 0.031499385833740234, 0.03379249572753906, 0.03608560562133789, 0.03837871551513672, 0.04067182540893555, 0.042964935302734375, 0.0452580451965332, 0.04755115509033203, 0.04984426498413086, 0.05213737487792969, 0.054430484771728516, 0.056723594665527344, 0.05901670455932617, 0.061309814453125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 9.0, 20.0, 21.0, 25.0, 79.0, 129.0, 239.0, 556.0, 1603.0, 7862.0, 197388.0, 819547.0, 17024.0, 2608.0, 762.0, 308.0, 170.0, 79.0, 46.0, 26.0, 11.0, 13.0, 8.0, 6.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0316162109375, -0.030601978302001953, -0.029587745666503906, -0.02857351303100586, -0.027559280395507812, -0.026545047760009766, -0.02553081512451172, -0.024516582489013672, -0.023502349853515625, -0.022488117218017578, -0.02147388458251953, -0.020459651947021484, -0.019445419311523438, -0.01843118667602539, -0.017416954040527344, -0.016402721405029297, -0.01538848876953125, -0.014374256134033203, -0.013360023498535156, -0.01234579086303711, -0.011331558227539062, -0.010317325592041016, -0.009303092956542969, -0.008288860321044922, -0.007274627685546875, -0.006260395050048828, -0.005246162414550781, -0.004231929779052734, -0.0032176971435546875, -0.0022034645080566406, -0.0011892318725585938, -0.00017499923706054688, 0.0008392333984375, 0.0018534660339355469, 0.0028676986694335938, 0.0038819313049316406, 0.0048961639404296875, 0.005910396575927734, 0.006924629211425781, 0.007938861846923828, 0.008953094482421875, 0.009967327117919922, 0.010981559753417969, 0.011995792388916016, 0.013010025024414062, 0.01402425765991211, 0.015038490295410156, 0.016052722930908203, 0.01706695556640625, 0.018081188201904297, 0.019095420837402344, 0.02010965347290039, 0.021123886108398438, 0.022138118743896484, 0.02315235137939453, 0.024166584014892578, 0.025180816650390625, 0.026195049285888672, 0.02720928192138672, 0.028223514556884766, 0.029237747192382812, 0.03025197982788086, 0.031266212463378906, 0.03228044509887695, 0.033294677734375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 6.0, 8.0, 13.0, 9.0, 13.0, 21.0, 24.0, 25.0, 30.0, 39.0, 55.0, 60.0, 66.0, 45.0, 71.0, 69.0, 66.0, 63.0, 41.0, 53.0, 48.0, 27.0, 28.0, 30.0, 28.0, 32.0, 10.0, 7.0, 6.0, 9.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1563301086425781e-05, -1.1213123798370361e-05, -1.0862946510314941e-05, -1.0512769222259521e-05, -1.0162591934204102e-05, -9.812414646148682e-06, -9.462237358093262e-06, -9.112060070037842e-06, -8.761882781982422e-06, -8.411705493927002e-06, -8.061528205871582e-06, -7.711350917816162e-06, -7.361173629760742e-06, -7.010996341705322e-06, -6.660819053649902e-06, -6.310641765594482e-06, -5.9604644775390625e-06, -5.610287189483643e-06, -5.260109901428223e-06, -4.909932613372803e-06, -4.559755325317383e-06, -4.209578037261963e-06, -3.859400749206543e-06, -3.509223461151123e-06, -3.159046173095703e-06, -2.808868885040283e-06, -2.4586915969848633e-06, -2.1085143089294434e-06, -1.7583370208740234e-06, -1.4081597328186035e-06, -1.0579824447631836e-06, -7.078051567077637e-07, -3.5762786865234375e-07, -7.450580596923828e-09, 3.427267074584961e-07, 6.92903995513916e-07, 1.043081283569336e-06, 1.3932585716247559e-06, 1.7434358596801758e-06, 2.0936131477355957e-06, 2.4437904357910156e-06, 2.7939677238464355e-06, 3.1441450119018555e-06, 3.4943222999572754e-06, 3.844499588012695e-06, 4.194676876068115e-06, 4.544854164123535e-06, 4.895031452178955e-06, 5.245208740234375e-06, 5.595386028289795e-06, 5.945563316345215e-06, 6.295740604400635e-06, 6.645917892456055e-06, 6.996095180511475e-06, 7.3462724685668945e-06, 7.696449756622314e-06, 8.046627044677734e-06, 8.396804332733154e-06, 8.746981620788574e-06, 9.097158908843994e-06, 9.447336196899414e-06, 9.797513484954834e-06, 1.0147690773010254e-05, 1.0497868061065674e-05, 1.0848045349121094e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 3.0, 6.0, 5.0, 6.0, 7.0, 18.0, 26.0, 40.0, 49.0, 89.0, 167.0, 366.0, 780.0, 2370.0, 9471.0, 75666.0, 756400.0, 181316.0, 16377.0, 3431.0, 1056.0, 417.0, 209.0, 113.0, 59.0, 38.0, 24.0, 16.0, 10.0, 6.0, 4.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.02227783203125, -0.021635055541992188, -0.020992279052734375, -0.020349502563476562, -0.01970672607421875, -0.019063949584960938, -0.018421173095703125, -0.017778396606445312, -0.0171356201171875, -0.016492843627929688, -0.015850067138671875, -0.015207290649414062, -0.01456451416015625, -0.013921737670898438, -0.013278961181640625, -0.012636184692382812, -0.011993408203125, -0.011350631713867188, -0.010707855224609375, -0.010065078735351562, -0.00942230224609375, -0.008779525756835938, -0.008136749267578125, -0.0074939727783203125, -0.0068511962890625, -0.0062084197998046875, -0.005565643310546875, -0.0049228668212890625, -0.00428009033203125, -0.0036373138427734375, -0.002994537353515625, -0.0023517608642578125, -0.001708984375, -0.0010662078857421875, -0.000423431396484375, 0.0002193450927734375, 0.00086212158203125, 0.0015048980712890625, 0.002147674560546875, 0.0027904510498046875, 0.0034332275390625, 0.0040760040283203125, 0.004718780517578125, 0.0053615570068359375, 0.00600433349609375, 0.0066471099853515625, 0.007289886474609375, 0.007932662963867188, 0.008575439453125, 0.009218215942382812, 0.009860992431640625, 0.010503768920898438, 0.01114654541015625, 0.011789321899414062, 0.012432098388671875, 0.013074874877929688, 0.0137176513671875, 0.014360427856445312, 0.015003204345703125, 0.015645980834960938, 0.01628875732421875, 0.016931533813476562, 0.017574310302734375, 0.018217086791992188, 0.01885986328125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 3.0, 11.0, 12.0, 11.0, 15.0, 17.0, 34.0, 41.0, 78.0, 73.0, 108.0, 106.0, 97.0, 87.0, 73.0, 66.0, 48.0, 38.0, 30.0, 18.0, 13.0, 6.0, 8.0, 2.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.024169921875, -0.0234830379486084, -0.022796154022216797, -0.022109270095825195, -0.021422386169433594, -0.020735502243041992, -0.02004861831665039, -0.01936173439025879, -0.018674850463867188, -0.017987966537475586, -0.017301082611083984, -0.016614198684692383, -0.01592731475830078, -0.01524043083190918, -0.014553546905517578, -0.013866662979125977, -0.013179779052734375, -0.012492895126342773, -0.011806011199951172, -0.01111912727355957, -0.010432243347167969, -0.009745359420776367, -0.009058475494384766, -0.008371591567993164, -0.0076847076416015625, -0.006997823715209961, -0.006310939788818359, -0.005624055862426758, -0.004937171936035156, -0.004250288009643555, -0.003563404083251953, -0.0028765201568603516, -0.00218963623046875, -0.0015027523040771484, -0.0008158683776855469, -0.0001289844512939453, 0.0005578994750976562, 0.0012447834014892578, 0.0019316673278808594, 0.002618551254272461, 0.0033054351806640625, 0.003992319107055664, 0.004679203033447266, 0.005366086959838867, 0.006052970886230469, 0.00673985481262207, 0.007426738739013672, 0.008113622665405273, 0.008800506591796875, 0.009487390518188477, 0.010174274444580078, 0.01086115837097168, 0.011548042297363281, 0.012234926223754883, 0.012921810150146484, 0.013608694076538086, 0.014295578002929688, 0.014982461929321289, 0.01566934585571289, 0.016356229782104492, 0.017043113708496094, 0.017729997634887695, 0.018416881561279297, 0.0191037654876709, 0.0197906494140625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [2.0, 13.0, 31.0, 395.0, 538.0, 31.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20775380730628967, -0.15670248866081238, -0.10565116256475449, -0.054599836468696594, -0.0035485178232192993, 0.04750281572341919, 0.09855413436889648, 0.14960545301437378, 0.20065677165985107, 0.25170809030532837, 0.30275940895080566, 0.35381072759628296, 0.40486204624176025, 0.45591339468955994, 0.5069646835327148, 0.5580160617828369, 0.6090673208236694, 0.6601186394691467, 0.711169958114624, 0.7622212767601013, 0.8132725954055786, 0.8643239736557007, 0.9153752326965332, 0.9664266109466553, 1.0174779891967773, 1.0685293674468994, 1.119580626487732, 1.170632004737854, 1.2216832637786865, 1.2727346420288086, 1.3237859010696411, 1.3748372793197632, 1.4258884191513062, 1.4769397974014282, 1.5279910564422607, 1.5790424346923828, 1.6300936937332153, 1.6811450719833374, 1.73219633102417, 1.783247709274292, 1.8342989683151245, 1.8853503465652466, 1.936401605606079, 1.9874529838562012, 2.0385043621063232, 2.089555501937866, 2.1406068801879883, 2.1916582584381104, 2.2427096366882324, 2.2937610149383545, 2.3448123931884766, 2.3958635330200195, 2.4469149112701416, 2.4979662895202637, 2.5490176677703857, 2.6000688076019287, 2.651120185852051, 2.702171564102173, 2.753222942352295, 2.804274082183838, 2.85532546043396, 2.906376838684082, 2.957428216934204, 3.008479356765747, 3.059530735015869]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 8.0, 1.0, 4.0, 3.0, 7.0, 9.0, 9.0, 7.0, 8.0, 9.0, 14.0, 32.0, 48.0, 102.0, 110.0, 167.0, 153.0, 127.0, 69.0, 36.0, 18.0, 19.0, 6.0, 5.0, 2.0, 4.0, 3.0, 4.0, 3.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4588866233825684, -1.418999433517456, -1.3791122436523438, -1.3392250537872314, -1.2993378639221191, -1.2594506740570068, -1.2195634841918945, -1.1796762943267822, -1.13978910446167, -1.0999019145965576, -1.0600147247314453, -1.020127534866333, -0.9802403450012207, -0.9403531551361084, -0.9004659652709961, -0.8605787754058838, -0.8206915855407715, -0.7808043956756592, -0.7409172058105469, -0.7010300159454346, -0.6611428260803223, -0.62125563621521, -0.5813684463500977, -0.5414812564849854, -0.501594066619873, -0.46170687675476074, -0.42181968688964844, -0.38193249702453613, -0.34204530715942383, -0.3021581172943115, -0.2622709274291992, -0.22238373756408691, -0.1824965476989746, -0.1426093578338623, -0.10272216796875, -0.0628349781036377, -0.02294778823852539, 0.016939401626586914, 0.05682659149169922, 0.09671378135681152, 0.13660097122192383, 0.17648816108703613, 0.21637535095214844, 0.25626254081726074, 0.29614973068237305, 0.33603692054748535, 0.37592411041259766, 0.41581130027770996, 0.45569849014282227, 0.49558568000793457, 0.5354728698730469, 0.5753600597381592, 0.6152472496032715, 0.6551344394683838, 0.6950216293334961, 0.7349088191986084, 0.7747960090637207, 0.814683198928833, 0.8545703887939453, 0.8944575786590576, 0.9343447685241699, 0.9742319583892822, 1.0141191482543945, 1.0540063381195068, 1.0938935279846191]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 8.0, 9.0, 19.0, 21.0, 25.0, 40.0, 46.0, 85.0, 103.0, 184.0, 236.0, 368.0, 568.0, 887.0, 1470.0, 2372.0, 4193.0, 7981.0, 16318.0, 43379.0, 255070.0, 3706340.0, 100439.0, 27748.0, 11918.0, 6051.0, 3261.0, 1913.0, 1148.0, 662.0, 508.0, 324.0, 195.0, 125.0, 67.0, 64.0, 40.0, 32.0, 25.0, 13.0, 10.0, 7.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.098388671875, -0.09534263610839844, -0.09229660034179688, -0.08925056457519531, -0.08620452880859375, -0.08315849304199219, -0.08011245727539062, -0.07706642150878906, -0.0740203857421875, -0.07097434997558594, -0.06792831420898438, -0.06488227844238281, -0.06183624267578125, -0.05879020690917969, -0.055744171142578125, -0.05269813537597656, -0.049652099609375, -0.04660606384277344, -0.043560028076171875, -0.04051399230957031, -0.03746795654296875, -0.03442192077636719, -0.031375885009765625, -0.028329849243164062, -0.0252838134765625, -0.022237777709960938, -0.019191741943359375, -0.016145706176757812, -0.01309967041015625, -0.010053634643554688, -0.007007598876953125, -0.0039615631103515625, -0.00091552734375, 0.0021305084228515625, 0.005176544189453125, 0.008222579956054688, 0.01126861572265625, 0.014314651489257812, 0.017360687255859375, 0.020406723022460938, 0.0234527587890625, 0.026498794555664062, 0.029544830322265625, 0.03259086608886719, 0.03563690185546875, 0.03868293762207031, 0.041728973388671875, 0.04477500915527344, 0.047821044921875, 0.05086708068847656, 0.053913116455078125, 0.05695915222167969, 0.06000518798828125, 0.06305122375488281, 0.06609725952148438, 0.06914329528808594, 0.0721893310546875, 0.07523536682128906, 0.07828140258789062, 0.08132743835449219, 0.08437347412109375, 0.08741950988769531, 0.09046554565429688, 0.09351158142089844, 0.0965576171875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 7.0, 5.0, 6.0, 7.0, 15.0, 13.0, 15.0, 27.0, 22.0, 25.0, 36.0, 43.0, 81.0, 182.0, 191.0, 96.0, 41.0, 34.0, 33.0, 17.0, 18.0, 17.0, 12.0, 17.0, 5.0, 8.0, 6.0, 8.0, 4.0, 2.0, 1.0, 2.0, 0.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0208587646484375, -0.0203096866607666, -0.019760608673095703, -0.019211530685424805, -0.018662452697753906, -0.018113374710083008, -0.01756429672241211, -0.01701521873474121, -0.016466140747070312, -0.015917062759399414, -0.015367984771728516, -0.014818906784057617, -0.014269828796386719, -0.01372075080871582, -0.013171672821044922, -0.012622594833374023, -0.012073516845703125, -0.011524438858032227, -0.010975360870361328, -0.01042628288269043, -0.009877204895019531, -0.009328126907348633, -0.008779048919677734, -0.008229970932006836, -0.0076808929443359375, -0.007131814956665039, -0.006582736968994141, -0.006033658981323242, -0.005484580993652344, -0.004935503005981445, -0.004386425018310547, -0.0038373470306396484, -0.00328826904296875, -0.0027391910552978516, -0.002190113067626953, -0.0016410350799560547, -0.0010919570922851562, -0.0005428791046142578, 6.198883056640625e-06, 0.0005552768707275391, 0.0011043548583984375, 0.001653432846069336, 0.0022025108337402344, 0.002751588821411133, 0.0033006668090820312, 0.0038497447967529297, 0.004398822784423828, 0.0049479007720947266, 0.005496978759765625, 0.0060460567474365234, 0.006595134735107422, 0.00714421272277832, 0.007693290710449219, 0.008242368698120117, 0.008791446685791016, 0.009340524673461914, 0.009889602661132812, 0.010438680648803711, 0.01098775863647461, 0.011536836624145508, 0.012085914611816406, 0.012634992599487305, 0.013184070587158203, 0.013733148574829102, 0.0142822265625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 5.0, 1.0, 3.0, 4.0, 5.0, 8.0, 16.0, 13.0, 13.0, 22.0, 40.0, 48.0, 78.0, 125.0, 220.0, 389.0, 668.0, 1433.0, 3366.0, 8682.0, 26489.0, 111000.0, 3259480.0, 680511.0, 70604.0, 19197.0, 6634.0, 2682.0, 1128.0, 593.0, 290.0, 204.0, 115.0, 65.0, 51.0, 33.0, 22.0, 12.0, 10.0, 7.0, 3.0, 8.0, 4.0, 0.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09619140625, -0.09317207336425781, -0.09015274047851562, -0.08713340759277344, -0.08411407470703125, -0.08109474182128906, -0.07807540893554688, -0.07505607604980469, -0.0720367431640625, -0.06901741027832031, -0.06599807739257812, -0.06297874450683594, -0.05995941162109375, -0.05694007873535156, -0.053920745849609375, -0.05090141296386719, -0.047882080078125, -0.04486274719238281, -0.041843414306640625, -0.03882408142089844, -0.03580474853515625, -0.03278541564941406, -0.029766082763671875, -0.026746749877929688, -0.0237274169921875, -0.020708084106445312, -0.017688751220703125, -0.014669418334960938, -0.01165008544921875, -0.008630752563476562, -0.005611419677734375, -0.0025920867919921875, 0.00042724609375, 0.0034465789794921875, 0.006465911865234375, 0.009485244750976562, 0.01250457763671875, 0.015523910522460938, 0.018543243408203125, 0.021562576293945312, 0.0245819091796875, 0.027601242065429688, 0.030620574951171875, 0.03363990783691406, 0.03665924072265625, 0.03967857360839844, 0.042697906494140625, 0.04571723937988281, 0.048736572265625, 0.05175590515136719, 0.054775238037109375, 0.05779457092285156, 0.06081390380859375, 0.06383323669433594, 0.06685256958007812, 0.06987190246582031, 0.0728912353515625, 0.07591056823730469, 0.07892990112304688, 0.08194923400878906, 0.08496856689453125, 0.08798789978027344, 0.09100723266601562, 0.09402656555175781, 0.0970458984375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 5.0, 2.0, 14.0, 9.0, 13.0, 15.0, 16.0, 28.0, 53.0, 58.0, 82.0, 136.0, 251.0, 629.0, 1837.0, 365.0, 172.0, 107.0, 65.0, 52.0, 37.0, 25.0, 21.0, 17.0, 14.0, 10.0, 8.0, 4.0, 3.0, 6.0, 7.0, 2.0, 0.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0224151611328125, -0.021828889846801758, -0.021242618560791016, -0.020656347274780273, -0.02007007598876953, -0.01948380470275879, -0.018897533416748047, -0.018311262130737305, -0.017724990844726562, -0.01713871955871582, -0.016552448272705078, -0.015966176986694336, -0.015379905700683594, -0.014793634414672852, -0.01420736312866211, -0.013621091842651367, -0.013034820556640625, -0.012448549270629883, -0.01186227798461914, -0.011276006698608398, -0.010689735412597656, -0.010103464126586914, -0.009517192840576172, -0.00893092155456543, -0.008344650268554688, -0.007758378982543945, -0.007172107696533203, -0.006585836410522461, -0.005999565124511719, -0.0054132938385009766, -0.004827022552490234, -0.004240751266479492, -0.00365447998046875, -0.003068208694458008, -0.0024819374084472656, -0.0018956661224365234, -0.0013093948364257812, -0.0007231235504150391, -0.00013685226440429688, 0.0004494190216064453, 0.0010356903076171875, 0.0016219615936279297, 0.002208232879638672, 0.002794504165649414, 0.0033807754516601562, 0.0039670467376708984, 0.004553318023681641, 0.005139589309692383, 0.005725860595703125, 0.006312131881713867, 0.006898403167724609, 0.0074846744537353516, 0.008070945739746094, 0.008657217025756836, 0.009243488311767578, 0.00982975959777832, 0.010416030883789062, 0.011002302169799805, 0.011588573455810547, 0.012174844741821289, 0.012761116027832031, 0.013347387313842773, 0.013933658599853516, 0.014519929885864258, 0.015106201171875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 32.0, 142.0, 435.0, 303.0, 68.0, 19.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08249970525503159, -0.07544651627540588, -0.06839332729578018, -0.06134013831615448, -0.05428694933652878, -0.047233764082193375, -0.04018057510256767, -0.03312738612294197, -0.02607419714331627, -0.019021008163690567, -0.01196782011538744, -0.0049146320670843124, 0.0021385569125413895, 0.009191744029521942, 0.016244933009147644, 0.023298121988773346, 0.030351310968399048, 0.03740449994802475, 0.04445768892765045, 0.051510877907276154, 0.058564066886901855, 0.06561724841594696, 0.07267044484615326, 0.07972362637519836, 0.08677682280540466, 0.09383001178503036, 0.10088320076465607, 0.10793638974428177, 0.11498957872390747, 0.12204276025295258, 0.12909595668315887, 0.13614913821220398, 0.14320231974124908, 0.1502555012702942, 0.1573086977005005, 0.1643618792295456, 0.1714150756597519, 0.178468257188797, 0.1855214536190033, 0.1925746351480484, 0.1996278315782547, 0.2066810131072998, 0.2137342095375061, 0.2207873910665512, 0.2278405874967575, 0.2348937690258026, 0.2419469654560089, 0.24900014698505402, 0.2560533285140991, 0.2631065249443054, 0.27015969157218933, 0.27721288800239563, 0.28426608443260193, 0.2913192808628082, 0.29837244749069214, 0.30542564392089844, 0.31247884035110474, 0.31953203678131104, 0.32658520340919495, 0.33363839983940125, 0.34069159626960754, 0.34774479269981384, 0.35479795932769775, 0.36185115575790405, 0.36890435218811035]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 10.0, 6.0, 9.0, 16.0, 13.0, 19.0, 25.0, 35.0, 51.0, 49.0, 75.0, 57.0, 77.0, 86.0, 77.0, 76.0, 59.0, 53.0, 33.0, 35.0, 28.0, 25.0, 10.0, 21.0, 11.0, 4.0, 8.0, 6.0, 5.0, 4.0, 4.0, 2.0, 0.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.08272719383239746, -0.08022410422563553, -0.0777210146188736, -0.07521792501211166, -0.07271483540534973, -0.0702117532491684, -0.06770866364240646, -0.06520557403564453, -0.0627024844288826, -0.060199394822120667, -0.057696305215358734, -0.0551932193338871, -0.05269012972712517, -0.050187040120363235, -0.0476839542388916, -0.04518086463212967, -0.04267777502536774, -0.040174685418605804, -0.03767159581184387, -0.03516850993037224, -0.032665420323610306, -0.030162330716848373, -0.02765924297273159, -0.025156155228614807, -0.022653065621852875, -0.020149976015090942, -0.01764688827097416, -0.015143799595534801, -0.012640710920095444, -0.010137622244656086, -0.007634533569216728, -0.005131445825099945, -0.0026283562183380127, -0.00012526754289865494, 0.002377821132540703, 0.004880909807980061, 0.007383998483419418, 0.009887087158858776, 0.012390175834298134, 0.014893263578414917, 0.01739635318517685, 0.019899442791938782, 0.022402530536055565, 0.024905618280172348, 0.02740870788693428, 0.029911797493696213, 0.03241488337516785, 0.03491797298192978, 0.03742106258869171, 0.039924152195453644, 0.042427241802215576, 0.04493032768368721, 0.04743341729044914, 0.049936506897211075, 0.05243959277868271, 0.05494268238544464, 0.057445771992206573, 0.059948861598968506, 0.06245195120573044, 0.06495504081249237, 0.0674581229686737, 0.06996121257543564, 0.07246430218219757, 0.0749673917889595, 0.07747048139572144]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 5.0, 2.0, 3.0, 10.0, 8.0, 17.0, 13.0, 24.0, 43.0, 44.0, 78.0, 126.0, 204.0, 336.0, 537.0, 997.0, 1892.0, 3656.0, 8401.0, 21395.0, 73443.0, 622629.0, 240371.0, 46349.0, 15355.0, 6187.0, 2935.0, 1409.0, 781.0, 499.0, 287.0, 186.0, 108.0, 70.0, 48.0, 40.0, 13.0, 13.0, 16.0, 14.0, 9.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11676025390625, -0.11350154876708984, -0.11024284362792969, -0.10698413848876953, -0.10372543334960938, -0.10046672821044922, -0.09720802307128906, -0.0939493179321289, -0.09069061279296875, -0.0874319076538086, -0.08417320251464844, -0.08091449737548828, -0.07765579223632812, -0.07439708709716797, -0.07113838195800781, -0.06787967681884766, -0.0646209716796875, -0.061362266540527344, -0.05810356140136719, -0.05484485626220703, -0.051586151123046875, -0.04832744598388672, -0.04506874084472656, -0.041810035705566406, -0.03855133056640625, -0.035292625427246094, -0.03203392028808594, -0.02877521514892578, -0.025516510009765625, -0.02225780487060547, -0.018999099731445312, -0.015740394592285156, -0.012481689453125, -0.009222984313964844, -0.0059642791748046875, -0.0027055740356445312, 0.000553131103515625, 0.0038118362426757812, 0.0070705413818359375, 0.010329246520996094, 0.01358795166015625, 0.016846656799316406, 0.020105361938476562, 0.02336406707763672, 0.026622772216796875, 0.02988147735595703, 0.03314018249511719, 0.036398887634277344, 0.0396575927734375, 0.042916297912597656, 0.04617500305175781, 0.04943370819091797, 0.052692413330078125, 0.05595111846923828, 0.05920982360839844, 0.062468528747558594, 0.06572723388671875, 0.0689859390258789, 0.07224464416503906, 0.07550334930419922, 0.07876205444335938, 0.08202075958251953, 0.08527946472167969, 0.08853816986083984, 0.091796875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 2.0, 4.0, 7.0, 5.0, 7.0, 14.0, 17.0, 11.0, 24.0, 26.0, 39.0, 26.0, 55.0, 113.0, 176.0, 151.0, 84.0, 44.0, 36.0, 32.0, 26.0, 13.0, 19.0, 8.0, 18.0, 12.0, 2.0, 9.0, 3.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.0210418701171875, -0.020514369010925293, -0.019986867904663086, -0.01945936679840088, -0.018931865692138672, -0.018404364585876465, -0.017876863479614258, -0.01734936237335205, -0.016821861267089844, -0.016294360160827637, -0.01576685905456543, -0.015239357948303223, -0.014711856842041016, -0.014184355735778809, -0.013656854629516602, -0.013129353523254395, -0.012601852416992188, -0.01207435131072998, -0.011546850204467773, -0.011019349098205566, -0.01049184799194336, -0.009964346885681152, -0.009436845779418945, -0.008909344673156738, -0.008381843566894531, -0.007854342460632324, -0.007326841354370117, -0.00679934024810791, -0.006271839141845703, -0.005744338035583496, -0.005216836929321289, -0.004689335823059082, -0.004161834716796875, -0.003634333610534668, -0.003106832504272461, -0.002579331398010254, -0.002051830291748047, -0.0015243291854858398, -0.0009968280792236328, -0.0004693269729614258, 5.817413330078125e-05, 0.0005856752395629883, 0.0011131763458251953, 0.0016406774520874023, 0.0021681785583496094, 0.0026956796646118164, 0.0032231807708740234, 0.0037506818771362305, 0.0042781829833984375, 0.0048056840896606445, 0.0053331851959228516, 0.005860686302185059, 0.006388187408447266, 0.006915688514709473, 0.00744318962097168, 0.007970690727233887, 0.008498191833496094, 0.0090256929397583, 0.009553194046020508, 0.010080695152282715, 0.010608196258544922, 0.011135697364807129, 0.011663198471069336, 0.012190699577331543, 0.01271820068359375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 9.0, 2.0, 7.0, 13.0, 22.0, 21.0, 36.0, 66.0, 88.0, 196.0, 501.0, 2216.0, 15803.0, 485391.0, 525182.0, 15805.0, 2199.0, 526.0, 197.0, 82.0, 64.0, 28.0, 28.0, 16.0, 5.0, 8.0, 8.0, 3.0, 2.0, 5.0, 4.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.1575927734375, -0.1530914306640625, -0.148590087890625, -0.1440887451171875, -0.13958740234375, -0.1350860595703125, -0.130584716796875, -0.1260833740234375, -0.12158203125, -0.1170806884765625, -0.112579345703125, -0.1080780029296875, -0.10357666015625, -0.0990753173828125, -0.094573974609375, -0.0900726318359375, -0.0855712890625, -0.0810699462890625, -0.076568603515625, -0.0720672607421875, -0.06756591796875, -0.0630645751953125, -0.058563232421875, -0.0540618896484375, -0.049560546875, -0.0450592041015625, -0.040557861328125, -0.0360565185546875, -0.03155517578125, -0.0270538330078125, -0.022552490234375, -0.0180511474609375, -0.0135498046875, -0.0090484619140625, -0.004547119140625, -4.57763671875e-05, 0.00445556640625, 0.0089569091796875, 0.013458251953125, 0.0179595947265625, 0.0224609375, 0.0269622802734375, 0.031463623046875, 0.0359649658203125, 0.04046630859375, 0.0449676513671875, 0.049468994140625, 0.0539703369140625, 0.0584716796875, 0.0629730224609375, 0.067474365234375, 0.0719757080078125, 0.07647705078125, 0.0809783935546875, 0.085479736328125, 0.0899810791015625, 0.094482421875, 0.0989837646484375, 0.103485107421875, 0.1079864501953125, 0.11248779296875, 0.1169891357421875, 0.121490478515625, 0.1259918212890625, 0.1304931640625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 10.0, 6.0, 7.0, 5.0, 8.0, 18.0, 19.0, 14.0, 23.0, 21.0, 28.0, 32.0, 40.0, 42.0, 56.0, 46.0, 49.0, 46.0, 55.0, 44.0, 35.0, 49.0, 57.0, 38.0, 34.0, 42.0, 25.0, 31.0, 25.0, 16.0, 19.0, 12.0, 10.0, 12.0, 4.0, 7.0, 7.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.05364990234375, -0.052046775817871094, -0.05044364929199219, -0.04884052276611328, -0.047237396240234375, -0.04563426971435547, -0.04403114318847656, -0.042428016662597656, -0.04082489013671875, -0.039221763610839844, -0.03761863708496094, -0.03601551055908203, -0.034412384033203125, -0.03280925750732422, -0.031206130981445312, -0.029603004455566406, -0.0279998779296875, -0.026396751403808594, -0.024793624877929688, -0.02319049835205078, -0.021587371826171875, -0.01998424530029297, -0.018381118774414062, -0.016777992248535156, -0.01517486572265625, -0.013571739196777344, -0.011968612670898438, -0.010365486145019531, -0.008762359619140625, -0.007159233093261719, -0.0055561065673828125, -0.003952980041503906, -0.002349853515625, -0.0007467269897460938, 0.0008563995361328125, 0.0024595260620117188, 0.004062652587890625, 0.005665779113769531, 0.0072689056396484375, 0.008872032165527344, 0.01047515869140625, 0.012078285217285156, 0.013681411743164062, 0.015284538269042969, 0.016887664794921875, 0.01849079132080078, 0.020093917846679688, 0.021697044372558594, 0.0233001708984375, 0.024903297424316406, 0.026506423950195312, 0.02810955047607422, 0.029712677001953125, 0.03131580352783203, 0.03291893005371094, 0.034522056579589844, 0.03612518310546875, 0.037728309631347656, 0.03933143615722656, 0.04093456268310547, 0.042537689208984375, 0.04414081573486328, 0.04574394226074219, 0.047347068786621094, 0.0489501953125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 7.0, 13.0, 25.0, 78.0, 554.0, 616227.0, 430949.0, 562.0, 82.0, 33.0, 15.0, 3.0, 3.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4658203125, -0.4538726806640625, -0.441925048828125, -0.4299774169921875, -0.41802978515625, -0.4060821533203125, -0.394134521484375, -0.3821868896484375, -0.3702392578125, -0.3582916259765625, -0.346343994140625, -0.3343963623046875, -0.32244873046875, -0.3105010986328125, -0.298553466796875, -0.2866058349609375, -0.274658203125, -0.2627105712890625, -0.250762939453125, -0.2388153076171875, -0.22686767578125, -0.2149200439453125, -0.202972412109375, -0.1910247802734375, -0.1790771484375, -0.1671295166015625, -0.155181884765625, -0.1432342529296875, -0.13128662109375, -0.1193389892578125, -0.107391357421875, -0.0954437255859375, -0.08349609375, -0.0715484619140625, -0.059600830078125, -0.0476531982421875, -0.03570556640625, -0.0237579345703125, -0.011810302734375, 0.0001373291015625, 0.0120849609375, 0.0240325927734375, 0.035980224609375, 0.0479278564453125, 0.05987548828125, 0.0718231201171875, 0.083770751953125, 0.0957183837890625, 0.107666015625, 0.1196136474609375, 0.131561279296875, 0.1435089111328125, 0.15545654296875, 0.1674041748046875, 0.179351806640625, 0.1912994384765625, 0.2032470703125, 0.2151947021484375, 0.227142333984375, 0.2390899658203125, 0.25103759765625, 0.2629852294921875, 0.274932861328125, 0.2868804931640625, 0.298828125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 2.0, 5.0, 5.0, 9.0, 17.0, 14.0, 23.0, 34.0, 45.0, 62.0, 70.0, 99.0, 106.0, 121.0, 83.0, 79.0, 57.0, 34.0, 29.0, 25.0, 9.0, 7.0, 10.0, 7.0, 9.0, 6.0, 8.0, 3.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.9981136322021484e-05, -2.8857029974460602e-05, -2.773292362689972e-05, -2.6608817279338837e-05, -2.5484710931777954e-05, -2.436060458421707e-05, -2.323649823665619e-05, -2.2112391889095306e-05, -2.0988285541534424e-05, -1.986417919397354e-05, -1.874007284641266e-05, -1.7615966498851776e-05, -1.6491860151290894e-05, -1.536775380373001e-05, -1.4243647456169128e-05, -1.3119541108608246e-05, -1.1995434761047363e-05, -1.087132841348648e-05, -9.747222065925598e-06, -8.623115718364716e-06, -7.499009370803833e-06, -6.3749030232429504e-06, -5.250796675682068e-06, -4.126690328121185e-06, -3.0025839805603027e-06, -1.8784776329994202e-06, -7.543712854385376e-07, 3.6973506212234497e-07, 1.4938414096832275e-06, 2.61794775724411e-06, 3.7420541048049927e-06, 4.866160452365875e-06, 5.990266799926758e-06, 7.11437314748764e-06, 8.238479495048523e-06, 9.362585842609406e-06, 1.0486692190170288e-05, 1.161079853773117e-05, 1.2734904885292053e-05, 1.3859011232852936e-05, 1.4983117580413818e-05, 1.61072239279747e-05, 1.7231330275535583e-05, 1.8355436623096466e-05, 1.947954297065735e-05, 2.060364931821823e-05, 2.1727755665779114e-05, 2.2851862013339996e-05, 2.397596836090088e-05, 2.510007470846176e-05, 2.6224181056022644e-05, 2.7348287403583527e-05, 2.847239375114441e-05, 2.9596500098705292e-05, 3.0720606446266174e-05, 3.184471279382706e-05, 3.296881914138794e-05, 3.409292548894882e-05, 3.5217031836509705e-05, 3.634113818407059e-05, 3.746524453163147e-05, 3.858935087919235e-05, 3.9713457226753235e-05, 4.083756357431412e-05, 4.1961669921875e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 10.0, 12.0, 28.0, 34.0, 50.0, 107.0, 208.0, 500.0, 1401.0, 5130.0, 38540.0, 842549.0, 145093.0, 10940.0, 2487.0, 795.0, 344.0, 126.0, 69.0, 42.0, 16.0, 15.0, 14.0, 8.0, 9.0, 5.0, 6.0, 2.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09271240234375, -0.08987712860107422, -0.08704185485839844, -0.08420658111572266, -0.08137130737304688, -0.0785360336303711, -0.07570075988769531, -0.07286548614501953, -0.07003021240234375, -0.06719493865966797, -0.06435966491699219, -0.061524391174316406, -0.058689117431640625, -0.055853843688964844, -0.05301856994628906, -0.05018329620361328, -0.0473480224609375, -0.04451274871826172, -0.04167747497558594, -0.038842201232910156, -0.036006927490234375, -0.033171653747558594, -0.030336380004882812, -0.02750110626220703, -0.02466583251953125, -0.02183055877685547, -0.018995285034179688, -0.016160011291503906, -0.013324737548828125, -0.010489463806152344, -0.0076541900634765625, -0.004818916320800781, -0.001983642578125, 0.0008516311645507812, 0.0036869049072265625, 0.006522178649902344, 0.009357452392578125, 0.012192726135253906, 0.015027999877929688, 0.01786327362060547, 0.02069854736328125, 0.02353382110595703, 0.026369094848632812, 0.029204368591308594, 0.032039642333984375, 0.034874916076660156, 0.03771018981933594, 0.04054546356201172, 0.0433807373046875, 0.04621601104736328, 0.04905128479003906, 0.051886558532714844, 0.054721832275390625, 0.057557106018066406, 0.06039237976074219, 0.06322765350341797, 0.06606292724609375, 0.06889820098876953, 0.07173347473144531, 0.0745687484741211, 0.07740402221679688, 0.08023929595947266, 0.08307456970214844, 0.08590984344482422, 0.0887451171875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 8.0, 6.0, 10.0, 16.0, 25.0, 41.0, 67.0, 124.0, 133.0, 173.0, 160.0, 93.0, 51.0, 26.0, 16.0, 12.0, 8.0, 8.0, 4.0, 1.0, 2.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.057373046875, -0.05559873580932617, -0.053824424743652344, -0.052050113677978516, -0.05027580261230469, -0.04850149154663086, -0.04672718048095703, -0.0449528694152832, -0.043178558349609375, -0.04140424728393555, -0.03962993621826172, -0.03785562515258789, -0.03608131408691406, -0.034307003021240234, -0.032532691955566406, -0.030758380889892578, -0.02898406982421875, -0.027209758758544922, -0.025435447692871094, -0.023661136627197266, -0.021886825561523438, -0.02011251449584961, -0.01833820343017578, -0.016563892364501953, -0.014789581298828125, -0.013015270233154297, -0.011240959167480469, -0.00946664810180664, -0.0076923370361328125, -0.005918025970458984, -0.004143714904785156, -0.002369403839111328, -0.0005950927734375, 0.0011792182922363281, 0.0029535293579101562, 0.004727840423583984, 0.0065021514892578125, 0.00827646255493164, 0.010050773620605469, 0.011825084686279297, 0.013599395751953125, 0.015373706817626953, 0.01714801788330078, 0.01892232894897461, 0.020696640014648438, 0.022470951080322266, 0.024245262145996094, 0.026019573211669922, 0.02779388427734375, 0.029568195343017578, 0.031342506408691406, 0.033116817474365234, 0.03489112854003906, 0.03666543960571289, 0.03843975067138672, 0.04021406173706055, 0.041988372802734375, 0.0437626838684082, 0.04553699493408203, 0.04731130599975586, 0.04908561706542969, 0.050859928131103516, 0.052634239196777344, 0.05440855026245117, 0.056182861328125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 7.0, 16.0, 218.0, 732.0, 32.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35238611698150635, -0.2851608991622925, -0.21793566644191742, -0.15071043372154236, -0.08348521590232849, -0.016259998083114624, 0.05096524953842163, 0.1181904673576355, 0.18541568517684937, 0.25264090299606323, 0.3198661208152771, 0.38709136843681335, 0.4543165862560272, 0.5215418338775635, 0.5887670516967773, 0.6559922695159912, 0.7232174873352051, 0.790442705154419, 0.8576679229736328, 0.9248931407928467, 0.9921183586120605, 1.0593435764312744, 1.1265687942504883, 1.1937940120697021, 1.261019229888916, 1.3282444477081299, 1.3954696655273438, 1.4626948833465576, 1.5299201011657715, 1.5971453189849854, 1.6643705368041992, 1.731595754623413, 1.798821210861206, 1.86604642868042, 1.9332716464996338, 2.0004968643188477, 2.0677220821380615, 2.1349472999572754, 2.2021725177764893, 2.269397735595703, 2.336622953414917, 2.403848171234131, 2.4710733890533447, 2.5382986068725586, 2.6055238246917725, 2.6727490425109863, 2.7399742603302, 2.807199478149414, 2.874424934387207, 2.941650152206421, 3.0088753700256348, 3.0761005878448486, 3.1433258056640625, 3.2105510234832764, 3.2777762413024902, 3.345001459121704, 3.412226676940918, 3.479451894760132, 3.5466771125793457, 3.6139023303985596, 3.6811275482177734, 3.7483527660369873, 3.815577983856201, 3.882803201675415, 3.950028419494629]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 1.0, 8.0, 10.0, 12.0, 8.0, 8.0, 9.0, 14.0, 15.0, 27.0, 33.0, 42.0, 52.0, 51.0, 66.0, 54.0, 72.0, 65.0, 71.0, 65.0, 46.0, 46.0, 40.0, 26.0, 38.0, 22.0, 18.0, 15.0, 20.0, 8.0, 4.0, 8.0, 4.0, 3.0, 3.0, 6.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4513883590698242, -0.4379616677761078, -0.42453497648239136, -0.41110825538635254, -0.3976815640926361, -0.3842548727989197, -0.37082818150520325, -0.3574014902114868, -0.343974769115448, -0.33054807782173157, -0.31712138652801514, -0.3036946654319763, -0.2902679741382599, -0.27684128284454346, -0.263414591550827, -0.2499879002571106, -0.23656120896339417, -0.22313451766967773, -0.2097078114748001, -0.19628112018108368, -0.18285441398620605, -0.16942772269248962, -0.1560010313987732, -0.14257434010505676, -0.12914763391017914, -0.11572093516588211, -0.10229423642158508, -0.08886754512786865, -0.07544084638357162, -0.0620141476392746, -0.048587456345558167, -0.03516075760126114, -0.02173405885696411, -0.008307361975312233, 0.005119334906339645, 0.018546029925346375, 0.0319727286696434, 0.04539942741394043, 0.05882611870765686, 0.07225281745195389, 0.08567951619625092, 0.09910621494054794, 0.11253291368484497, 0.1259596049785614, 0.13938629627227783, 0.15281300246715546, 0.1662396937608719, 0.1796663999557495, 0.19309309124946594, 0.20651978254318237, 0.21994648873806, 0.23337318003177643, 0.24679988622665405, 0.2602265775203705, 0.2736532688140869, 0.28707996010780334, 0.3005066514015198, 0.3139333426952362, 0.32736003398895264, 0.34078675508499146, 0.3542134463787079, 0.3676401376724243, 0.38106682896614075, 0.3944935202598572, 0.407920241355896]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 4.0, 7.0, 3.0, 5.0, 16.0, 8.0, 10.0, 21.0, 20.0, 32.0, 27.0, 32.0, 54.0, 68.0, 98.0, 127.0, 183.0, 271.0, 384.0, 625.0, 812.0, 1244.0, 1796.0, 2898.0, 4701.0, 9240.0, 24348.0, 138289.0, 3877231.0, 90253.0, 20420.0, 8250.0, 4348.0, 2699.0, 1789.0, 1113.0, 819.0, 584.0, 411.0, 331.0, 211.0, 144.0, 113.0, 72.0, 63.0, 37.0, 29.0, 20.0, 13.0, 6.0, 6.0, 2.0, 2.0, 1.0], "bins": [-0.177734375, -0.17310714721679688, -0.16847991943359375, -0.16385269165039062, -0.1592254638671875, -0.15459823608398438, -0.14997100830078125, -0.14534378051757812, -0.140716552734375, -0.13608932495117188, -0.13146209716796875, -0.12683486938476562, -0.1222076416015625, -0.11758041381835938, -0.11295318603515625, -0.10832595825195312, -0.10369873046875, -0.09907150268554688, -0.09444427490234375, -0.08981704711914062, -0.0851898193359375, -0.08056259155273438, -0.07593536376953125, -0.07130813598632812, -0.066680908203125, -0.062053680419921875, -0.05742645263671875, -0.052799224853515625, -0.0481719970703125, -0.043544769287109375, -0.03891754150390625, -0.034290313720703125, -0.0296630859375, -0.025035858154296875, -0.02040863037109375, -0.015781402587890625, -0.0111541748046875, -0.006526947021484375, -0.00189971923828125, 0.002727508544921875, 0.007354736328125, 0.011981964111328125, 0.01660919189453125, 0.021236419677734375, 0.0258636474609375, 0.030490875244140625, 0.03511810302734375, 0.039745330810546875, 0.04437255859375, 0.048999786376953125, 0.05362701416015625, 0.058254241943359375, 0.0628814697265625, 0.06750869750976562, 0.07213592529296875, 0.07676315307617188, 0.081390380859375, 0.08601760864257812, 0.09064483642578125, 0.09527206420898438, 0.0998992919921875, 0.10452651977539062, 0.10915374755859375, 0.11378097534179688, 0.118408203125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 3.0, 6.0, 12.0, 11.0, 17.0, 19.0, 13.0, 18.0, 32.0, 39.0, 66.0, 82.0, 137.0, 142.0, 121.0, 63.0, 51.0, 42.0, 15.0, 20.0, 17.0, 13.0, 19.0, 5.0, 8.0, 5.0, 6.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0], "bins": [-0.0209197998046875, -0.020386576652526855, -0.01985335350036621, -0.019320130348205566, -0.018786907196044922, -0.018253684043884277, -0.017720460891723633, -0.01718723773956299, -0.016654014587402344, -0.0161207914352417, -0.015587568283081055, -0.01505434513092041, -0.014521121978759766, -0.013987898826599121, -0.013454675674438477, -0.012921452522277832, -0.012388229370117188, -0.011855006217956543, -0.011321783065795898, -0.010788559913635254, -0.01025533676147461, -0.009722113609313965, -0.00918889045715332, -0.008655667304992676, -0.008122444152832031, -0.007589221000671387, -0.007055997848510742, -0.006522774696350098, -0.005989551544189453, -0.005456328392028809, -0.004923105239868164, -0.0043898820877075195, -0.003856658935546875, -0.0033234357833862305, -0.002790212631225586, -0.0022569894790649414, -0.0017237663269042969, -0.0011905431747436523, -0.0006573200225830078, -0.00012409687042236328, 0.00040912628173828125, 0.0009423494338989258, 0.0014755725860595703, 0.002008795738220215, 0.0025420188903808594, 0.003075242042541504, 0.0036084651947021484, 0.004141688346862793, 0.0046749114990234375, 0.005208134651184082, 0.0057413578033447266, 0.006274580955505371, 0.006807804107666016, 0.00734102725982666, 0.007874250411987305, 0.00840747356414795, 0.008940696716308594, 0.009473919868469238, 0.010007143020629883, 0.010540366172790527, 0.011073589324951172, 0.011606812477111816, 0.012140035629272461, 0.012673258781433105, 0.01320648193359375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 5.0, 12.0, 12.0, 14.0, 15.0, 40.0, 53.0, 90.0, 164.0, 324.0, 812.0, 2214.0, 6765.0, 23959.0, 154203.0, 3821972.0, 149177.0, 23828.0, 6628.0, 2308.0, 871.0, 334.0, 181.0, 85.0, 62.0, 40.0, 27.0, 20.0, 14.0, 12.0, 11.0, 5.0, 10.0, 2.0, 5.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1544189453125, -0.1493549346923828, -0.14429092407226562, -0.13922691345214844, -0.13416290283203125, -0.12909889221191406, -0.12403488159179688, -0.11897087097167969, -0.1139068603515625, -0.10884284973144531, -0.10377883911132812, -0.09871482849121094, -0.09365081787109375, -0.08858680725097656, -0.08352279663085938, -0.07845878601074219, -0.073394775390625, -0.06833076477050781, -0.06326675415039062, -0.05820274353027344, -0.05313873291015625, -0.04807472229003906, -0.043010711669921875, -0.03794670104980469, -0.0328826904296875, -0.027818679809570312, -0.022754669189453125, -0.017690658569335938, -0.01262664794921875, -0.0075626373291015625, -0.002498626708984375, 0.0025653839111328125, 0.00762939453125, 0.012693405151367188, 0.017757415771484375, 0.022821426391601562, 0.02788543701171875, 0.03294944763183594, 0.038013458251953125, 0.04307746887207031, 0.0481414794921875, 0.05320549011230469, 0.058269500732421875, 0.06333351135253906, 0.06839752197265625, 0.07346153259277344, 0.07852554321289062, 0.08358955383300781, 0.088653564453125, 0.09371757507324219, 0.09878158569335938, 0.10384559631347656, 0.10890960693359375, 0.11397361755371094, 0.11903762817382812, 0.12410163879394531, 0.1291656494140625, 0.1342296600341797, 0.13929367065429688, 0.14435768127441406, 0.14942169189453125, 0.15448570251464844, 0.15954971313476562, 0.1646137237548828, 0.169677734375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 4.0, 4.0, 3.0, 6.0, 7.0, 4.0, 9.0, 14.0, 10.0, 19.0, 33.0, 33.0, 45.0, 71.0, 105.0, 177.0, 409.0, 1784.0, 655.0, 231.0, 126.0, 98.0, 52.0, 33.0, 28.0, 24.0, 15.0, 19.0, 12.0, 7.0, 8.0, 4.0, 8.0, 2.0, 0.0, 3.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0160675048828125, -0.015443563461303711, -0.014819622039794922, -0.014195680618286133, -0.013571739196777344, -0.012947797775268555, -0.012323856353759766, -0.011699914932250977, -0.011075973510742188, -0.010452032089233398, -0.00982809066772461, -0.00920414924621582, -0.008580207824707031, -0.007956266403198242, -0.007332324981689453, -0.006708383560180664, -0.006084442138671875, -0.005460500717163086, -0.004836559295654297, -0.004212617874145508, -0.0035886764526367188, -0.0029647350311279297, -0.0023407936096191406, -0.0017168521881103516, -0.0010929107666015625, -0.00046896934509277344, 0.00015497207641601562, 0.0007789134979248047, 0.0014028549194335938, 0.002026796340942383, 0.002650737762451172, 0.003274679183959961, 0.00389862060546875, 0.004522562026977539, 0.005146503448486328, 0.005770444869995117, 0.006394386291503906, 0.007018327713012695, 0.007642269134521484, 0.008266210556030273, 0.008890151977539062, 0.009514093399047852, 0.01013803482055664, 0.01076197624206543, 0.011385917663574219, 0.012009859085083008, 0.012633800506591797, 0.013257741928100586, 0.013881683349609375, 0.014505624771118164, 0.015129566192626953, 0.015753507614135742, 0.01637744903564453, 0.01700139045715332, 0.01762533187866211, 0.0182492733001709, 0.018873214721679688, 0.019497156143188477, 0.020121097564697266, 0.020745038986206055, 0.021368980407714844, 0.021992921829223633, 0.022616863250732422, 0.02324080467224121, 0.02386474609375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 10.0, 34.0, 172.0, 427.0, 293.0, 55.0, 15.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16836299002170563, -0.1582910716533661, -0.14821913838386536, -0.13814722001552582, -0.12807530164718628, -0.11800337582826614, -0.10793145000934601, -0.09785953164100647, -0.08778760582208633, -0.0777156800031662, -0.06764376163482666, -0.057571835815906525, -0.04749991372227669, -0.03742799162864685, -0.027356065809726715, -0.017284147441387177, -0.007212221622467041, 0.0028597014024853706, 0.012931624427437782, 0.02300354838371277, 0.033075470477342606, 0.04314739257097244, 0.05321931838989258, 0.06329123675823212, 0.07336316257715225, 0.08343508839607239, 0.09350700676441193, 0.10357893258333206, 0.1136508584022522, 0.12372277677059174, 0.13379469513893127, 0.143866628408432, 0.15393856167793274, 0.16401048004627228, 0.174082413315773, 0.18415433168411255, 0.1942262500524521, 0.20429816842079163, 0.21437010169029236, 0.2244420200586319, 0.23451393842697144, 0.24458585679531097, 0.2546577751636505, 0.26472970843315125, 0.274801641702652, 0.2848735451698303, 0.29494547843933105, 0.3050174117088318, 0.3150893449783325, 0.32516127824783325, 0.3352331817150116, 0.34530511498451233, 0.35537704825401306, 0.3654489517211914, 0.37552088499069214, 0.38559281826019287, 0.3956647217273712, 0.40573665499687195, 0.4158085584640503, 0.425880491733551, 0.43595242500305176, 0.4460243284702301, 0.45609626173973083, 0.4661681652069092, 0.4762400984764099]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 4.0, 3.0, 7.0, 7.0, 13.0, 18.0, 21.0, 22.0, 31.0, 39.0, 51.0, 63.0, 65.0, 58.0, 73.0, 63.0, 56.0, 56.0, 49.0, 64.0, 50.0, 46.0, 32.0, 34.0, 20.0, 18.0, 14.0, 7.0, 7.0, 6.0, 7.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09539002180099487, -0.0922093614935875, -0.08902870118618011, -0.08584803342819214, -0.08266737312078476, -0.07948671281337738, -0.0763060450553894, -0.07312538474798203, -0.06994472444057465, -0.06676406413316727, -0.06358340382575989, -0.06040273606777191, -0.05722207576036453, -0.05404141545295715, -0.050860751420259476, -0.0476800873875618, -0.04449942708015442, -0.04131876677274704, -0.03813810274004936, -0.034957438707351685, -0.031776778399944305, -0.028596116229891777, -0.02541545405983925, -0.02223479188978672, -0.019054129719734192, -0.015873467549681664, -0.012692805379629135, -0.009512143209576607, -0.006331481039524078, -0.00315081886947155, 2.9843300580978394e-05, 0.0032105054706335068, 0.006391167640686035, 0.009571829810738564, 0.012752491980791092, 0.01593315415084362, 0.01911381632089615, 0.022294478490948677, 0.025475140661001205, 0.028655802831053734, 0.03183646500110626, 0.03501712530851364, 0.03819778934121132, 0.041378453373909, 0.044559113681316376, 0.047739773988723755, 0.05092043802142143, 0.05410110205411911, 0.05728176236152649, 0.06046242266893387, 0.06364308297634125, 0.06682375073432922, 0.0700044110417366, 0.07318507134914398, 0.07636573910713196, 0.07954639941453934, 0.08272705972194672, 0.0859077200293541, 0.08908838033676147, 0.09226904809474945, 0.09544970840215683, 0.09863036870956421, 0.10181103646755219, 0.10499169677495956, 0.10817235708236694]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 10.0, 7.0, 14.0, 10.0, 24.0, 31.0, 44.0, 100.0, 136.0, 260.0, 431.0, 825.0, 1566.0, 3212.0, 7147.0, 16761.0, 49290.0, 237241.0, 586675.0, 96747.0, 27796.0, 10757.0, 4669.0, 2228.0, 1197.0, 585.0, 298.0, 184.0, 101.0, 78.0, 46.0, 22.0, 23.0, 18.0, 10.0, 4.0, 7.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1180419921875, -0.11413955688476562, -0.11023712158203125, -0.10633468627929688, -0.1024322509765625, -0.09852981567382812, -0.09462738037109375, -0.09072494506835938, -0.086822509765625, -0.08292007446289062, -0.07901763916015625, -0.07511520385742188, -0.0712127685546875, -0.06731033325195312, -0.06340789794921875, -0.059505462646484375, -0.05560302734375, -0.051700592041015625, -0.04779815673828125, -0.043895721435546875, -0.0399932861328125, -0.036090850830078125, -0.03218841552734375, -0.028285980224609375, -0.024383544921875, -0.020481109619140625, -0.01657867431640625, -0.012676239013671875, -0.0087738037109375, -0.004871368408203125, -0.00096893310546875, 0.002933502197265625, 0.0068359375, 0.010738372802734375, 0.01464080810546875, 0.018543243408203125, 0.0224456787109375, 0.026348114013671875, 0.03025054931640625, 0.034152984619140625, 0.038055419921875, 0.041957855224609375, 0.04586029052734375, 0.049762725830078125, 0.0536651611328125, 0.057567596435546875, 0.06147003173828125, 0.06537246704101562, 0.06927490234375, 0.07317733764648438, 0.07707977294921875, 0.08098220825195312, 0.0848846435546875, 0.08878707885742188, 0.09268951416015625, 0.09659194946289062, 0.100494384765625, 0.10439682006835938, 0.10829925537109375, 0.11220169067382812, 0.1161041259765625, 0.12000656127929688, 0.12390899658203125, 0.12781143188476562, 0.1317138671875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 3.0, 0.0, 10.0, 9.0, 3.0, 13.0, 14.0, 20.0, 15.0, 27.0, 23.0, 50.0, 71.0, 94.0, 134.0, 139.0, 105.0, 61.0, 55.0, 35.0, 25.0, 17.0, 16.0, 15.0, 9.0, 8.0, 5.0, 1.0, 7.0, 6.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 1.0], "bins": [-0.020599365234375, -0.02008509635925293, -0.01957082748413086, -0.01905655860900879, -0.01854228973388672, -0.01802802085876465, -0.017513751983642578, -0.016999483108520508, -0.016485214233398438, -0.015970945358276367, -0.015456676483154297, -0.014942407608032227, -0.014428138732910156, -0.013913869857788086, -0.013399600982666016, -0.012885332107543945, -0.012371063232421875, -0.011856794357299805, -0.011342525482177734, -0.010828256607055664, -0.010313987731933594, -0.009799718856811523, -0.009285449981689453, -0.008771181106567383, -0.008256912231445312, -0.007742643356323242, -0.007228374481201172, -0.0067141056060791016, -0.006199836730957031, -0.005685567855834961, -0.005171298980712891, -0.00465703010559082, -0.00414276123046875, -0.0036284923553466797, -0.0031142234802246094, -0.002599954605102539, -0.0020856857299804688, -0.0015714168548583984, -0.0010571479797363281, -0.0005428791046142578, -2.86102294921875e-05, 0.0004856586456298828, 0.0009999275207519531, 0.0015141963958740234, 0.0020284652709960938, 0.002542734146118164, 0.0030570030212402344, 0.0035712718963623047, 0.004085540771484375, 0.004599809646606445, 0.005114078521728516, 0.005628347396850586, 0.006142616271972656, 0.0066568851470947266, 0.007171154022216797, 0.007685422897338867, 0.008199691772460938, 0.008713960647583008, 0.009228229522705078, 0.009742498397827148, 0.010256767272949219, 0.010771036148071289, 0.01128530502319336, 0.01179957389831543, 0.0123138427734375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 4.0, 5.0, 9.0, 8.0, 14.0, 16.0, 27.0, 32.0, 40.0, 62.0, 93.0, 131.0, 194.0, 302.0, 507.0, 1090.0, 2809.0, 10933.0, 65724.0, 488951.0, 411494.0, 52188.0, 9158.0, 2410.0, 992.0, 501.0, 289.0, 177.0, 118.0, 82.0, 54.0, 36.0, 31.0, 23.0, 16.0, 6.0, 8.0, 6.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.15234375, -0.1478557586669922, -0.14336776733398438, -0.13887977600097656, -0.13439178466796875, -0.12990379333496094, -0.12541580200195312, -0.12092781066894531, -0.1164398193359375, -0.11195182800292969, -0.10746383666992188, -0.10297584533691406, -0.09848785400390625, -0.09399986267089844, -0.08951187133789062, -0.08502388000488281, -0.080535888671875, -0.07604789733886719, -0.07155990600585938, -0.06707191467285156, -0.06258392333984375, -0.05809593200683594, -0.053607940673828125, -0.04911994934082031, -0.0446319580078125, -0.04014396667480469, -0.035655975341796875, -0.031167984008789062, -0.02667999267578125, -0.022192001342773438, -0.017704010009765625, -0.013216018676757812, -0.00872802734375, -0.0042400360107421875, 0.000247955322265625, 0.0047359466552734375, 0.00922393798828125, 0.013711929321289062, 0.018199920654296875, 0.022687911987304688, 0.0271759033203125, 0.03166389465332031, 0.036151885986328125, 0.04063987731933594, 0.04512786865234375, 0.04961585998535156, 0.054103851318359375, 0.05859184265136719, 0.063079833984375, 0.06756782531738281, 0.07205581665039062, 0.07654380798339844, 0.08103179931640625, 0.08551979064941406, 0.09000778198242188, 0.09449577331542969, 0.0989837646484375, 0.10347175598144531, 0.10795974731445312, 0.11244773864746094, 0.11693572998046875, 0.12142372131347656, 0.12591171264648438, 0.1303997039794922, 0.1348876953125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 3.0, 6.0, 5.0, 11.0, 8.0, 22.0, 19.0, 14.0, 20.0, 23.0, 23.0, 30.0, 24.0, 36.0, 33.0, 32.0, 49.0, 42.0, 52.0, 54.0, 46.0, 46.0, 51.0, 42.0, 37.0, 40.0, 38.0, 28.0, 23.0, 20.0, 30.0, 13.0, 15.0, 16.0, 13.0, 11.0, 8.0, 2.0, 6.0, 3.0, 4.0, 1.0, 4.0, 2.0, 0.0, 2.0, 3.0], "bins": [-0.07135009765625, -0.06942319869995117, -0.06749629974365234, -0.06556940078735352, -0.06364250183105469, -0.06171560287475586, -0.05978870391845703, -0.0578618049621582, -0.055934906005859375, -0.05400800704956055, -0.05208110809326172, -0.05015420913696289, -0.04822731018066406, -0.046300411224365234, -0.044373512268066406, -0.04244661331176758, -0.04051971435546875, -0.03859281539916992, -0.036665916442871094, -0.034739017486572266, -0.03281211853027344, -0.03088521957397461, -0.02895832061767578, -0.027031421661376953, -0.025104522705078125, -0.023177623748779297, -0.02125072479248047, -0.01932382583618164, -0.017396926879882812, -0.015470027923583984, -0.013543128967285156, -0.011616230010986328, -0.0096893310546875, -0.007762432098388672, -0.005835533142089844, -0.003908634185791016, -0.0019817352294921875, -5.4836273193359375e-05, 0.0018720626831054688, 0.003798961639404297, 0.005725860595703125, 0.007652759552001953, 0.009579658508300781, 0.01150655746459961, 0.013433456420898438, 0.015360355377197266, 0.017287254333496094, 0.019214153289794922, 0.02114105224609375, 0.023067951202392578, 0.024994850158691406, 0.026921749114990234, 0.028848648071289062, 0.03077554702758789, 0.03270244598388672, 0.03462934494018555, 0.036556243896484375, 0.0384831428527832, 0.04041004180908203, 0.04233694076538086, 0.04426383972167969, 0.046190738677978516, 0.048117637634277344, 0.05004453659057617, 0.051971435546875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 7.0, 7.0, 11.0, 16.0, 17.0, 47.0, 58.0, 105.0, 189.0, 293.0, 572.0, 1078.0, 2560.0, 6471.0, 19806.0, 83520.0, 416245.0, 405727.0, 81352.0, 19358.0, 6170.0, 2419.0, 1159.0, 622.0, 289.0, 172.0, 103.0, 67.0, 40.0, 34.0, 16.0, 13.0, 7.0, 3.0, 5.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.053375244140625, -0.05165290832519531, -0.049930572509765625, -0.04820823669433594, -0.04648590087890625, -0.04476356506347656, -0.043041229248046875, -0.04131889343261719, -0.0395965576171875, -0.03787422180175781, -0.036151885986328125, -0.03442955017089844, -0.03270721435546875, -0.030984878540039062, -0.029262542724609375, -0.027540206909179688, -0.02581787109375, -0.024095535278320312, -0.022373199462890625, -0.020650863647460938, -0.01892852783203125, -0.017206192016601562, -0.015483856201171875, -0.013761520385742188, -0.0120391845703125, -0.010316848754882812, -0.008594512939453125, -0.0068721771240234375, -0.00514984130859375, -0.0034275054931640625, -0.001705169677734375, 1.71661376953125e-05, 0.001739501953125, 0.0034618377685546875, 0.005184173583984375, 0.0069065093994140625, 0.00862884521484375, 0.010351181030273438, 0.012073516845703125, 0.013795852661132812, 0.0155181884765625, 0.017240524291992188, 0.018962860107421875, 0.020685195922851562, 0.02240753173828125, 0.024129867553710938, 0.025852203369140625, 0.027574539184570312, 0.029296875, 0.031019210815429688, 0.032741546630859375, 0.03446388244628906, 0.03618621826171875, 0.03790855407714844, 0.039630889892578125, 0.04135322570800781, 0.0430755615234375, 0.04479789733886719, 0.046520233154296875, 0.04824256896972656, 0.04996490478515625, 0.05168724060058594, 0.053409576416015625, 0.05513191223144531, 0.056854248046875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 1.0, 8.0, 11.0, 6.0, 8.0, 14.0, 14.0, 21.0, 33.0, 31.0, 31.0, 58.0, 51.0, 67.0, 83.0, 92.0, 70.0, 63.0, 61.0, 59.0, 43.0, 31.0, 22.0, 21.0, 29.0, 10.0, 16.0, 13.0, 10.0, 5.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.695487976074219e-05, -3.566499799489975e-05, -3.437511622905731e-05, -3.3085234463214874e-05, -3.1795352697372437e-05, -3.050547093153e-05, -2.921558916568756e-05, -2.7925707399845123e-05, -2.6635825634002686e-05, -2.5345943868160248e-05, -2.405606210231781e-05, -2.2766180336475372e-05, -2.1476298570632935e-05, -2.0186416804790497e-05, -1.889653503894806e-05, -1.760665327310562e-05, -1.6316771507263184e-05, -1.5026889741420746e-05, -1.3737007975578308e-05, -1.244712620973587e-05, -1.1157244443893433e-05, -9.867362678050995e-06, -8.577480912208557e-06, -7.287599146366119e-06, -5.997717380523682e-06, -4.707835614681244e-06, -3.417953848838806e-06, -2.1280720829963684e-06, -8.381903171539307e-07, 4.516914486885071e-07, 1.7415732145309448e-06, 3.0314549803733826e-06, 4.32133674621582e-06, 5.611218512058258e-06, 6.901100277900696e-06, 8.190982043743134e-06, 9.480863809585571e-06, 1.0770745575428009e-05, 1.2060627341270447e-05, 1.3350509107112885e-05, 1.4640390872955322e-05, 1.593027263879776e-05, 1.7220154404640198e-05, 1.8510036170482635e-05, 1.9799917936325073e-05, 2.108979970216751e-05, 2.237968146800995e-05, 2.3669563233852386e-05, 2.4959444999694824e-05, 2.6249326765537262e-05, 2.75392085313797e-05, 2.8829090297222137e-05, 3.0118972063064575e-05, 3.140885382890701e-05, 3.269873559474945e-05, 3.398861736059189e-05, 3.5278499126434326e-05, 3.6568380892276764e-05, 3.78582626581192e-05, 3.914814442396164e-05, 4.043802618980408e-05, 4.1727907955646515e-05, 4.301778972148895e-05, 4.430767148733139e-05, 4.559755325317383e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 6.0, 10.0, 9.0, 5.0, 11.0, 7.0, 16.0, 15.0, 27.0, 40.0, 42.0, 63.0, 104.0, 171.0, 309.0, 561.0, 1307.0, 3230.0, 10499.0, 53923.0, 452268.0, 454746.0, 54635.0, 10617.0, 3308.0, 1267.0, 543.0, 276.0, 169.0, 103.0, 60.0, 66.0, 28.0, 29.0, 28.0, 14.0, 12.0, 9.0, 3.0, 7.0, 4.0, 0.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.07867431640625, -0.07648897171020508, -0.07430362701416016, -0.07211828231811523, -0.06993293762207031, -0.06774759292602539, -0.06556224822998047, -0.06337690353393555, -0.061191558837890625, -0.0590062141418457, -0.05682086944580078, -0.05463552474975586, -0.05245018005371094, -0.050264835357666016, -0.048079490661621094, -0.04589414596557617, -0.04370880126953125, -0.04152345657348633, -0.039338111877441406, -0.037152767181396484, -0.03496742248535156, -0.03278207778930664, -0.03059673309326172, -0.028411388397216797, -0.026226043701171875, -0.024040699005126953, -0.02185535430908203, -0.01967000961303711, -0.017484664916992188, -0.015299320220947266, -0.013113975524902344, -0.010928630828857422, -0.0087432861328125, -0.006557941436767578, -0.004372596740722656, -0.0021872520446777344, -1.9073486328125e-06, 0.0021834373474121094, 0.004368782043457031, 0.006554126739501953, 0.008739471435546875, 0.010924816131591797, 0.013110160827636719, 0.01529550552368164, 0.017480850219726562, 0.019666194915771484, 0.021851539611816406, 0.024036884307861328, 0.02622222900390625, 0.028407573699951172, 0.030592918395996094, 0.032778263092041016, 0.03496360778808594, 0.03714895248413086, 0.03933429718017578, 0.0415196418762207, 0.043704986572265625, 0.04589033126831055, 0.04807567596435547, 0.05026102066040039, 0.05244636535644531, 0.054631710052490234, 0.056817054748535156, 0.05900239944458008, 0.061187744140625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 4.0, 4.0, 3.0, 9.0, 11.0, 10.0, 17.0, 23.0, 16.0, 29.0, 31.0, 44.0, 55.0, 60.0, 52.0, 79.0, 77.0, 69.0, 67.0, 62.0, 42.0, 44.0, 40.0, 31.0, 22.0, 20.0, 18.0, 12.0, 8.0, 12.0, 7.0, 6.0, 5.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03155517578125, -0.030637025833129883, -0.029718875885009766, -0.02880072593688965, -0.02788257598876953, -0.026964426040649414, -0.026046276092529297, -0.02512812614440918, -0.024209976196289062, -0.023291826248168945, -0.022373676300048828, -0.02145552635192871, -0.020537376403808594, -0.019619226455688477, -0.01870107650756836, -0.017782926559448242, -0.016864776611328125, -0.015946626663208008, -0.01502847671508789, -0.014110326766967773, -0.013192176818847656, -0.012274026870727539, -0.011355876922607422, -0.010437726974487305, -0.009519577026367188, -0.00860142707824707, -0.007683277130126953, -0.006765127182006836, -0.005846977233886719, -0.0049288272857666016, -0.004010677337646484, -0.003092527389526367, -0.00217437744140625, -0.0012562274932861328, -0.0003380775451660156, 0.0005800724029541016, 0.0014982223510742188, 0.002416372299194336, 0.003334522247314453, 0.00425267219543457, 0.0051708221435546875, 0.006088972091674805, 0.007007122039794922, 0.007925271987915039, 0.008843421936035156, 0.009761571884155273, 0.01067972183227539, 0.011597871780395508, 0.012516021728515625, 0.013434171676635742, 0.01435232162475586, 0.015270471572875977, 0.016188621520996094, 0.01710677146911621, 0.018024921417236328, 0.018943071365356445, 0.019861221313476562, 0.02077937126159668, 0.021697521209716797, 0.022615671157836914, 0.02353382110595703, 0.02445197105407715, 0.025370121002197266, 0.026288270950317383, 0.0272064208984375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 5.0, 4.0, 13.0, 30.0, 63.0, 119.0, 228.0, 246.0, 147.0, 82.0, 33.0, 17.0, 12.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0117350816726685, -0.9838110208511353, -0.955886960029602, -0.9279628396034241, -0.9000387787818909, -0.8721147179603577, -0.8441905975341797, -0.8162665367126465, -0.7883424758911133, -0.7604184150695801, -0.7324943542480469, -0.7045702338218689, -0.6766461730003357, -0.6487221121788025, -0.6207979917526245, -0.5928739309310913, -0.5649498701095581, -0.5370258092880249, -0.5091017484664917, -0.4811776280403137, -0.4532535672187805, -0.4253295063972473, -0.3974054157733917, -0.36948132514953613, -0.34155726432800293, -0.3136332035064697, -0.28570911288261414, -0.25778502225875854, -0.22986096143722534, -0.20193688571453094, -0.17401280999183655, -0.14608873426914215, -0.11816471815109253, -0.09024064242839813, -0.062316566705703735, -0.03439249098300934, -0.006468415260314941, 0.021455660462379456, 0.04937973618507385, 0.07730381190776825, 0.10522788763046265, 0.13315196335315704, 0.16107603907585144, 0.18900011479854584, 0.21692419052124023, 0.24484826624393463, 0.27277234196662903, 0.3006964325904846, 0.3286204934120178, 0.356544554233551, 0.3844686448574066, 0.4123927354812622, 0.4403167963027954, 0.4682408571243286, 0.4961649477481842, 0.5240890383720398, 0.552013099193573, 0.5799371600151062, 0.6078612804412842, 0.6357853412628174, 0.6637094020843506, 0.6916334629058838, 0.719557523727417, 0.747481644153595, 0.7754057049751282]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 7.0, 5.0, 8.0, 7.0, 16.0, 11.0, 25.0, 28.0, 32.0, 33.0, 36.0, 53.0, 48.0, 46.0, 57.0, 59.0, 67.0, 60.0, 60.0, 48.0, 53.0, 39.0, 41.0, 36.0, 24.0, 23.0, 24.0, 16.0, 11.0, 13.0, 9.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5634295344352722, -0.5459505319595337, -0.5284714698791504, -0.5109924674034119, -0.49351343512535095, -0.47603440284729004, -0.4585554003715515, -0.4410763680934906, -0.4235973358154297, -0.4061183035373688, -0.38863930106163025, -0.37116026878356934, -0.3536812365055084, -0.3362022042274475, -0.318723201751709, -0.30124416947364807, -0.28376516699790955, -0.26628613471984863, -0.2488071173429489, -0.2313280999660492, -0.21384906768798828, -0.19637005031108856, -0.17889103293418884, -0.16141200065612793, -0.1439329832792282, -0.1264539659023285, -0.10897493362426758, -0.09149591624736786, -0.07401689141988754, -0.05653786659240723, -0.03905884921550751, -0.02157982438802719, -0.004100799560546875, 0.013378223404288292, 0.03085724636912346, 0.04833626747131348, 0.06581529229879379, 0.08329431712627411, 0.10077333450317383, 0.11825235933065414, 0.13573138415813446, 0.15321040153503418, 0.1706894338130951, 0.1881684511899948, 0.20564746856689453, 0.22312650084495544, 0.24060551822185516, 0.2580845355987549, 0.2755635678768158, 0.2930426001548767, 0.31052160263061523, 0.32800063490867615, 0.34547966718673706, 0.3629586696624756, 0.3804377019405365, 0.3979167342185974, 0.41539573669433594, 0.43287476897239685, 0.4503537714481354, 0.4678328037261963, 0.4853118360042572, 0.5027908682823181, 0.5202698707580566, 0.5377488732337952, 0.5552279353141785]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 8.0, 10.0, 10.0, 16.0, 30.0, 28.0, 46.0, 87.0, 173.0, 345.0, 730.0, 2176.0, 9538.0, 133125.0, 4005801.0, 34736.0, 4867.0, 1424.0, 525.0, 241.0, 145.0, 75.0, 45.0, 27.0, 25.0, 7.0, 5.0, 11.0, 6.0, 1.0, 1.0, 4.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.417236328125, -0.406341552734375, -0.39544677734375, -0.384552001953125, -0.3736572265625, -0.362762451171875, -0.35186767578125, -0.340972900390625, -0.330078125, -0.319183349609375, -0.30828857421875, -0.297393798828125, -0.2864990234375, -0.275604248046875, -0.26470947265625, -0.253814697265625, -0.242919921875, -0.232025146484375, -0.22113037109375, -0.210235595703125, -0.1993408203125, -0.188446044921875, -0.17755126953125, -0.166656494140625, -0.15576171875, -0.144866943359375, -0.13397216796875, -0.123077392578125, -0.1121826171875, -0.101287841796875, -0.09039306640625, -0.079498291015625, -0.068603515625, -0.057708740234375, -0.04681396484375, -0.035919189453125, -0.0250244140625, -0.014129638671875, -0.00323486328125, 0.007659912109375, 0.0185546875, 0.029449462890625, 0.04034423828125, 0.051239013671875, 0.0621337890625, 0.073028564453125, 0.08392333984375, 0.094818115234375, 0.105712890625, 0.116607666015625, 0.12750244140625, 0.138397216796875, 0.1492919921875, 0.160186767578125, 0.17108154296875, 0.181976318359375, 0.19287109375, 0.203765869140625, 0.21466064453125, 0.225555419921875, 0.2364501953125, 0.247344970703125, 0.25823974609375, 0.269134521484375, 0.280029296875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 4.0, 5.0, 11.0, 7.0, 9.0, 21.0, 16.0, 21.0, 36.0, 32.0, 51.0, 60.0, 96.0, 77.0, 113.0, 91.0, 76.0, 75.0, 49.0, 25.0, 21.0, 22.0, 18.0, 18.0, 9.0, 3.0, 7.0, 5.0, 7.0, 3.0, 1.0, 0.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.0220184326171875, -0.021444082260131836, -0.020869731903076172, -0.020295381546020508, -0.019721031188964844, -0.01914668083190918, -0.018572330474853516, -0.01799798011779785, -0.017423629760742188, -0.016849279403686523, -0.01627492904663086, -0.015700578689575195, -0.015126228332519531, -0.014551877975463867, -0.013977527618408203, -0.013403177261352539, -0.012828826904296875, -0.012254476547241211, -0.011680126190185547, -0.011105775833129883, -0.010531425476074219, -0.009957075119018555, -0.00938272476196289, -0.008808374404907227, -0.008234024047851562, -0.0076596736907958984, -0.007085323333740234, -0.00651097297668457, -0.005936622619628906, -0.005362272262573242, -0.004787921905517578, -0.004213571548461914, -0.00363922119140625, -0.003064870834350586, -0.002490520477294922, -0.0019161701202392578, -0.0013418197631835938, -0.0007674694061279297, -0.00019311904907226562, 0.00038123130798339844, 0.0009555816650390625, 0.0015299320220947266, 0.0021042823791503906, 0.0026786327362060547, 0.0032529830932617188, 0.003827333450317383, 0.004401683807373047, 0.004976034164428711, 0.005550384521484375, 0.006124734878540039, 0.006699085235595703, 0.007273435592651367, 0.007847785949707031, 0.008422136306762695, 0.00899648666381836, 0.009570837020874023, 0.010145187377929688, 0.010719537734985352, 0.011293888092041016, 0.01186823844909668, 0.012442588806152344, 0.013016939163208008, 0.013591289520263672, 0.014165639877319336, 0.014739990234375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 6.0, 9.0, 15.0, 25.0, 34.0, 45.0, 122.0, 268.0, 700.0, 2117.0, 8458.0, 50179.0, 3128000.0, 955022.0, 39467.0, 7076.0, 1798.0, 491.0, 221.0, 96.0, 65.0, 32.0, 15.0, 7.0, 6.0, 8.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.280029296875, -0.27301788330078125, -0.2660064697265625, -0.25899505615234375, -0.251983642578125, -0.24497222900390625, -0.2379608154296875, -0.23094940185546875, -0.22393798828125, -0.21692657470703125, -0.2099151611328125, -0.20290374755859375, -0.195892333984375, -0.18888092041015625, -0.1818695068359375, -0.17485809326171875, -0.1678466796875, -0.16083526611328125, -0.1538238525390625, -0.14681243896484375, -0.139801025390625, -0.13278961181640625, -0.1257781982421875, -0.11876678466796875, -0.11175537109375, -0.10474395751953125, -0.0977325439453125, -0.09072113037109375, -0.083709716796875, -0.07669830322265625, -0.0696868896484375, -0.06267547607421875, -0.0556640625, -0.04865264892578125, -0.0416412353515625, -0.03462982177734375, -0.027618408203125, -0.02060699462890625, -0.0135955810546875, -0.00658416748046875, 0.00042724609375, 0.00743865966796875, 0.0144500732421875, 0.02146148681640625, 0.028472900390625, 0.03548431396484375, 0.0424957275390625, 0.04950714111328125, 0.0565185546875, 0.06352996826171875, 0.0705413818359375, 0.07755279541015625, 0.084564208984375, 0.09157562255859375, 0.0985870361328125, 0.10559844970703125, 0.11260986328125, 0.11962127685546875, 0.1266326904296875, 0.13364410400390625, 0.140655517578125, 0.14766693115234375, 0.1546783447265625, 0.16168975830078125, 0.168701171875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 3.0, 2.0, 3.0, 8.0, 11.0, 14.0, 9.0, 17.0, 20.0, 26.0, 41.0, 59.0, 81.0, 122.0, 261.0, 479.0, 1800.0, 469.0, 207.0, 126.0, 82.0, 67.0, 40.0, 22.0, 19.0, 22.0, 8.0, 16.0, 9.0, 5.0, 9.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.025177001953125, -0.02429342269897461, -0.02340984344482422, -0.022526264190673828, -0.021642684936523438, -0.020759105682373047, -0.019875526428222656, -0.018991947174072266, -0.018108367919921875, -0.017224788665771484, -0.016341209411621094, -0.015457630157470703, -0.014574050903320312, -0.013690471649169922, -0.012806892395019531, -0.01192331314086914, -0.01103973388671875, -0.01015615463256836, -0.009272575378417969, -0.008388996124267578, -0.0075054168701171875, -0.006621837615966797, -0.005738258361816406, -0.004854679107666016, -0.003971099853515625, -0.0030875205993652344, -0.0022039413452148438, -0.0013203620910644531, -0.0004367828369140625, 0.0004467964172363281, 0.0013303756713867188, 0.0022139549255371094, 0.0030975341796875, 0.003981113433837891, 0.004864692687988281, 0.005748271942138672, 0.0066318511962890625, 0.007515430450439453, 0.008399009704589844, 0.009282588958740234, 0.010166168212890625, 0.011049747467041016, 0.011933326721191406, 0.012816905975341797, 0.013700485229492188, 0.014584064483642578, 0.015467643737792969, 0.01635122299194336, 0.01723480224609375, 0.01811838150024414, 0.01900196075439453, 0.019885540008544922, 0.020769119262695312, 0.021652698516845703, 0.022536277770996094, 0.023419857025146484, 0.024303436279296875, 0.025187015533447266, 0.026070594787597656, 0.026954174041748047, 0.027837753295898438, 0.028721332550048828, 0.02960491180419922, 0.03048849105834961, 0.0313720703125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 8.0, 20.0, 44.0, 81.0, 179.0, 270.0, 203.0, 108.0, 49.0, 22.0, 13.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3423707187175751, -0.3335146903991699, -0.3246586322784424, -0.31580260396003723, -0.3069465756416321, -0.29809054732322693, -0.2892345190048218, -0.28037846088409424, -0.2715224325656891, -0.26266640424728394, -0.2538103461265564, -0.24495431780815125, -0.2360982894897461, -0.22724226117134094, -0.2183862179517746, -0.20953017473220825, -0.2006741464138031, -0.19181811809539795, -0.1829620748758316, -0.17410603165626526, -0.1652500033378601, -0.15639397501945496, -0.1475379317998886, -0.13868188858032227, -0.12982586026191711, -0.12096982449293137, -0.11211378872394562, -0.10325775295495987, -0.09440171718597412, -0.08554568141698837, -0.07668964564800262, -0.06783360987901688, -0.05897757411003113, -0.05012153834104538, -0.04126550257205963, -0.03240946680307388, -0.023553431034088135, -0.014697395265102386, -0.005841359496116638, 0.00301467627286911, 0.011870712041854858, 0.020726747810840607, 0.029582783579826355, 0.0384388193488121, 0.04729485511779785, 0.0561508908867836, 0.06500692665576935, 0.0738629624247551, 0.08271899819374084, 0.09157503396272659, 0.10043106973171234, 0.10928710550069809, 0.11814314126968384, 0.126999169588089, 0.13585521280765533, 0.14471125602722168, 0.15356728434562683, 0.16242331266403198, 0.17127935588359833, 0.18013539910316467, 0.18899142742156982, 0.19784745573997498, 0.20670349895954132, 0.21555954217910767, 0.22441557049751282]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 4.0, 2.0, 9.0, 5.0, 11.0, 11.0, 15.0, 16.0, 22.0, 25.0, 26.0, 34.0, 37.0, 51.0, 33.0, 56.0, 53.0, 44.0, 53.0, 57.0, 44.0, 47.0, 43.0, 45.0, 36.0, 36.0, 30.0, 37.0, 21.0, 26.0, 17.0, 14.0, 14.0, 11.0, 7.0, 7.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11070460081100464, -0.10726530849933624, -0.10382600873708725, -0.10038671642541885, -0.09694741666316986, -0.09350812435150146, -0.09006883203983307, -0.08662953972816467, -0.08319023996591568, -0.07975094765424728, -0.07631164789199829, -0.0728723555803299, -0.0694330632686615, -0.0659937635064125, -0.06255447119474411, -0.059115175157785416, -0.05567587912082672, -0.05223658308386803, -0.04879728704690933, -0.045357994735240936, -0.04191869869828224, -0.03847940266132355, -0.03504011034965515, -0.03160081431269646, -0.028161518275737762, -0.024722222238779068, -0.021282928064465523, -0.017843633890151978, -0.014404337853193283, -0.010965041816234589, -0.007525747641921043, -0.004086453467607498, -0.0006471574306488037, 0.002792137674987316, 0.006231432780623436, 0.009670727886259556, 0.013110022991895676, 0.01654931902885437, 0.019988613203167915, 0.02342790737748146, 0.026867203414440155, 0.03030649945139885, 0.033745795488357544, 0.03718508780002594, 0.040624383836984634, 0.04406367987394333, 0.047502972185611725, 0.05094226822257042, 0.054381564259529114, 0.05782086029648781, 0.0612601563334465, 0.0646994486451149, 0.06813874840736389, 0.07157804071903229, 0.07501733303070068, 0.07845662534236908, 0.08189592510461807, 0.08533521741628647, 0.08877451717853546, 0.09221380949020386, 0.09565310180187225, 0.09909240156412125, 0.10253169387578964, 0.10597099363803864, 0.10941028594970703]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 7.0, 10.0, 24.0, 22.0, 21.0, 69.0, 95.0, 136.0, 228.0, 341.0, 645.0, 1177.0, 2397.0, 5065.0, 11219.0, 29827.0, 94999.0, 371507.0, 380403.0, 98179.0, 30169.0, 11645.0, 5056.0, 2413.0, 1277.0, 647.0, 366.0, 197.0, 144.0, 88.0, 59.0, 27.0, 27.0, 20.0, 17.0, 12.0, 6.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1146240234375, -0.11135005950927734, -0.10807609558105469, -0.10480213165283203, -0.10152816772460938, -0.09825420379638672, -0.09498023986816406, -0.0917062759399414, -0.08843231201171875, -0.0851583480834961, -0.08188438415527344, -0.07861042022705078, -0.07533645629882812, -0.07206249237060547, -0.06878852844238281, -0.06551456451416016, -0.0622406005859375, -0.058966636657714844, -0.05569267272949219, -0.05241870880126953, -0.049144744873046875, -0.04587078094482422, -0.04259681701660156, -0.039322853088378906, -0.03604888916015625, -0.032774925231933594, -0.029500961303710938, -0.02622699737548828, -0.022953033447265625, -0.01967906951904297, -0.016405105590820312, -0.013131141662597656, -0.009857177734375, -0.006583213806152344, -0.0033092498779296875, -3.528594970703125e-05, 0.003238677978515625, 0.006512641906738281, 0.009786605834960938, 0.013060569763183594, 0.01633453369140625, 0.019608497619628906, 0.022882461547851562, 0.02615642547607422, 0.029430389404296875, 0.03270435333251953, 0.03597831726074219, 0.039252281188964844, 0.0425262451171875, 0.045800209045410156, 0.04907417297363281, 0.05234813690185547, 0.055622100830078125, 0.05889606475830078, 0.06217002868652344, 0.0654439926147461, 0.06871795654296875, 0.0719919204711914, 0.07526588439941406, 0.07853984832763672, 0.08181381225585938, 0.08508777618408203, 0.08836174011230469, 0.09163570404052734, 0.09490966796875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 5.0, 10.0, 6.0, 15.0, 23.0, 15.0, 35.0, 44.0, 48.0, 64.0, 81.0, 84.0, 103.0, 72.0, 77.0, 70.0, 55.0, 34.0, 35.0, 22.0, 18.0, 14.0, 9.0, 11.0, 11.0, 6.0, 3.0, 3.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.021331787109375, -0.020779967308044434, -0.020228147506713867, -0.0196763277053833, -0.019124507904052734, -0.018572688102722168, -0.0180208683013916, -0.017469048500061035, -0.01691722869873047, -0.016365408897399902, -0.015813589096069336, -0.01526176929473877, -0.014709949493408203, -0.014158129692077637, -0.01360630989074707, -0.013054490089416504, -0.012502670288085938, -0.011950850486755371, -0.011399030685424805, -0.010847210884094238, -0.010295391082763672, -0.009743571281433105, -0.009191751480102539, -0.008639931678771973, -0.008088111877441406, -0.00753629207611084, -0.0069844722747802734, -0.006432652473449707, -0.005880832672119141, -0.005329012870788574, -0.004777193069458008, -0.004225373268127441, -0.003673553466796875, -0.0031217336654663086, -0.002569913864135742, -0.0020180940628051758, -0.0014662742614746094, -0.000914454460144043, -0.00036263465881347656, 0.00018918514251708984, 0.0007410049438476562, 0.0012928247451782227, 0.001844644546508789, 0.0023964643478393555, 0.002948284149169922, 0.0035001039505004883, 0.004051923751831055, 0.004603743553161621, 0.0051555633544921875, 0.005707383155822754, 0.00625920295715332, 0.006811022758483887, 0.007362842559814453, 0.00791466236114502, 0.008466482162475586, 0.009018301963806152, 0.009570121765136719, 0.010121941566467285, 0.010673761367797852, 0.011225581169128418, 0.011777400970458984, 0.01232922077178955, 0.012881040573120117, 0.013432860374450684, 0.01398468017578125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 8.0, 10.0, 12.0, 15.0, 28.0, 32.0, 56.0, 65.0, 86.0, 138.0, 197.0, 293.0, 441.0, 858.0, 1857.0, 5087.0, 16709.0, 67086.0, 313689.0, 486508.0, 115530.0, 26844.0, 7593.0, 2650.0, 1098.0, 578.0, 344.0, 220.0, 160.0, 95.0, 65.0, 58.0, 31.0, 25.0, 23.0, 19.0, 7.0, 9.0, 11.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1171875, -0.11342906951904297, -0.10967063903808594, -0.1059122085571289, -0.10215377807617188, -0.09839534759521484, -0.09463691711425781, -0.09087848663330078, -0.08712005615234375, -0.08336162567138672, -0.07960319519042969, -0.07584476470947266, -0.07208633422851562, -0.0683279037475586, -0.06456947326660156, -0.06081104278564453, -0.0570526123046875, -0.05329418182373047, -0.04953575134277344, -0.045777320861816406, -0.042018890380859375, -0.038260459899902344, -0.03450202941894531, -0.03074359893798828, -0.02698516845703125, -0.02322673797607422, -0.019468307495117188, -0.015709877014160156, -0.011951446533203125, -0.008193016052246094, -0.0044345855712890625, -0.0006761550903320312, 0.003082275390625, 0.006840705871582031, 0.010599136352539062, 0.014357566833496094, 0.018115997314453125, 0.021874427795410156, 0.025632858276367188, 0.02939128875732422, 0.03314971923828125, 0.03690814971923828, 0.04066658020019531, 0.044425010681152344, 0.048183441162109375, 0.051941871643066406, 0.05570030212402344, 0.05945873260498047, 0.0632171630859375, 0.06697559356689453, 0.07073402404785156, 0.0744924545288086, 0.07825088500976562, 0.08200931549072266, 0.08576774597167969, 0.08952617645263672, 0.09328460693359375, 0.09704303741455078, 0.10080146789550781, 0.10455989837646484, 0.10831832885742188, 0.1120767593383789, 0.11583518981933594, 0.11959362030029297, 0.12335205078125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 1.0, 3.0, 6.0, 4.0, 9.0, 3.0, 12.0, 11.0, 10.0, 20.0, 19.0, 15.0, 32.0, 33.0, 29.0, 28.0, 31.0, 35.0, 45.0, 46.0, 40.0, 48.0, 41.0, 48.0, 45.0, 38.0, 40.0, 35.0, 38.0, 44.0, 34.0, 23.0, 27.0, 12.0, 17.0, 14.0, 8.0, 13.0, 6.0, 9.0, 5.0, 10.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.072021484375, -0.06980514526367188, -0.06758880615234375, -0.06537246704101562, -0.0631561279296875, -0.060939788818359375, -0.05872344970703125, -0.056507110595703125, -0.054290771484375, -0.052074432373046875, -0.04985809326171875, -0.047641754150390625, -0.0454254150390625, -0.043209075927734375, -0.04099273681640625, -0.038776397705078125, -0.03656005859375, -0.034343719482421875, -0.03212738037109375, -0.029911041259765625, -0.0276947021484375, -0.025478363037109375, -0.02326202392578125, -0.021045684814453125, -0.018829345703125, -0.016613006591796875, -0.01439666748046875, -0.012180328369140625, -0.0099639892578125, -0.007747650146484375, -0.00553131103515625, -0.003314971923828125, -0.0010986328125, 0.001117706298828125, 0.00333404541015625, 0.005550384521484375, 0.0077667236328125, 0.009983062744140625, 0.01219940185546875, 0.014415740966796875, 0.016632080078125, 0.018848419189453125, 0.02106475830078125, 0.023281097412109375, 0.0254974365234375, 0.027713775634765625, 0.02993011474609375, 0.032146453857421875, 0.03436279296875, 0.036579132080078125, 0.03879547119140625, 0.041011810302734375, 0.0432281494140625, 0.045444488525390625, 0.04766082763671875, 0.049877166748046875, 0.052093505859375, 0.054309844970703125, 0.05652618408203125, 0.058742523193359375, 0.0609588623046875, 0.06317520141601562, 0.06539154052734375, 0.06760787963867188, 0.06982421875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 9.0, 11.0, 13.0, 18.0, 27.0, 52.0, 106.0, 102.0, 143.0, 239.0, 345.0, 517.0, 755.0, 1333.0, 2212.0, 4008.0, 8235.0, 21451.0, 71233.0, 295663.0, 459488.0, 124802.0, 33349.0, 12019.0, 5275.0, 2812.0, 1589.0, 906.0, 606.0, 392.0, 256.0, 181.0, 120.0, 91.0, 61.0, 53.0, 22.0, 18.0, 12.0, 8.0, 10.0, 2.0, 8.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.054534912109375, -0.05294036865234375, -0.0513458251953125, -0.04975128173828125, -0.04815673828125, -0.04656219482421875, -0.0449676513671875, -0.04337310791015625, -0.041778564453125, -0.04018402099609375, -0.0385894775390625, -0.03699493408203125, -0.035400390625, -0.03380584716796875, -0.0322113037109375, -0.03061676025390625, -0.029022216796875, -0.02742767333984375, -0.0258331298828125, -0.02423858642578125, -0.02264404296875, -0.02104949951171875, -0.0194549560546875, -0.01786041259765625, -0.016265869140625, -0.01467132568359375, -0.0130767822265625, -0.01148223876953125, -0.0098876953125, -0.00829315185546875, -0.0066986083984375, -0.00510406494140625, -0.003509521484375, -0.00191497802734375, -0.0003204345703125, 0.00127410888671875, 0.00286865234375, 0.00446319580078125, 0.0060577392578125, 0.00765228271484375, 0.009246826171875, 0.01084136962890625, 0.0124359130859375, 0.01403045654296875, 0.015625, 0.01721954345703125, 0.0188140869140625, 0.02040863037109375, 0.022003173828125, 0.02359771728515625, 0.0251922607421875, 0.02678680419921875, 0.02838134765625, 0.02997589111328125, 0.0315704345703125, 0.03316497802734375, 0.034759521484375, 0.03635406494140625, 0.0379486083984375, 0.03954315185546875, 0.0411376953125, 0.04273223876953125, 0.0443267822265625, 0.04592132568359375, 0.047515869140625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 6.0, 15.0, 21.0, 20.0, 32.0, 79.0, 90.0, 142.0, 187.0, 149.0, 103.0, 57.0, 39.0, 26.0, 19.0, 11.0, 3.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.594989776611328e-05, -8.409842848777771e-05, -8.224695920944214e-05, -8.039548993110657e-05, -7.8544020652771e-05, -7.669255137443542e-05, -7.484108209609985e-05, -7.298961281776428e-05, -7.113814353942871e-05, -6.928667426109314e-05, -6.743520498275757e-05, -6.5583735704422e-05, -6.373226642608643e-05, -6.188079714775085e-05, -6.002932786941528e-05, -5.817785859107971e-05, -5.632638931274414e-05, -5.447492003440857e-05, -5.2623450756073e-05, -5.077198147773743e-05, -4.8920512199401855e-05, -4.7069042921066284e-05, -4.521757364273071e-05, -4.336610436439514e-05, -4.151463508605957e-05, -3.9663165807724e-05, -3.781169652938843e-05, -3.5960227251052856e-05, -3.4108757972717285e-05, -3.2257288694381714e-05, -3.0405819416046143e-05, -2.855435013771057e-05, -2.6702880859375e-05, -2.485141158103943e-05, -2.2999942302703857e-05, -2.1148473024368286e-05, -1.9297003746032715e-05, -1.7445534467697144e-05, -1.5594065189361572e-05, -1.3742595911026001e-05, -1.189112663269043e-05, -1.0039657354354858e-05, -8.188188076019287e-06, -6.336718797683716e-06, -4.4852495193481445e-06, -2.6337802410125732e-06, -7.82310962677002e-07, 1.0691583156585693e-06, 2.9206275939941406e-06, 4.772096872329712e-06, 6.623566150665283e-06, 8.475035429000854e-06, 1.0326504707336426e-05, 1.2177973985671997e-05, 1.4029443264007568e-05, 1.588091254234314e-05, 1.773238182067871e-05, 1.9583851099014282e-05, 2.1435320377349854e-05, 2.3286789655685425e-05, 2.5138258934020996e-05, 2.6989728212356567e-05, 2.884119749069214e-05, 3.069266676902771e-05, 3.254413604736328e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 8.0, 6.0, 12.0, 17.0, 20.0, 42.0, 72.0, 124.0, 249.0, 667.0, 2197.0, 10833.0, 222616.0, 782098.0, 24187.0, 3671.0, 964.0, 367.0, 165.0, 71.0, 56.0, 28.0, 17.0, 15.0, 11.0, 11.0, 8.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10650634765625, -0.10147762298583984, -0.09644889831542969, -0.09142017364501953, -0.08639144897460938, -0.08136272430419922, -0.07633399963378906, -0.0713052749633789, -0.06627655029296875, -0.061247825622558594, -0.05621910095214844, -0.05119037628173828, -0.046161651611328125, -0.04113292694091797, -0.03610420227050781, -0.031075477600097656, -0.0260467529296875, -0.021018028259277344, -0.015989303588867188, -0.010960578918457031, -0.005931854248046875, -0.0009031295776367188, 0.0041255950927734375, 0.009154319763183594, 0.01418304443359375, 0.019211769104003906, 0.024240493774414062, 0.02926921844482422, 0.034297943115234375, 0.03932666778564453, 0.04435539245605469, 0.049384117126464844, 0.054412841796875, 0.059441566467285156, 0.06447029113769531, 0.06949901580810547, 0.07452774047851562, 0.07955646514892578, 0.08458518981933594, 0.0896139144897461, 0.09464263916015625, 0.0996713638305664, 0.10470008850097656, 0.10972881317138672, 0.11475753784179688, 0.11978626251220703, 0.12481498718261719, 0.12984371185302734, 0.1348724365234375, 0.13990116119384766, 0.1449298858642578, 0.14995861053466797, 0.15498733520507812, 0.16001605987548828, 0.16504478454589844, 0.1700735092163086, 0.17510223388671875, 0.1801309585571289, 0.18515968322753906, 0.19018840789794922, 0.19521713256835938, 0.20024585723876953, 0.2052745819091797, 0.21030330657958984, 0.21533203125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 9.0, 7.0, 20.0, 22.0, 45.0, 80.0, 124.0, 163.0, 143.0, 151.0, 68.0, 54.0, 36.0, 25.0, 13.0, 7.0, 5.0, 5.0, 2.0, 1.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.050506591796875, -0.048220157623291016, -0.04593372344970703, -0.04364728927612305, -0.04136085510253906, -0.03907442092895508, -0.036787986755371094, -0.03450155258178711, -0.032215118408203125, -0.02992868423461914, -0.027642250061035156, -0.025355815887451172, -0.023069381713867188, -0.020782947540283203, -0.01849651336669922, -0.016210079193115234, -0.01392364501953125, -0.011637210845947266, -0.009350776672363281, -0.007064342498779297, -0.0047779083251953125, -0.002491474151611328, -0.00020503997802734375, 0.0020813941955566406, 0.004367828369140625, 0.006654262542724609, 0.008940696716308594, 0.011227130889892578, 0.013513565063476562, 0.015799999237060547, 0.01808643341064453, 0.020372867584228516, 0.0226593017578125, 0.024945735931396484, 0.02723217010498047, 0.029518604278564453, 0.03180503845214844, 0.03409147262573242, 0.036377906799316406, 0.03866434097290039, 0.040950775146484375, 0.04323720932006836, 0.045523643493652344, 0.04781007766723633, 0.05009651184082031, 0.0523829460144043, 0.05466938018798828, 0.056955814361572266, 0.05924224853515625, 0.061528682708740234, 0.06381511688232422, 0.0661015510559082, 0.06838798522949219, 0.07067441940307617, 0.07296085357666016, 0.07524728775024414, 0.07753372192382812, 0.07982015609741211, 0.0821065902709961, 0.08439302444458008, 0.08667945861816406, 0.08896589279174805, 0.09125232696533203, 0.09353876113891602, 0.0958251953125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 6.0, 8.0, 16.0, 16.0, 43.0, 77.0, 106.0, 158.0, 158.0, 148.0, 118.0, 58.0, 43.0, 19.0, 10.0, 11.0, 9.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5261595845222473, -0.5014950037002563, -0.47683045268058777, -0.4521659016609192, -0.4275013208389282, -0.40283676981925964, -0.37817221879959106, -0.3535076379776001, -0.3288430869579315, -0.30417853593826294, -0.279513955116272, -0.2548494040966034, -0.23018483817577362, -0.20552027225494385, -0.18085572123527527, -0.1561911553144455, -0.13152658939361572, -0.10686202347278595, -0.08219746500253677, -0.0575329065322876, -0.032868340611457825, -0.008203774690628052, 0.016460776329040527, 0.0411253422498703, 0.06578990817070007, 0.09045447409152985, 0.11511903256177902, 0.1397835910320282, 0.16444815695285797, 0.18911272287368774, 0.21377727389335632, 0.2384418398141861, 0.2631063461303711, 0.2877708971500397, 0.31243547797203064, 0.3371000289916992, 0.3617646098136902, 0.38642916083335876, 0.41109371185302734, 0.4357582926750183, 0.4604228436946869, 0.48508739471435547, 0.5097519755363464, 0.5344165563583374, 0.5590810775756836, 0.5837456583976746, 0.6084102392196655, 0.6330747604370117, 0.6577393412590027, 0.6824039220809937, 0.7070684432983398, 0.7317330241203308, 0.7563976049423218, 0.781062126159668, 0.8057267069816589, 0.8303912878036499, 0.8550558090209961, 0.8797203898429871, 0.9043849110603333, 0.9290494918823242, 0.9537140727043152, 0.9783786535263062, 1.0030431747436523, 1.0277076959609985, 1.0523723363876343]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 6.0, 6.0, 7.0, 9.0, 9.0, 10.0, 17.0, 16.0, 23.0, 27.0, 25.0, 20.0, 31.0, 42.0, 30.0, 30.0, 36.0, 46.0, 40.0, 51.0, 38.0, 37.0, 38.0, 45.0, 46.0, 43.0, 40.0, 37.0, 35.0, 18.0, 30.0, 18.0, 14.0, 15.0, 18.0, 3.0, 10.0, 13.0, 2.0, 9.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.49666398763656616, -0.48125702142715454, -0.46585002541542053, -0.4504430294036865, -0.4350360631942749, -0.4196290969848633, -0.4042221009731293, -0.38881510496139526, -0.37340813875198364, -0.358001172542572, -0.342594176530838, -0.327187180519104, -0.3117802143096924, -0.29637324810028076, -0.28096625208854675, -0.26555925607681274, -0.2501522898674011, -0.2347453087568283, -0.2193383276462555, -0.20393134653568268, -0.18852436542510986, -0.17311738431453705, -0.15771040320396423, -0.14230342209339142, -0.1268964409828186, -0.11148945987224579, -0.09608247876167297, -0.08067549765110016, -0.06526851654052734, -0.04986153542995453, -0.034454554319381714, -0.0190475732088089, -0.003640592098236084, 0.011766389012336731, 0.027173370122909546, 0.04258035123348236, 0.057987332344055176, 0.07339431345462799, 0.0888012945652008, 0.10420827567577362, 0.11961525678634644, 0.13502223789691925, 0.15042921900749207, 0.16583620011806488, 0.1812431812286377, 0.1966501623392105, 0.21205714344978333, 0.22746412456035614, 0.24287110567092896, 0.2582780718803406, 0.2736850678920746, 0.2890920639038086, 0.3044990301132202, 0.31990599632263184, 0.33531299233436584, 0.35071998834609985, 0.3661269545555115, 0.3815339207649231, 0.3969409167766571, 0.4123479127883911, 0.42775487899780273, 0.44316184520721436, 0.45856884121894836, 0.4739758372306824, 0.489382803440094]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 9.0, 12.0, 10.0, 11.0, 15.0, 40.0, 42.0, 63.0, 92.0, 138.0, 206.0, 336.0, 541.0, 1004.0, 2046.0, 5136.0, 16182.0, 77559.0, 3638498.0, 396478.0, 38505.0, 9941.0, 3622.0, 1595.0, 798.0, 463.0, 298.0, 189.0, 122.0, 86.0, 63.0, 45.0, 39.0, 34.0, 12.0, 17.0, 11.0, 8.0, 6.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.12841796875, -0.12410926818847656, -0.11980056762695312, -0.11549186706542969, -0.11118316650390625, -0.10687446594238281, -0.10256576538085938, -0.09825706481933594, -0.0939483642578125, -0.08963966369628906, -0.08533096313476562, -0.08102226257324219, -0.07671356201171875, -0.07240486145019531, -0.06809616088867188, -0.06378746032714844, -0.059478759765625, -0.05517005920410156, -0.050861358642578125, -0.04655265808105469, -0.04224395751953125, -0.03793525695800781, -0.033626556396484375, -0.029317855834960938, -0.0250091552734375, -0.020700454711914062, -0.016391754150390625, -0.012083053588867188, -0.00777435302734375, -0.0034656524658203125, 0.000843048095703125, 0.0051517486572265625, 0.00946044921875, 0.013769149780273438, 0.018077850341796875, 0.022386550903320312, 0.02669525146484375, 0.031003952026367188, 0.035312652587890625, 0.03962135314941406, 0.0439300537109375, 0.04823875427246094, 0.052547454833984375, 0.05685615539550781, 0.06116485595703125, 0.06547355651855469, 0.06978225708007812, 0.07409095764160156, 0.078399658203125, 0.08270835876464844, 0.08701705932617188, 0.09132575988769531, 0.09563446044921875, 0.09994316101074219, 0.10425186157226562, 0.10856056213378906, 0.1128692626953125, 0.11717796325683594, 0.12148666381835938, 0.1257953643798828, 0.13010406494140625, 0.1344127655029297, 0.13872146606445312, 0.14303016662597656, 0.1473388671875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 6.0, 6.0, 6.0, 6.0, 11.0, 8.0, 16.0, 12.0, 22.0, 25.0, 42.0, 46.0, 53.0, 47.0, 69.0, 80.0, 71.0, 84.0, 73.0, 73.0, 39.0, 45.0, 32.0, 25.0, 24.0, 18.0, 15.0, 10.0, 8.0, 8.0, 7.0, 4.0, 2.0, 4.0, 5.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0196685791015625, -0.019065380096435547, -0.018462181091308594, -0.01785898208618164, -0.017255783081054688, -0.016652584075927734, -0.01604938507080078, -0.015446186065673828, -0.014842987060546875, -0.014239788055419922, -0.013636589050292969, -0.013033390045166016, -0.012430191040039062, -0.01182699203491211, -0.011223793029785156, -0.010620594024658203, -0.01001739501953125, -0.009414196014404297, -0.008810997009277344, -0.00820779800415039, -0.0076045989990234375, -0.007001399993896484, -0.006398200988769531, -0.005795001983642578, -0.005191802978515625, -0.004588603973388672, -0.003985404968261719, -0.0033822059631347656, -0.0027790069580078125, -0.0021758079528808594, -0.0015726089477539062, -0.0009694099426269531, -0.0003662109375, 0.00023698806762695312, 0.0008401870727539062, 0.0014433860778808594, 0.0020465850830078125, 0.0026497840881347656, 0.0032529830932617188, 0.003856182098388672, 0.004459381103515625, 0.005062580108642578, 0.005665779113769531, 0.006268978118896484, 0.0068721771240234375, 0.007475376129150391, 0.008078575134277344, 0.008681774139404297, 0.00928497314453125, 0.009888172149658203, 0.010491371154785156, 0.01109457015991211, 0.011697769165039062, 0.012300968170166016, 0.012904167175292969, 0.013507366180419922, 0.014110565185546875, 0.014713764190673828, 0.015316963195800781, 0.015920162200927734, 0.016523361206054688, 0.01712656021118164, 0.017729759216308594, 0.018332958221435547, 0.0189361572265625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 6.0, 8.0, 16.0, 35.0, 72.0, 103.0, 175.0, 366.0, 908.0, 1973.0, 5086.0, 15355.0, 59749.0, 555866.0, 3391310.0, 124937.0, 25298.0, 7843.0, 2825.0, 1165.0, 610.0, 280.0, 138.0, 63.0, 40.0, 27.0, 15.0, 7.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13427734375, -0.1305685043334961, -0.1268596649169922, -0.12315082550048828, -0.11944198608398438, -0.11573314666748047, -0.11202430725097656, -0.10831546783447266, -0.10460662841796875, -0.10089778900146484, -0.09718894958496094, -0.09348011016845703, -0.08977127075195312, -0.08606243133544922, -0.08235359191894531, -0.0786447525024414, -0.0749359130859375, -0.0712270736694336, -0.06751823425292969, -0.06380939483642578, -0.060100555419921875, -0.05639171600341797, -0.05268287658691406, -0.048974037170410156, -0.04526519775390625, -0.041556358337402344, -0.03784751892089844, -0.03413867950439453, -0.030429840087890625, -0.02672100067138672, -0.023012161254882812, -0.019303321838378906, -0.015594482421875, -0.011885643005371094, -0.008176803588867188, -0.004467964172363281, -0.000759124755859375, 0.0029497146606445312, 0.0066585540771484375, 0.010367393493652344, 0.01407623291015625, 0.017785072326660156, 0.021493911743164062, 0.02520275115966797, 0.028911590576171875, 0.03262042999267578, 0.03632926940917969, 0.040038108825683594, 0.0437469482421875, 0.047455787658691406, 0.05116462707519531, 0.05487346649169922, 0.058582305908203125, 0.06229114532470703, 0.06599998474121094, 0.06970882415771484, 0.07341766357421875, 0.07712650299072266, 0.08083534240722656, 0.08454418182373047, 0.08825302124023438, 0.09196186065673828, 0.09567070007324219, 0.0993795394897461, 0.10308837890625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 1.0, 1.0, 4.0, 2.0, 7.0, 6.0, 10.0, 12.0, 15.0, 20.0, 21.0, 26.0, 61.0, 90.0, 147.0, 235.0, 717.0, 1767.0, 419.0, 193.0, 101.0, 60.0, 43.0, 28.0, 28.0, 20.0, 7.0, 12.0, 8.0, 7.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0295257568359375, -0.028580665588378906, -0.027635574340820312, -0.02669048309326172, -0.025745391845703125, -0.02480030059814453, -0.023855209350585938, -0.022910118103027344, -0.02196502685546875, -0.021019935607910156, -0.020074844360351562, -0.01912975311279297, -0.018184661865234375, -0.01723957061767578, -0.016294479370117188, -0.015349388122558594, -0.014404296875, -0.013459205627441406, -0.012514114379882812, -0.011569023132324219, -0.010623931884765625, -0.009678840637207031, -0.008733749389648438, -0.007788658142089844, -0.00684356689453125, -0.005898475646972656, -0.0049533843994140625, -0.004008293151855469, -0.003063201904296875, -0.0021181106567382812, -0.0011730194091796875, -0.00022792816162109375, 0.0007171630859375, 0.0016622543334960938, 0.0026073455810546875, 0.0035524368286132812, 0.004497528076171875, 0.005442619323730469, 0.0063877105712890625, 0.007332801818847656, 0.00827789306640625, 0.009222984313964844, 0.010168075561523438, 0.011113166809082031, 0.012058258056640625, 0.013003349304199219, 0.013948440551757812, 0.014893531799316406, 0.015838623046875, 0.016783714294433594, 0.017728805541992188, 0.01867389678955078, 0.019618988037109375, 0.02056407928466797, 0.021509170532226562, 0.022454261779785156, 0.02339935302734375, 0.024344444274902344, 0.025289535522460938, 0.02623462677001953, 0.027179718017578125, 0.02812480926513672, 0.029069900512695312, 0.030014991760253906, 0.0309600830078125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 7.0, 5.0, 12.0, 20.0, 28.0, 31.0, 45.0, 55.0, 87.0, 111.0, 129.0, 111.0, 101.0, 75.0, 51.0, 45.0, 26.0, 18.0, 14.0, 6.0, 2.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10153816640377045, -0.09757574647665024, -0.09361332654953003, -0.08965090662240982, -0.08568848669528961, -0.0817260593175888, -0.0777636393904686, -0.07380121946334839, -0.06983879953622818, -0.06587637960910797, -0.06191395968198776, -0.057951536029577255, -0.053989116102457047, -0.05002669617533684, -0.04606427252292633, -0.04210185259580612, -0.03813943266868591, -0.034177012741565704, -0.030214590951800346, -0.02625216916203499, -0.02228974923491478, -0.01832732930779457, -0.014364907518029213, -0.010402485728263855, -0.006440065801143646, -0.002477644942700863, 0.0014847759157419205, 0.005447196774184704, 0.009409617632627487, 0.013372037559747696, 0.017334459349513054, 0.021296881139278412, 0.025259315967559814, 0.029221735894680023, 0.03318415582180023, 0.03714657947421074, 0.04110899940133095, 0.04507141932845116, 0.049033842980861664, 0.05299626290798187, 0.05695868283510208, 0.06092110276222229, 0.0648835226893425, 0.06884594261646271, 0.07280836999416351, 0.07677078247070312, 0.08073320984840393, 0.08469562977552414, 0.08865804970264435, 0.09262046962976456, 0.09658288955688477, 0.10054530948400497, 0.10450772941112518, 0.10847015678882599, 0.1124325767159462, 0.1163949966430664, 0.12035741657018661, 0.12431983649730682, 0.12828226387500763, 0.13224467635154724, 0.13620710372924805, 0.14016951620578766, 0.14413194358348846, 0.14809435606002808, 0.15205678343772888]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 1.0, 5.0, 8.0, 6.0, 6.0, 16.0, 17.0, 12.0, 16.0, 14.0, 22.0, 25.0, 28.0, 34.0, 41.0, 40.0, 30.0, 33.0, 40.0, 32.0, 50.0, 59.0, 31.0, 44.0, 44.0, 43.0, 35.0, 38.0, 42.0, 27.0, 22.0, 14.0, 20.0, 14.0, 20.0, 18.0, 5.0, 18.0, 8.0, 2.0, 2.0, 6.0, 5.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.08024102449417114, -0.07758000493049622, -0.07491899281740189, -0.07225797325372696, -0.06959696114063263, -0.0669359415769577, -0.06427492201328278, -0.06161390617489815, -0.05895289033651352, -0.05629187449812889, -0.05363085865974426, -0.050969839096069336, -0.04830882325768471, -0.04564780741930008, -0.04298678785562515, -0.040325772017240524, -0.037664756178855896, -0.03500374034047127, -0.03234272450208664, -0.029681704938411713, -0.027020689100027084, -0.024359673261642456, -0.02169865556061268, -0.0190376378595829, -0.016376622021198273, -0.01371560525149107, -0.011054588481783867, -0.008393571712076664, -0.005732554942369461, -0.003071538172662258, -0.00041052140295505524, 0.0022504962980747223, 0.004911512136459351, 0.0075725289061665535, 0.010233545675873756, 0.01289456244558096, 0.015555579215288162, 0.01821659505367279, 0.020877612754702568, 0.023538630455732346, 0.026199646294116974, 0.028860662132501602, 0.03152167797088623, 0.03418269753456116, 0.036843713372945786, 0.039504729211330414, 0.04216574877500534, 0.04482676461338997, 0.0474877804517746, 0.050148796290159225, 0.052809812128543854, 0.05547083169221878, 0.05813184753060341, 0.06079286336898804, 0.06345388293266296, 0.06611490249633789, 0.06877591460943222, 0.07143693417310715, 0.07409794628620148, 0.0767589658498764, 0.07941998541355133, 0.08208099752664566, 0.08474201709032059, 0.08740302920341492, 0.09006404876708984]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 7.0, 10.0, 27.0, 33.0, 32.0, 54.0, 74.0, 137.0, 144.0, 248.0, 394.0, 586.0, 837.0, 1564.0, 2573.0, 4250.0, 7376.0, 13223.0, 25448.0, 50624.0, 105914.0, 222735.0, 298507.0, 159194.0, 74791.0, 36437.0, 18901.0, 10208.0, 5473.0, 3216.0, 2052.0, 1188.0, 799.0, 474.0, 347.0, 213.0, 154.0, 103.0, 54.0, 46.0, 39.0, 17.0, 9.0, 7.0, 12.0, 6.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.055572509765625, -0.05390214920043945, -0.052231788635253906, -0.05056142807006836, -0.04889106750488281, -0.047220706939697266, -0.04555034637451172, -0.04387998580932617, -0.042209625244140625, -0.04053926467895508, -0.03886890411376953, -0.037198543548583984, -0.03552818298339844, -0.03385782241821289, -0.032187461853027344, -0.030517101287841797, -0.02884674072265625, -0.027176380157470703, -0.025506019592285156, -0.02383565902709961, -0.022165298461914062, -0.020494937896728516, -0.01882457733154297, -0.017154216766357422, -0.015483856201171875, -0.013813495635986328, -0.012143135070800781, -0.010472774505615234, -0.008802413940429688, -0.007132053375244141, -0.005461692810058594, -0.003791332244873047, -0.0021209716796875, -0.0004506111145019531, 0.0012197494506835938, 0.0028901100158691406, 0.0045604705810546875, 0.006230831146240234, 0.007901191711425781, 0.009571552276611328, 0.011241912841796875, 0.012912273406982422, 0.014582633972167969, 0.016252994537353516, 0.017923355102539062, 0.01959371566772461, 0.021264076232910156, 0.022934436798095703, 0.02460479736328125, 0.026275157928466797, 0.027945518493652344, 0.02961587905883789, 0.03128623962402344, 0.032956600189208984, 0.03462696075439453, 0.03629732131958008, 0.037967681884765625, 0.03963804244995117, 0.04130840301513672, 0.042978763580322266, 0.04464912414550781, 0.04631948471069336, 0.047989845275878906, 0.04966020584106445, 0.05133056640625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 7.0, 2.0, 5.0, 15.0, 12.0, 22.0, 18.0, 31.0, 29.0, 32.0, 50.0, 46.0, 72.0, 66.0, 64.0, 76.0, 63.0, 55.0, 59.0, 58.0, 42.0, 47.0, 22.0, 29.0, 15.0, 11.0, 7.0, 6.0, 9.0, 7.0, 2.0, 9.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.019561767578125, -0.018991708755493164, -0.018421649932861328, -0.017851591110229492, -0.017281532287597656, -0.01671147346496582, -0.016141414642333984, -0.015571355819702148, -0.015001296997070312, -0.014431238174438477, -0.01386117935180664, -0.013291120529174805, -0.012721061706542969, -0.012151002883911133, -0.011580944061279297, -0.011010885238647461, -0.010440826416015625, -0.009870767593383789, -0.009300708770751953, -0.008730649948120117, -0.008160591125488281, -0.007590532302856445, -0.007020473480224609, -0.0064504146575927734, -0.0058803558349609375, -0.0053102970123291016, -0.004740238189697266, -0.00417017936706543, -0.0036001205444335938, -0.003030061721801758, -0.002460002899169922, -0.001889944076538086, -0.00131988525390625, -0.0007498264312744141, -0.00017976760864257812, 0.0003902912139892578, 0.0009603500366210938, 0.0015304088592529297, 0.0021004676818847656, 0.0026705265045166016, 0.0032405853271484375, 0.0038106441497802734, 0.004380702972412109, 0.004950761795043945, 0.005520820617675781, 0.006090879440307617, 0.006660938262939453, 0.007230997085571289, 0.007801055908203125, 0.008371114730834961, 0.008941173553466797, 0.009511232376098633, 0.010081291198730469, 0.010651350021362305, 0.01122140884399414, 0.011791467666625977, 0.012361526489257812, 0.012931585311889648, 0.013501644134521484, 0.01407170295715332, 0.014641761779785156, 0.015211820602416992, 0.015781879425048828, 0.016351938247680664, 0.0169219970703125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 5.0, 9.0, 7.0, 8.0, 14.0, 17.0, 16.0, 30.0, 58.0, 68.0, 88.0, 119.0, 182.0, 245.0, 378.0, 596.0, 1022.0, 1885.0, 4027.0, 9376.0, 25054.0, 75623.0, 228990.0, 405571.0, 194491.0, 63303.0, 21265.0, 8167.0, 3557.0, 1628.0, 973.0, 585.0, 368.0, 235.0, 180.0, 111.0, 78.0, 51.0, 51.0, 33.0, 29.0, 18.0, 16.0, 8.0, 7.0, 4.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.071044921875, -0.06891918182373047, -0.06679344177246094, -0.0646677017211914, -0.06254196166992188, -0.060416221618652344, -0.05829048156738281, -0.05616474151611328, -0.05403900146484375, -0.05191326141357422, -0.04978752136230469, -0.047661781311035156, -0.045536041259765625, -0.043410301208496094, -0.04128456115722656, -0.03915882110595703, -0.0370330810546875, -0.03490734100341797, -0.03278160095214844, -0.030655860900878906, -0.028530120849609375, -0.026404380798339844, -0.024278640747070312, -0.02215290069580078, -0.02002716064453125, -0.01790142059326172, -0.015775680541992188, -0.013649940490722656, -0.011524200439453125, -0.009398460388183594, -0.0072727203369140625, -0.005146980285644531, -0.003021240234375, -0.0008955001831054688, 0.0012302398681640625, 0.0033559799194335938, 0.005481719970703125, 0.007607460021972656, 0.009733200073242188, 0.011858940124511719, 0.01398468017578125, 0.01611042022705078, 0.018236160278320312, 0.020361900329589844, 0.022487640380859375, 0.024613380432128906, 0.026739120483398438, 0.02886486053466797, 0.0309906005859375, 0.03311634063720703, 0.03524208068847656, 0.037367820739746094, 0.039493560791015625, 0.041619300842285156, 0.04374504089355469, 0.04587078094482422, 0.04799652099609375, 0.05012226104736328, 0.05224800109863281, 0.054373741149902344, 0.056499481201171875, 0.058625221252441406, 0.06075096130371094, 0.06287670135498047, 0.06500244140625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 5.0, 2.0, 3.0, 4.0, 5.0, 13.0, 10.0, 15.0, 18.0, 24.0, 22.0, 22.0, 28.0, 32.0, 25.0, 35.0, 34.0, 31.0, 47.0, 45.0, 53.0, 41.0, 46.0, 39.0, 38.0, 33.0, 43.0, 31.0, 32.0, 46.0, 25.0, 25.0, 20.0, 18.0, 15.0, 17.0, 14.0, 12.0, 5.0, 3.0, 8.0, 7.0, 3.0, 3.0, 4.0, 5.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.0765380859375, -0.07442569732666016, -0.07231330871582031, -0.07020092010498047, -0.06808853149414062, -0.06597614288330078, -0.06386375427246094, -0.061751365661621094, -0.05963897705078125, -0.057526588439941406, -0.05541419982910156, -0.05330181121826172, -0.051189422607421875, -0.04907703399658203, -0.04696464538574219, -0.044852256774902344, -0.0427398681640625, -0.040627479553222656, -0.03851509094238281, -0.03640270233154297, -0.034290313720703125, -0.03217792510986328, -0.030065536499023438, -0.027953147888183594, -0.02584075927734375, -0.023728370666503906, -0.021615982055664062, -0.01950359344482422, -0.017391204833984375, -0.015278816223144531, -0.013166427612304688, -0.011054039001464844, -0.008941650390625, -0.006829261779785156, -0.0047168731689453125, -0.0026044845581054688, -0.000492095947265625, 0.0016202926635742188, 0.0037326812744140625, 0.005845069885253906, 0.00795745849609375, 0.010069847106933594, 0.012182235717773438, 0.014294624328613281, 0.016407012939453125, 0.01851940155029297, 0.020631790161132812, 0.022744178771972656, 0.0248565673828125, 0.026968955993652344, 0.029081344604492188, 0.03119373321533203, 0.033306121826171875, 0.03541851043701172, 0.03753089904785156, 0.039643287658691406, 0.04175567626953125, 0.043868064880371094, 0.04598045349121094, 0.04809284210205078, 0.050205230712890625, 0.05231761932373047, 0.05443000793457031, 0.056542396545410156, 0.05865478515625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 7.0, 15.0, 13.0, 15.0, 23.0, 34.0, 55.0, 78.0, 96.0, 139.0, 243.0, 449.0, 728.0, 1332.0, 2706.0, 5568.0, 13143.0, 34961.0, 105435.0, 351051.0, 361193.0, 109679.0, 36006.0, 13630.0, 5749.0, 2790.0, 1382.0, 764.0, 463.0, 274.0, 183.0, 106.0, 81.0, 44.0, 35.0, 17.0, 18.0, 14.0, 8.0, 6.0, 1.0, 7.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.03448486328125, -0.033471107482910156, -0.03245735168457031, -0.03144359588623047, -0.030429840087890625, -0.02941608428955078, -0.028402328491210938, -0.027388572692871094, -0.02637481689453125, -0.025361061096191406, -0.024347305297851562, -0.02333354949951172, -0.022319793701171875, -0.02130603790283203, -0.020292282104492188, -0.019278526306152344, -0.0182647705078125, -0.017251014709472656, -0.016237258911132812, -0.015223503112792969, -0.014209747314453125, -0.013195991516113281, -0.012182235717773438, -0.011168479919433594, -0.01015472412109375, -0.009140968322753906, -0.008127212524414062, -0.007113456726074219, -0.006099700927734375, -0.005085945129394531, -0.0040721893310546875, -0.0030584335327148438, -0.002044677734375, -0.0010309219360351562, -1.71661376953125e-05, 0.0009965896606445312, 0.002010345458984375, 0.0030241012573242188, 0.0040378570556640625, 0.005051612854003906, 0.00606536865234375, 0.007079124450683594, 0.008092880249023438, 0.009106636047363281, 0.010120391845703125, 0.011134147644042969, 0.012147903442382812, 0.013161659240722656, 0.0141754150390625, 0.015189170837402344, 0.016202926635742188, 0.01721668243408203, 0.018230438232421875, 0.01924419403076172, 0.020257949829101562, 0.021271705627441406, 0.02228546142578125, 0.023299217224121094, 0.024312973022460938, 0.02532672882080078, 0.026340484619140625, 0.02735424041748047, 0.028367996215820312, 0.029381752014160156, 0.0303955078125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 13.0, 15.0, 16.0, 28.0, 34.0, 46.0, 45.0, 86.0, 85.0, 86.0, 100.0, 108.0, 69.0, 70.0, 47.0, 43.0, 28.0, 25.0, 12.0, 8.0, 5.0, 5.0, 5.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.7087669372558594e-05, -4.5942142605781555e-05, -4.4796615839004517e-05, -4.365108907222748e-05, -4.250556230545044e-05, -4.13600355386734e-05, -4.021450877189636e-05, -3.9068982005119324e-05, -3.7923455238342285e-05, -3.6777928471565247e-05, -3.563240170478821e-05, -3.448687493801117e-05, -3.334134817123413e-05, -3.219582140445709e-05, -3.1050294637680054e-05, -2.9904767870903015e-05, -2.8759241104125977e-05, -2.7613714337348938e-05, -2.64681875705719e-05, -2.532266080379486e-05, -2.4177134037017822e-05, -2.3031607270240784e-05, -2.1886080503463745e-05, -2.0740553736686707e-05, -1.9595026969909668e-05, -1.844950020313263e-05, -1.730397343635559e-05, -1.6158446669578552e-05, -1.5012919902801514e-05, -1.3867393136024475e-05, -1.2721866369247437e-05, -1.1576339602470398e-05, -1.043081283569336e-05, -9.28528606891632e-06, -8.139759302139282e-06, -6.994232535362244e-06, -5.848705768585205e-06, -4.7031790018081665e-06, -3.557652235031128e-06, -2.4121254682540894e-06, -1.2665987014770508e-06, -1.210719347000122e-07, 1.0244548320770264e-06, 2.169981598854065e-06, 3.3155083656311035e-06, 4.461035132408142e-06, 5.606561899185181e-06, 6.752088665962219e-06, 7.897615432739258e-06, 9.043142199516296e-06, 1.0188668966293335e-05, 1.1334195733070374e-05, 1.2479722499847412e-05, 1.362524926662445e-05, 1.477077603340149e-05, 1.5916302800178528e-05, 1.7061829566955566e-05, 1.8207356333732605e-05, 1.9352883100509644e-05, 2.0498409867286682e-05, 2.164393663406372e-05, 2.278946340084076e-05, 2.3934990167617798e-05, 2.5080516934394836e-05, 2.6226043701171875e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 5.0, 4.0, 14.0, 11.0, 15.0, 25.0, 29.0, 51.0, 93.0, 132.0, 260.0, 433.0, 890.0, 2231.0, 6922.0, 29549.0, 167603.0, 631490.0, 168106.0, 29552.0, 6970.0, 2183.0, 968.0, 457.0, 222.0, 137.0, 71.0, 47.0, 28.0, 22.0, 11.0, 7.0, 10.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052520751953125, -0.050952911376953125, -0.04938507080078125, -0.047817230224609375, -0.0462493896484375, -0.044681549072265625, -0.04311370849609375, -0.041545867919921875, -0.03997802734375, -0.038410186767578125, -0.03684234619140625, -0.035274505615234375, -0.0337066650390625, -0.032138824462890625, -0.03057098388671875, -0.029003143310546875, -0.027435302734375, -0.025867462158203125, -0.02429962158203125, -0.022731781005859375, -0.0211639404296875, -0.019596099853515625, -0.01802825927734375, -0.016460418701171875, -0.014892578125, -0.013324737548828125, -0.01175689697265625, -0.010189056396484375, -0.0086212158203125, -0.007053375244140625, -0.00548553466796875, -0.003917694091796875, -0.002349853515625, -0.000782012939453125, 0.00078582763671875, 0.002353668212890625, 0.0039215087890625, 0.005489349365234375, 0.00705718994140625, 0.008625030517578125, 0.01019287109375, 0.011760711669921875, 0.01332855224609375, 0.014896392822265625, 0.0164642333984375, 0.018032073974609375, 0.01959991455078125, 0.021167755126953125, 0.022735595703125, 0.024303436279296875, 0.02587127685546875, 0.027439117431640625, 0.0290069580078125, 0.030574798583984375, 0.03214263916015625, 0.033710479736328125, 0.0352783203125, 0.036846160888671875, 0.03841400146484375, 0.039981842041015625, 0.0415496826171875, 0.043117523193359375, 0.04468536376953125, 0.046253204345703125, 0.047821044921875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 4.0, 8.0, 9.0, 4.0, 9.0, 13.0, 18.0, 33.0, 51.0, 49.0, 73.0, 98.0, 102.0, 118.0, 105.0, 89.0, 65.0, 45.0, 34.0, 29.0, 19.0, 14.0, 8.0, 7.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.05975341796875, -0.05840444564819336, -0.05705547332763672, -0.05570650100708008, -0.05435752868652344, -0.0530085563659668, -0.051659584045410156, -0.050310611724853516, -0.048961639404296875, -0.047612667083740234, -0.046263694763183594, -0.04491472244262695, -0.04356575012207031, -0.04221677780151367, -0.04086780548095703, -0.03951883316040039, -0.03816986083984375, -0.03682088851928711, -0.03547191619873047, -0.03412294387817383, -0.03277397155761719, -0.03142499923706055, -0.030076026916503906, -0.028727054595947266, -0.027378082275390625, -0.026029109954833984, -0.024680137634277344, -0.023331165313720703, -0.021982192993164062, -0.020633220672607422, -0.01928424835205078, -0.01793527603149414, -0.0165863037109375, -0.01523733139038086, -0.013888359069824219, -0.012539386749267578, -0.011190414428710938, -0.009841442108154297, -0.008492469787597656, -0.007143497467041016, -0.005794525146484375, -0.004445552825927734, -0.0030965805053710938, -0.0017476081848144531, -0.0003986358642578125, 0.0009503364562988281, 0.0022993087768554688, 0.0036482810974121094, 0.00499725341796875, 0.006346225738525391, 0.007695198059082031, 0.009044170379638672, 0.010393142700195312, 0.011742115020751953, 0.013091087341308594, 0.014440059661865234, 0.015789031982421875, 0.017138004302978516, 0.018486976623535156, 0.019835948944091797, 0.021184921264648438, 0.022533893585205078, 0.02388286590576172, 0.02523183822631836, 0.026580810546875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 13.0, 16.0, 49.0, 117.0, 219.0, 235.0, 177.0, 115.0, 33.0, 18.0, 12.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42393758893013, -0.39454230666160583, -0.36514702439308167, -0.3357517421245575, -0.3063564598560333, -0.27696117758750916, -0.24756589531898499, -0.21817061305046082, -0.18877533078193665, -0.15938004851341248, -0.1299847662448883, -0.10058948397636414, -0.07119420170783997, -0.041798919439315796, -0.012403637170791626, 0.016991645097732544, 0.046386927366256714, 0.07578220963478088, 0.10517749190330505, 0.13457277417182922, 0.1639680564403534, 0.19336333870887756, 0.22275862097740173, 0.2521539032459259, 0.2815491855144501, 0.31094446778297424, 0.3403397500514984, 0.3697350323200226, 0.39913031458854675, 0.4285255968570709, 0.4579208791255951, 0.48731616139411926, 0.5167114734649658, 0.54610675573349, 0.5755020380020142, 0.6048973202705383, 0.6342926025390625, 0.6636878848075867, 0.6930831670761108, 0.722478449344635, 0.7518737316131592, 0.7812690138816833, 0.8106642961502075, 0.8400595784187317, 0.8694548606872559, 0.89885014295578, 0.9282454252243042, 0.9576407074928284, 0.9870359897613525, 1.0164313316345215, 1.0458265542984009, 1.0752217769622803, 1.1046171188354492, 1.1340124607086182, 1.1634076833724976, 1.192802906036377, 1.222198247909546, 1.2515935897827148, 1.2809888124465942, 1.3103840351104736, 1.3397793769836426, 1.3691747188568115, 1.398569941520691, 1.4279651641845703, 1.4573605060577393]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 5.0, 5.0, 7.0, 8.0, 9.0, 9.0, 10.0, 13.0, 19.0, 23.0, 24.0, 22.0, 25.0, 34.0, 40.0, 37.0, 54.0, 38.0, 61.0, 48.0, 52.0, 57.0, 61.0, 43.0, 50.0, 40.0, 34.0, 23.0, 19.0, 20.0, 21.0, 24.0, 15.0, 13.0, 13.0, 10.0, 3.0, 3.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.5078218579292297, -0.4937440752983093, -0.4796662926673889, -0.4655885100364685, -0.4515107274055481, -0.4374329447746277, -0.4233551621437073, -0.40927737951278687, -0.39519959688186646, -0.38112181425094604, -0.36704403162002563, -0.3529662489891052, -0.3388884663581848, -0.3248106837272644, -0.310732901096344, -0.2966551184654236, -0.2825773358345032, -0.26849955320358276, -0.25442177057266235, -0.24034398794174194, -0.22626620531082153, -0.21218842267990112, -0.1981106400489807, -0.1840328574180603, -0.1699550747871399, -0.15587729215621948, -0.14179950952529907, -0.12772172689437866, -0.11364394426345825, -0.09956616163253784, -0.08548837900161743, -0.07141059637069702, -0.05733281373977661, -0.0432550311088562, -0.02917724847793579, -0.01509946584701538, -0.0010216832160949707, 0.01305609941482544, 0.02713388204574585, 0.04121166467666626, 0.05528944730758667, 0.06936722993850708, 0.08344501256942749, 0.0975227952003479, 0.11160057783126831, 0.12567836046218872, 0.13975614309310913, 0.15383392572402954, 0.16791170835494995, 0.18198949098587036, 0.19606727361679077, 0.21014505624771118, 0.2242228388786316, 0.238300621509552, 0.2523784041404724, 0.2664561867713928, 0.28053396940231323, 0.29461175203323364, 0.30868953466415405, 0.32276731729507446, 0.3368450999259949, 0.3509228825569153, 0.3650006651878357, 0.3790784478187561, 0.3931562304496765]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 7.0, 5.0, 7.0, 9.0, 11.0, 18.0, 28.0, 40.0, 81.0, 106.0, 141.0, 235.0, 379.0, 612.0, 1035.0, 1793.0, 3568.0, 7368.0, 17966.0, 58294.0, 507898.0, 3451142.0, 98614.0, 25213.0, 9634.0, 4447.0, 2297.0, 1273.0, 741.0, 420.0, 266.0, 199.0, 150.0, 92.0, 61.0, 44.0, 31.0, 22.0, 15.0, 7.0, 2.0, 7.0, 1.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0804443359375, -0.07758903503417969, -0.07473373413085938, -0.07187843322753906, -0.06902313232421875, -0.06616783142089844, -0.06331253051757812, -0.06045722961425781, -0.0576019287109375, -0.05474662780761719, -0.051891326904296875, -0.04903602600097656, -0.04618072509765625, -0.04332542419433594, -0.040470123291015625, -0.03761482238769531, -0.034759521484375, -0.03190422058105469, -0.029048919677734375, -0.026193618774414062, -0.02333831787109375, -0.020483016967773438, -0.017627716064453125, -0.014772415161132812, -0.0119171142578125, -0.009061813354492188, -0.006206512451171875, -0.0033512115478515625, -0.00049591064453125, 0.0023593902587890625, 0.005214691162109375, 0.008069992065429688, 0.01092529296875, 0.013780593872070312, 0.016635894775390625, 0.019491195678710938, 0.02234649658203125, 0.025201797485351562, 0.028057098388671875, 0.030912399291992188, 0.0337677001953125, 0.03662300109863281, 0.039478302001953125, 0.04233360290527344, 0.04518890380859375, 0.04804420471191406, 0.050899505615234375, 0.05375480651855469, 0.056610107421875, 0.05946540832519531, 0.062320709228515625, 0.06517601013183594, 0.06803131103515625, 0.07088661193847656, 0.07374191284179688, 0.07659721374511719, 0.0794525146484375, 0.08230781555175781, 0.08516311645507812, 0.08801841735839844, 0.09087371826171875, 0.09372901916503906, 0.09658432006835938, 0.09943962097167969, 0.102294921875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 5.0, 9.0, 13.0, 6.0, 19.0, 18.0, 26.0, 29.0, 33.0, 37.0, 52.0, 50.0, 49.0, 64.0, 57.0, 64.0, 67.0, 60.0, 55.0, 33.0, 37.0, 47.0, 30.0, 24.0, 21.0, 14.0, 20.0, 14.0, 6.0, 9.0, 4.0, 3.0, 3.0, 6.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0189056396484375, -0.0183560848236084, -0.017806529998779297, -0.017256975173950195, -0.016707420349121094, -0.016157865524291992, -0.01560831069946289, -0.015058755874633789, -0.014509201049804688, -0.013959646224975586, -0.013410091400146484, -0.012860536575317383, -0.012310981750488281, -0.01176142692565918, -0.011211872100830078, -0.010662317276000977, -0.010112762451171875, -0.009563207626342773, -0.009013652801513672, -0.00846409797668457, -0.007914543151855469, -0.007364988327026367, -0.006815433502197266, -0.006265878677368164, -0.0057163238525390625, -0.005166769027709961, -0.004617214202880859, -0.004067659378051758, -0.0035181045532226562, -0.0029685497283935547, -0.002418994903564453, -0.0018694400787353516, -0.00131988525390625, -0.0007703304290771484, -0.00022077560424804688, 0.0003287792205810547, 0.0008783340454101562, 0.0014278888702392578, 0.0019774436950683594, 0.002526998519897461, 0.0030765533447265625, 0.003626108169555664, 0.004175662994384766, 0.004725217819213867, 0.005274772644042969, 0.00582432746887207, 0.006373882293701172, 0.0069234371185302734, 0.007472991943359375, 0.008022546768188477, 0.008572101593017578, 0.00912165641784668, 0.009671211242675781, 0.010220766067504883, 0.010770320892333984, 0.011319875717163086, 0.011869430541992188, 0.012418985366821289, 0.01296854019165039, 0.013518095016479492, 0.014067649841308594, 0.014617204666137695, 0.015166759490966797, 0.0157163143157959, 0.016265869140625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 5.0, 11.0, 12.0, 30.0, 29.0, 41.0, 68.0, 90.0, 201.0, 369.0, 747.0, 1808.0, 4738.0, 14161.0, 60029.0, 773628.0, 3213419.0, 94480.0, 19564.0, 6198.0, 2341.0, 1042.0, 496.0, 285.0, 156.0, 100.0, 67.0, 54.0, 36.0, 28.0, 14.0, 7.0, 10.0, 9.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08697509765625, -0.08336925506591797, -0.07976341247558594, -0.0761575698852539, -0.07255172729492188, -0.06894588470458984, -0.06534004211425781, -0.06173419952392578, -0.05812835693359375, -0.05452251434326172, -0.05091667175292969, -0.047310829162597656, -0.043704986572265625, -0.040099143981933594, -0.03649330139160156, -0.03288745880126953, -0.0292816162109375, -0.02567577362060547, -0.022069931030273438, -0.018464088439941406, -0.014858245849609375, -0.011252403259277344, -0.0076465606689453125, -0.004040718078613281, -0.00043487548828125, 0.0031709671020507812, 0.0067768096923828125, 0.010382652282714844, 0.013988494873046875, 0.017594337463378906, 0.021200180053710938, 0.02480602264404297, 0.028411865234375, 0.03201770782470703, 0.03562355041503906, 0.039229393005371094, 0.042835235595703125, 0.046441078186035156, 0.05004692077636719, 0.05365276336669922, 0.05725860595703125, 0.06086444854736328, 0.06447029113769531, 0.06807613372802734, 0.07168197631835938, 0.0752878189086914, 0.07889366149902344, 0.08249950408935547, 0.0861053466796875, 0.08971118927001953, 0.09331703186035156, 0.0969228744506836, 0.10052871704101562, 0.10413455963134766, 0.10774040222167969, 0.11134624481201172, 0.11495208740234375, 0.11855792999267578, 0.12216377258300781, 0.12576961517333984, 0.12937545776367188, 0.1329813003540039, 0.13658714294433594, 0.14019298553466797, 0.143798828125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 7.0, 14.0, 11.0, 24.0, 40.0, 59.0, 93.0, 173.0, 395.0, 2043.0, 635.0, 247.0, 117.0, 72.0, 46.0, 26.0, 19.0, 5.0, 19.0, 6.0, 4.0, 6.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0232086181640625, -0.02208685874938965, -0.020965099334716797, -0.019843339920043945, -0.018721580505371094, -0.017599821090698242, -0.01647806167602539, -0.015356302261352539, -0.014234542846679688, -0.013112783432006836, -0.011991024017333984, -0.010869264602661133, -0.009747505187988281, -0.00862574577331543, -0.007503986358642578, -0.0063822269439697266, -0.005260467529296875, -0.0041387081146240234, -0.003016948699951172, -0.0018951892852783203, -0.0007734298706054688, 0.0003483295440673828, 0.0014700889587402344, 0.002591848373413086, 0.0037136077880859375, 0.004835367202758789, 0.005957126617431641, 0.007078886032104492, 0.008200645446777344, 0.009322404861450195, 0.010444164276123047, 0.011565923690795898, 0.01268768310546875, 0.013809442520141602, 0.014931201934814453, 0.016052961349487305, 0.017174720764160156, 0.018296480178833008, 0.01941823959350586, 0.02053999900817871, 0.021661758422851562, 0.022783517837524414, 0.023905277252197266, 0.025027036666870117, 0.02614879608154297, 0.02727055549621582, 0.028392314910888672, 0.029514074325561523, 0.030635833740234375, 0.03175759315490723, 0.03287935256958008, 0.03400111198425293, 0.03512287139892578, 0.03624463081359863, 0.037366390228271484, 0.038488149642944336, 0.03960990905761719, 0.04073166847229004, 0.04185342788696289, 0.04297518730163574, 0.044096946716308594, 0.045218706130981445, 0.0463404655456543, 0.04746222496032715, 0.048583984375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 12.0, 27.0, 69.0, 131.0, 277.0, 254.0, 152.0, 45.0, 30.0, 7.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13349102437496185, -0.12308056652545929, -0.11267010867595673, -0.10225965082645416, -0.0918491929769516, -0.08143873512744904, -0.07102828472852707, -0.060617826879024506, -0.05020736902952194, -0.03979691118001938, -0.029386455193161964, -0.01897599920630455, -0.008565541356801987, 0.0018449164927005768, 0.012255370616912842, 0.022665828466415405, 0.03307628631591797, 0.04348674416542053, 0.053897202014923096, 0.06430765986442566, 0.07471811771392822, 0.08512857556343079, 0.09553902596235275, 0.10594948381185532, 0.11635994166135788, 0.12677039206027985, 0.1371808499097824, 0.14759130775928497, 0.15800176560878754, 0.1684122234582901, 0.17882268130779266, 0.18923313915729523, 0.1996435821056366, 0.21005403995513916, 0.22046449780464172, 0.2308749556541443, 0.24128541350364685, 0.2516958713531494, 0.262106329202652, 0.27251678705215454, 0.2829272449016571, 0.29333770275115967, 0.30374816060066223, 0.3141586184501648, 0.32456907629966736, 0.3349795341491699, 0.3453899919986725, 0.35580044984817505, 0.3662108778953552, 0.3766213357448578, 0.38703179359436035, 0.3974422514438629, 0.4078527092933655, 0.41826316714286804, 0.4286736249923706, 0.43908408284187317, 0.44949454069137573, 0.4599049985408783, 0.47031545639038086, 0.4807259142398834, 0.491136372089386, 0.5015468001365662, 0.5119572877883911, 0.5223677158355713, 0.5327782034873962]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 3.0, 9.0, 0.0, 4.0, 4.0, 7.0, 8.0, 11.0, 19.0, 13.0, 28.0, 13.0, 20.0, 26.0, 31.0, 20.0, 25.0, 38.0, 47.0, 58.0, 34.0, 53.0, 49.0, 37.0, 39.0, 42.0, 34.0, 42.0, 34.0, 41.0, 28.0, 25.0, 31.0, 26.0, 15.0, 24.0, 14.0, 13.0, 10.0, 3.0, 7.0, 6.0, 4.0, 4.0, 6.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09318786859512329, -0.0903608500957489, -0.08753383159637451, -0.08470682054758072, -0.08187980204820633, -0.07905278354883194, -0.07622577250003815, -0.07339875400066376, -0.07057173550128937, -0.06774471700191498, -0.06491769850254059, -0.062090687453746796, -0.059263668954372406, -0.056436650454998016, -0.053609635680913925, -0.050782620906829834, -0.047955602407455444, -0.045128583908081055, -0.042301569133996964, -0.03947455435991287, -0.03664753586053848, -0.03382051736116409, -0.030993502587080002, -0.02816648595035076, -0.02533946931362152, -0.02251245267689228, -0.01968543604016304, -0.0168584194034338, -0.01403140276670456, -0.011204386129975319, -0.008377369493246078, -0.005550352856516838, -0.0027233362197875977, 0.00010368041694164276, 0.002930697053670883, 0.005757713690400124, 0.008584730327129364, 0.011411746963858604, 0.014238763600587845, 0.017065780237317085, 0.019892796874046326, 0.022719813510775566, 0.025546830147504807, 0.028373846784234047, 0.031200863420963287, 0.03402788192033768, 0.03685489669442177, 0.03968191146850586, 0.04250892996788025, 0.04533594846725464, 0.04816296324133873, 0.05098997801542282, 0.05381699651479721, 0.0566440150141716, 0.05947102978825569, 0.06229804456233978, 0.06512506306171417, 0.06795208156108856, 0.07077910006046295, 0.07360611110925674, 0.07643312960863113, 0.07926014810800552, 0.08208715915679932, 0.0849141776561737, 0.0877411961555481]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 8.0, 10.0, 8.0, 13.0, 17.0, 31.0, 32.0, 51.0, 80.0, 112.0, 185.0, 252.0, 421.0, 667.0, 952.0, 1607.0, 2761.0, 4824.0, 8505.0, 15951.0, 31413.0, 62896.0, 131228.0, 254376.0, 261716.0, 135650.0, 65164.0, 32220.0, 16498.0, 8725.0, 4844.0, 2761.0, 1609.0, 1015.0, 661.0, 443.0, 266.0, 187.0, 118.0, 86.0, 49.0, 46.0, 27.0, 18.0, 17.0, 8.0, 7.0, 9.0, 6.0, 4.0, 2.0, 2.0], "bins": [-0.05615234375, -0.054593563079833984, -0.05303478240966797, -0.05147600173950195, -0.04991722106933594, -0.04835844039916992, -0.046799659729003906, -0.04524087905883789, -0.043682098388671875, -0.04212331771850586, -0.040564537048339844, -0.03900575637817383, -0.03744697570800781, -0.0358881950378418, -0.03432941436767578, -0.032770633697509766, -0.03121185302734375, -0.029653072357177734, -0.02809429168701172, -0.026535511016845703, -0.024976730346679688, -0.023417949676513672, -0.021859169006347656, -0.02030038833618164, -0.018741607666015625, -0.01718282699584961, -0.015624046325683594, -0.014065265655517578, -0.012506484985351562, -0.010947704315185547, -0.009388923645019531, -0.007830142974853516, -0.0062713623046875, -0.004712581634521484, -0.0031538009643554688, -0.0015950202941894531, -3.62396240234375e-05, 0.0015225410461425781, 0.0030813217163085938, 0.004640102386474609, 0.006198883056640625, 0.007757663726806641, 0.009316444396972656, 0.010875225067138672, 0.012434005737304688, 0.013992786407470703, 0.015551567077636719, 0.017110347747802734, 0.01866912841796875, 0.020227909088134766, 0.02178668975830078, 0.023345470428466797, 0.024904251098632812, 0.026463031768798828, 0.028021812438964844, 0.02958059310913086, 0.031139373779296875, 0.03269815444946289, 0.034256935119628906, 0.03581571578979492, 0.03737449645996094, 0.03893327713012695, 0.04049205780029297, 0.042050838470458984, 0.043609619140625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 6.0, 6.0, 7.0, 7.0, 13.0, 19.0, 24.0, 28.0, 28.0, 53.0, 39.0, 45.0, 63.0, 64.0, 53.0, 62.0, 65.0, 63.0, 63.0, 40.0, 51.0, 47.0, 29.0, 21.0, 25.0, 17.0, 13.0, 12.0, 6.0, 6.0, 8.0, 7.0, 1.0, 5.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0204620361328125, -0.01987171173095703, -0.019281387329101562, -0.018691062927246094, -0.018100738525390625, -0.017510414123535156, -0.016920089721679688, -0.01632976531982422, -0.01573944091796875, -0.015149116516113281, -0.014558792114257812, -0.013968467712402344, -0.013378143310546875, -0.012787818908691406, -0.012197494506835938, -0.011607170104980469, -0.011016845703125, -0.010426521301269531, -0.009836196899414062, -0.009245872497558594, -0.008655548095703125, -0.008065223693847656, -0.0074748992919921875, -0.006884574890136719, -0.00629425048828125, -0.005703926086425781, -0.0051136016845703125, -0.004523277282714844, -0.003932952880859375, -0.0033426284790039062, -0.0027523040771484375, -0.0021619796752929688, -0.0015716552734375, -0.0009813308715820312, -0.0003910064697265625, 0.00019931793212890625, 0.000789642333984375, 0.0013799667358398438, 0.0019702911376953125, 0.0025606155395507812, 0.00315093994140625, 0.0037412643432617188, 0.0043315887451171875, 0.004921913146972656, 0.005512237548828125, 0.006102561950683594, 0.0066928863525390625, 0.007283210754394531, 0.00787353515625, 0.008463859558105469, 0.009054183959960938, 0.009644508361816406, 0.010234832763671875, 0.010825157165527344, 0.011415481567382812, 0.012005805969238281, 0.01259613037109375, 0.013186454772949219, 0.013776779174804688, 0.014367103576660156, 0.014957427978515625, 0.015547752380371094, 0.016138076782226562, 0.01672840118408203, 0.0173187255859375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 6.0, 10.0, 5.0, 11.0, 13.0, 20.0, 36.0, 49.0, 72.0, 103.0, 180.0, 214.0, 367.0, 627.0, 1144.0, 2440.0, 5743.0, 17459.0, 62121.0, 246050.0, 473241.0, 172974.0, 43915.0, 12901.0, 4458.0, 1951.0, 953.0, 532.0, 320.0, 213.0, 128.0, 83.0, 69.0, 51.0, 28.0, 20.0, 18.0, 12.0, 13.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06781005859375, -0.06533241271972656, -0.06285476684570312, -0.06037712097167969, -0.05789947509765625, -0.05542182922363281, -0.052944183349609375, -0.05046653747558594, -0.0479888916015625, -0.04551124572753906, -0.043033599853515625, -0.04055595397949219, -0.03807830810546875, -0.03560066223144531, -0.033123016357421875, -0.030645370483398438, -0.028167724609375, -0.025690078735351562, -0.023212432861328125, -0.020734786987304688, -0.01825714111328125, -0.015779495239257812, -0.013301849365234375, -0.010824203491210938, -0.0083465576171875, -0.0058689117431640625, -0.003391265869140625, -0.0009136199951171875, 0.00156402587890625, 0.0040416717529296875, 0.006519317626953125, 0.008996963500976562, 0.011474609375, 0.013952255249023438, 0.016429901123046875, 0.018907546997070312, 0.02138519287109375, 0.023862838745117188, 0.026340484619140625, 0.028818130493164062, 0.0312957763671875, 0.03377342224121094, 0.036251068115234375, 0.03872871398925781, 0.04120635986328125, 0.04368400573730469, 0.046161651611328125, 0.04863929748535156, 0.051116943359375, 0.05359458923339844, 0.056072235107421875, 0.05854988098144531, 0.06102752685546875, 0.06350517272949219, 0.06598281860351562, 0.06846046447753906, 0.0709381103515625, 0.07341575622558594, 0.07589340209960938, 0.07837104797363281, 0.08084869384765625, 0.08332633972167969, 0.08580398559570312, 0.08828163146972656, 0.09075927734375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 1.0, 7.0, 4.0, 3.0, 6.0, 12.0, 17.0, 20.0, 18.0, 18.0, 21.0, 24.0, 32.0, 34.0, 31.0, 41.0, 42.0, 49.0, 42.0, 42.0, 35.0, 41.0, 45.0, 41.0, 46.0, 38.0, 37.0, 35.0, 31.0, 26.0, 20.0, 24.0, 28.0, 19.0, 19.0, 8.0, 9.0, 6.0, 8.0, 3.0, 7.0, 7.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06634521484375, -0.06415367126464844, -0.061962127685546875, -0.05977058410644531, -0.05757904052734375, -0.05538749694824219, -0.053195953369140625, -0.05100440979003906, -0.0488128662109375, -0.04662132263183594, -0.044429779052734375, -0.04223823547363281, -0.04004669189453125, -0.03785514831542969, -0.035663604736328125, -0.03347206115722656, -0.031280517578125, -0.029088973999023438, -0.026897430419921875, -0.024705886840820312, -0.02251434326171875, -0.020322799682617188, -0.018131256103515625, -0.015939712524414062, -0.0137481689453125, -0.011556625366210938, -0.009365081787109375, -0.0071735382080078125, -0.00498199462890625, -0.0027904510498046875, -0.000598907470703125, 0.0015926361083984375, 0.0037841796875, 0.0059757232666015625, 0.008167266845703125, 0.010358810424804688, 0.01255035400390625, 0.014741897583007812, 0.016933441162109375, 0.019124984741210938, 0.0213165283203125, 0.023508071899414062, 0.025699615478515625, 0.027891159057617188, 0.03008270263671875, 0.03227424621582031, 0.034465789794921875, 0.03665733337402344, 0.038848876953125, 0.04104042053222656, 0.043231964111328125, 0.04542350769042969, 0.04761505126953125, 0.04980659484863281, 0.051998138427734375, 0.05418968200683594, 0.0563812255859375, 0.05857276916503906, 0.060764312744140625, 0.06295585632324219, 0.06514739990234375, 0.06733894348144531, 0.06953048706054688, 0.07172203063964844, 0.07391357421875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 4.0, 1.0, 7.0, 10.0, 10.0, 17.0, 24.0, 27.0, 50.0, 92.0, 109.0, 199.0, 366.0, 721.0, 1673.0, 3668.0, 10462.0, 39419.0, 227914.0, 585868.0, 137671.0, 26701.0, 7812.0, 3025.0, 1254.0, 654.0, 325.0, 167.0, 82.0, 61.0, 43.0, 33.0, 20.0, 24.0, 15.0, 7.0, 5.0, 5.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04254150390625, -0.04114055633544922, -0.03973960876464844, -0.038338661193847656, -0.036937713623046875, -0.035536766052246094, -0.03413581848144531, -0.03273487091064453, -0.03133392333984375, -0.02993297576904297, -0.028532028198242188, -0.027131080627441406, -0.025730133056640625, -0.024329185485839844, -0.022928237915039062, -0.02152729034423828, -0.0201263427734375, -0.01872539520263672, -0.017324447631835938, -0.015923500061035156, -0.014522552490234375, -0.013121604919433594, -0.011720657348632812, -0.010319709777832031, -0.00891876220703125, -0.007517814636230469, -0.0061168670654296875, -0.004715919494628906, -0.003314971923828125, -0.0019140243530273438, -0.0005130767822265625, 0.0008878707885742188, 0.002288818359375, 0.0036897659301757812, 0.0050907135009765625, 0.006491661071777344, 0.007892608642578125, 0.009293556213378906, 0.010694503784179688, 0.012095451354980469, 0.01349639892578125, 0.014897346496582031, 0.016298294067382812, 0.017699241638183594, 0.019100189208984375, 0.020501136779785156, 0.021902084350585938, 0.02330303192138672, 0.0247039794921875, 0.02610492706298828, 0.027505874633789062, 0.028906822204589844, 0.030307769775390625, 0.031708717346191406, 0.03310966491699219, 0.03451061248779297, 0.03591156005859375, 0.03731250762939453, 0.03871345520019531, 0.040114402770996094, 0.041515350341796875, 0.042916297912597656, 0.04431724548339844, 0.04571819305419922, 0.047119140625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 6.0, 12.0, 11.0, 26.0, 22.0, 34.0, 41.0, 74.0, 74.0, 115.0, 100.0, 116.0, 96.0, 76.0, 60.0, 30.0, 25.0, 27.0, 13.0, 11.0, 6.0, 1.0, 6.0, 4.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0279159545898438e-05, -2.9056333005428314e-05, -2.783350646495819e-05, -2.6610679924488068e-05, -2.5387853384017944e-05, -2.416502684354782e-05, -2.2942200303077698e-05, -2.1719373762607574e-05, -2.049654722213745e-05, -1.9273720681667328e-05, -1.8050894141197205e-05, -1.682806760072708e-05, -1.5605241060256958e-05, -1.4382414519786835e-05, -1.3159587979316711e-05, -1.1936761438846588e-05, -1.0713934898376465e-05, -9.491108357906342e-06, -8.268281817436218e-06, -7.045455276966095e-06, -5.822628736495972e-06, -4.599802196025848e-06, -3.376975655555725e-06, -2.154149115085602e-06, -9.313225746154785e-07, 2.915039658546448e-07, 1.514330506324768e-06, 2.7371570467948914e-06, 3.959983587265015e-06, 5.182810127735138e-06, 6.405636668205261e-06, 7.6284632086753845e-06, 8.851289749145508e-06, 1.0074116289615631e-05, 1.1296942830085754e-05, 1.2519769370555878e-05, 1.3742595911026001e-05, 1.4965422451496124e-05, 1.6188248991966248e-05, 1.741107553243637e-05, 1.8633902072906494e-05, 1.9856728613376617e-05, 2.107955515384674e-05, 2.2302381694316864e-05, 2.3525208234786987e-05, 2.474803477525711e-05, 2.5970861315727234e-05, 2.7193687856197357e-05, 2.841651439666748e-05, 2.9639340937137604e-05, 3.086216747760773e-05, 3.208499401807785e-05, 3.3307820558547974e-05, 3.45306470990181e-05, 3.575347363948822e-05, 3.6976300179958344e-05, 3.819912672042847e-05, 3.942195326089859e-05, 4.064477980136871e-05, 4.186760634183884e-05, 4.309043288230896e-05, 4.431325942277908e-05, 4.5536085963249207e-05, 4.675891250371933e-05, 4.798173904418945e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 7.0, 11.0, 12.0, 30.0, 35.0, 41.0, 74.0, 107.0, 192.0, 310.0, 631.0, 1326.0, 3038.0, 8449.0, 29151.0, 171937.0, 625424.0, 165405.0, 28482.0, 8120.0, 3013.0, 1236.0, 662.0, 321.0, 206.0, 103.0, 73.0, 52.0, 30.0, 19.0, 11.0, 8.0, 8.0, 10.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.042205810546875, -0.04082155227661133, -0.039437294006347656, -0.038053035736083984, -0.03666877746582031, -0.03528451919555664, -0.03390026092529297, -0.0325160026550293, -0.031131744384765625, -0.029747486114501953, -0.02836322784423828, -0.02697896957397461, -0.025594711303710938, -0.024210453033447266, -0.022826194763183594, -0.021441936492919922, -0.02005767822265625, -0.018673419952392578, -0.017289161682128906, -0.015904903411865234, -0.014520645141601562, -0.01313638687133789, -0.011752128601074219, -0.010367870330810547, -0.008983612060546875, -0.007599353790283203, -0.006215095520019531, -0.004830837249755859, -0.0034465789794921875, -0.0020623207092285156, -0.0006780624389648438, 0.0007061958312988281, 0.0020904541015625, 0.003474712371826172, 0.004858970642089844, 0.006243228912353516, 0.0076274871826171875, 0.00901174545288086, 0.010396003723144531, 0.011780261993408203, 0.013164520263671875, 0.014548778533935547, 0.01593303680419922, 0.01731729507446289, 0.018701553344726562, 0.020085811614990234, 0.021470069885253906, 0.022854328155517578, 0.02423858642578125, 0.025622844696044922, 0.027007102966308594, 0.028391361236572266, 0.029775619506835938, 0.03115987777709961, 0.03254413604736328, 0.03392839431762695, 0.035312652587890625, 0.0366969108581543, 0.03808116912841797, 0.03946542739868164, 0.04084968566894531, 0.042233943939208984, 0.043618202209472656, 0.04500246047973633, 0.04638671875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 4.0, 7.0, 8.0, 13.0, 15.0, 26.0, 28.0, 29.0, 61.0, 71.0, 63.0, 90.0, 103.0, 77.0, 86.0, 72.0, 58.0, 53.0, 33.0, 19.0, 17.0, 16.0, 14.0, 7.0, 3.0, 3.0, 5.0, 6.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0300140380859375, -0.02901434898376465, -0.028014659881591797, -0.027014970779418945, -0.026015281677246094, -0.025015592575073242, -0.02401590347290039, -0.02301621437072754, -0.022016525268554688, -0.021016836166381836, -0.020017147064208984, -0.019017457962036133, -0.01801776885986328, -0.01701807975769043, -0.016018390655517578, -0.015018701553344727, -0.014019012451171875, -0.013019323348999023, -0.012019634246826172, -0.01101994514465332, -0.010020256042480469, -0.009020566940307617, -0.008020877838134766, -0.007021188735961914, -0.0060214996337890625, -0.005021810531616211, -0.004022121429443359, -0.003022432327270508, -0.0020227432250976562, -0.0010230541229248047, -2.3365020751953125e-05, 0.0009763240814208984, 0.00197601318359375, 0.0029757022857666016, 0.003975391387939453, 0.004975080490112305, 0.005974769592285156, 0.006974458694458008, 0.00797414779663086, 0.008973836898803711, 0.009973526000976562, 0.010973215103149414, 0.011972904205322266, 0.012972593307495117, 0.013972282409667969, 0.01497197151184082, 0.015971660614013672, 0.016971349716186523, 0.017971038818359375, 0.018970727920532227, 0.019970417022705078, 0.02097010612487793, 0.02196979522705078, 0.022969484329223633, 0.023969173431396484, 0.024968862533569336, 0.025968551635742188, 0.02696824073791504, 0.02796792984008789, 0.028967618942260742, 0.029967308044433594, 0.030966997146606445, 0.0319666862487793, 0.03296637535095215, 0.033966064453125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 18.0, 22.0, 26.0, 56.0, 72.0, 111.0, 151.0, 119.0, 141.0, 102.0, 71.0, 51.0, 22.0, 15.0, 7.0, 8.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3377261459827423, -0.3202654719352722, -0.3028047978878021, -0.28534412384033203, -0.26788341999053955, -0.25042277574539185, -0.23296207189559937, -0.21550139784812927, -0.19804072380065918, -0.1805800497531891, -0.163119375705719, -0.1456586867570877, -0.12819801270961761, -0.11073733866214752, -0.09327665716409683, -0.07581597566604614, -0.05835530161857605, -0.04089462384581566, -0.023433946073055267, -0.005973268300294876, 0.011487409472465515, 0.028948083519935608, 0.0464087650179863, 0.06386944651603699, 0.08133012056350708, 0.09879079461097717, 0.11625147610902786, 0.13371215760707855, 0.15117283165454865, 0.16863350570201874, 0.18609419465065002, 0.20355486869812012, 0.2210155725479126, 0.2384762465953827, 0.2559369206428528, 0.2733975946903229, 0.29085826873779297, 0.30831897258758545, 0.32577964663505554, 0.34324032068252563, 0.3607009947299957, 0.3781616687774658, 0.3956223428249359, 0.413083016872406, 0.4305437207221985, 0.4480043649673462, 0.46546506881713867, 0.48292574286460876, 0.5003864169120789, 0.5178471207618713, 0.535307765007019, 0.5527684688568115, 0.5702291131019592, 0.5876898169517517, 0.6051504611968994, 0.6226111650466919, 0.6400718688964844, 0.6575325727462769, 0.6749932169914246, 0.692453920841217, 0.7099145650863647, 0.7273752689361572, 0.7448359131813049, 0.7622966170310974, 0.7797572612762451]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 6.0, 2.0, 3.0, 4.0, 9.0, 8.0, 13.0, 8.0, 15.0, 21.0, 21.0, 29.0, 25.0, 32.0, 44.0, 38.0, 51.0, 51.0, 52.0, 61.0, 62.0, 45.0, 50.0, 45.0, 42.0, 39.0, 38.0, 25.0, 27.0, 22.0, 25.0, 16.0, 20.0, 16.0, 16.0, 9.0, 6.0, 5.0, 6.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43339109420776367, -0.4191264510154724, -0.40486177802085876, -0.3905971348285675, -0.37633249163627625, -0.3620678186416626, -0.34780317544937134, -0.3335385322570801, -0.3192738890647888, -0.30500924587249756, -0.2907445728778839, -0.27647992968559265, -0.2622152864933014, -0.24795062839984894, -0.23368597030639648, -0.21942132711410522, -0.20515665411949158, -0.19089199602603912, -0.17662735283374786, -0.1623626947402954, -0.14809805154800415, -0.1338333934545517, -0.11956873536109924, -0.10530408471822739, -0.09103943407535553, -0.07677478343248367, -0.06251013278961182, -0.04824547469615936, -0.033980824053287506, -0.01971617341041565, -0.005451515316963196, 0.008813135325908661, 0.023077785968780518, 0.037342436611652374, 0.05160709097981453, 0.06587174534797668, 0.08013639599084854, 0.0944010466337204, 0.10866570472717285, 0.12293035537004471, 0.13719500601291656, 0.15145966410636902, 0.16572430729866028, 0.17998896539211273, 0.19425362348556519, 0.20851826667785645, 0.2227829247713089, 0.23704758286476135, 0.2513122260570526, 0.26557686924934387, 0.2798415422439575, 0.2941061854362488, 0.30837082862854004, 0.3226354718208313, 0.33690014481544495, 0.3511647880077362, 0.36542946100234985, 0.3796941041946411, 0.39395877718925476, 0.408223420381546, 0.4224880635738373, 0.4367527365684509, 0.4510173797607422, 0.46528202295303345, 0.4795466661453247]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 5.0, 3.0, 7.0, 7.0, 15.0, 24.0, 41.0, 47.0, 72.0, 124.0, 182.0, 330.0, 465.0, 855.0, 1526.0, 2742.0, 5600.0, 12451.0, 32995.0, 116116.0, 2611960.0, 1256076.0, 100176.0, 29441.0, 11362.0, 5294.0, 2673.0, 1488.0, 842.0, 492.0, 309.0, 167.0, 113.0, 72.0, 78.0, 49.0, 31.0, 23.0, 8.0, 10.0, 6.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.07763671875, -0.07541561126708984, -0.07319450378417969, -0.07097339630126953, -0.06875228881835938, -0.06653118133544922, -0.06431007385253906, -0.062088966369628906, -0.05986785888671875, -0.057646751403808594, -0.05542564392089844, -0.05320453643798828, -0.050983428955078125, -0.04876232147216797, -0.04654121398925781, -0.044320106506347656, -0.0420989990234375, -0.039877891540527344, -0.03765678405761719, -0.03543567657470703, -0.033214569091796875, -0.03099346160888672, -0.028772354125976562, -0.026551246643066406, -0.02433013916015625, -0.022109031677246094, -0.019887924194335938, -0.01766681671142578, -0.015445709228515625, -0.013224601745605469, -0.011003494262695312, -0.008782386779785156, -0.006561279296875, -0.004340171813964844, -0.0021190643310546875, 0.00010204315185546875, 0.002323150634765625, 0.004544258117675781, 0.0067653656005859375, 0.008986473083496094, 0.01120758056640625, 0.013428688049316406, 0.015649795532226562, 0.01787090301513672, 0.020092010498046875, 0.02231311798095703, 0.024534225463867188, 0.026755332946777344, 0.0289764404296875, 0.031197547912597656, 0.03341865539550781, 0.03563976287841797, 0.037860870361328125, 0.04008197784423828, 0.04230308532714844, 0.044524192810058594, 0.04674530029296875, 0.048966407775878906, 0.05118751525878906, 0.05340862274169922, 0.055629730224609375, 0.05785083770751953, 0.06007194519042969, 0.062293052673339844, 0.06451416015625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 0.0, 1.0, 4.0, 6.0, 9.0, 4.0, 11.0, 9.0, 21.0, 17.0, 21.0, 28.0, 34.0, 39.0, 53.0, 58.0, 53.0, 51.0, 56.0, 57.0, 45.0, 71.0, 52.0, 58.0, 41.0, 41.0, 33.0, 29.0, 21.0, 18.0, 16.0, 4.0, 9.0, 8.0, 11.0, 2.0, 5.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.01776123046875, -0.017196178436279297, -0.016631126403808594, -0.01606607437133789, -0.015501022338867188, -0.014935970306396484, -0.014370918273925781, -0.013805866241455078, -0.013240814208984375, -0.012675762176513672, -0.012110710144042969, -0.011545658111572266, -0.010980606079101562, -0.01041555404663086, -0.009850502014160156, -0.009285449981689453, -0.00872039794921875, -0.008155345916748047, -0.007590293884277344, -0.007025241851806641, -0.0064601898193359375, -0.005895137786865234, -0.005330085754394531, -0.004765033721923828, -0.004199981689453125, -0.003634929656982422, -0.0030698776245117188, -0.0025048255920410156, -0.0019397735595703125, -0.0013747215270996094, -0.0008096694946289062, -0.0002446174621582031, 0.0003204345703125, 0.0008854866027832031, 0.0014505386352539062, 0.0020155906677246094, 0.0025806427001953125, 0.0031456947326660156, 0.0037107467651367188, 0.004275798797607422, 0.004840850830078125, 0.005405902862548828, 0.005970954895019531, 0.006536006927490234, 0.0071010589599609375, 0.007666110992431641, 0.008231163024902344, 0.008796215057373047, 0.00936126708984375, 0.009926319122314453, 0.010491371154785156, 0.01105642318725586, 0.011621475219726562, 0.012186527252197266, 0.012751579284667969, 0.013316631317138672, 0.013881683349609375, 0.014446735382080078, 0.015011787414550781, 0.015576839447021484, 0.016141891479492188, 0.01670694351196289, 0.017271995544433594, 0.017837047576904297, 0.018402099609375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 4.0, 10.0, 11.0, 18.0, 29.0, 70.0, 95.0, 197.0, 394.0, 828.0, 1912.0, 4823.0, 13501.0, 46696.0, 278781.0, 3484700.0, 293013.0, 47539.0, 13437.0, 4719.0, 1810.0, 833.0, 405.0, 209.0, 107.0, 56.0, 21.0, 21.0, 9.0, 13.0, 5.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.1243896484375, -0.12139320373535156, -0.11839675903320312, -0.11540031433105469, -0.11240386962890625, -0.10940742492675781, -0.10641098022460938, -0.10341453552246094, -0.1004180908203125, -0.09742164611816406, -0.09442520141601562, -0.09142875671386719, -0.08843231201171875, -0.08543586730957031, -0.08243942260742188, -0.07944297790527344, -0.076446533203125, -0.07345008850097656, -0.07045364379882812, -0.06745719909667969, -0.06446075439453125, -0.06146430969238281, -0.058467864990234375, -0.05547142028808594, -0.0524749755859375, -0.04947853088378906, -0.046482086181640625, -0.04348564147949219, -0.04048919677734375, -0.03749275207519531, -0.034496307373046875, -0.03149986267089844, -0.02850341796875, -0.025506973266601562, -0.022510528564453125, -0.019514083862304688, -0.01651763916015625, -0.013521194458007812, -0.010524749755859375, -0.0075283050537109375, -0.0045318603515625, -0.0015354156494140625, 0.001461029052734375, 0.0044574737548828125, 0.00745391845703125, 0.010450363159179688, 0.013446807861328125, 0.016443252563476562, 0.019439697265625, 0.022436141967773438, 0.025432586669921875, 0.028429031372070312, 0.03142547607421875, 0.03442192077636719, 0.037418365478515625, 0.04041481018066406, 0.0434112548828125, 0.04640769958496094, 0.049404144287109375, 0.05240058898925781, 0.05539703369140625, 0.05839347839355469, 0.061389923095703125, 0.06438636779785156, 0.0673828125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 1.0, 9.0, 7.0, 11.0, 9.0, 10.0, 22.0, 25.0, 25.0, 39.0, 69.0, 86.0, 166.0, 275.0, 608.0, 1476.0, 545.0, 268.0, 140.0, 84.0, 56.0, 32.0, 34.0, 24.0, 18.0, 10.0, 4.0, 3.0, 12.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0379638671875, -0.03682994842529297, -0.03569602966308594, -0.034562110900878906, -0.033428192138671875, -0.032294273376464844, -0.031160354614257812, -0.03002643585205078, -0.02889251708984375, -0.02775859832763672, -0.026624679565429688, -0.025490760803222656, -0.024356842041015625, -0.023222923278808594, -0.022089004516601562, -0.02095508575439453, -0.0198211669921875, -0.01868724822998047, -0.017553329467773438, -0.016419410705566406, -0.015285491943359375, -0.014151573181152344, -0.013017654418945312, -0.011883735656738281, -0.01074981689453125, -0.009615898132324219, -0.008481979370117188, -0.007348060607910156, -0.006214141845703125, -0.005080223083496094, -0.0039463043212890625, -0.0028123855590820312, -0.001678466796875, -0.0005445480346679688, 0.0005893707275390625, 0.0017232894897460938, 0.002857208251953125, 0.003991127014160156, 0.0051250457763671875, 0.006258964538574219, 0.00739288330078125, 0.008526802062988281, 0.009660720825195312, 0.010794639587402344, 0.011928558349609375, 0.013062477111816406, 0.014196395874023438, 0.015330314636230469, 0.0164642333984375, 0.01759815216064453, 0.018732070922851562, 0.019865989685058594, 0.020999908447265625, 0.022133827209472656, 0.023267745971679688, 0.02440166473388672, 0.02553558349609375, 0.02666950225830078, 0.027803421020507812, 0.028937339782714844, 0.030071258544921875, 0.031205177307128906, 0.03233909606933594, 0.03347301483154297, 0.03460693359375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 14.0, 64.0, 272.0, 414.0, 202.0, 30.0, 11.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2561997175216675, -1.2291288375854492, -1.202057957649231, -1.1749869585037231, -1.1479160785675049, -1.1208451986312866, -1.0937743186950684, -1.0667033195495605, -1.0396324396133423, -1.012561559677124, -0.985490620136261, -0.9584197402000427, -0.9313488006591797, -0.9042779207229614, -0.8772069811820984, -0.8501361012458801, -0.8230651617050171, -0.7959942817687988, -0.7689233422279358, -0.7418524622917175, -0.7147815227508545, -0.6877106428146362, -0.6606397032737732, -0.6335688233375549, -0.6064979434013367, -0.5794270634651184, -0.5523561239242554, -0.5252852439880371, -0.4982143044471741, -0.4711434245109558, -0.4440724849700928, -0.4170016050338745, -0.3899306654930115, -0.3628597557544708, -0.3357888460159302, -0.3087179362773895, -0.2816470265388489, -0.2545761466026306, -0.22750522196292877, -0.20043431222438812, -0.17336340248584747, -0.14629249274730682, -0.11922158300876617, -0.09215068072080612, -0.06507977098226547, -0.03800886869430542, -0.01093795895576477, 0.01613295078277588, 0.04320386052131653, 0.07027477025985718, 0.09734567999839783, 0.12441658228635788, 0.15148749947547913, 0.17855839431285858, 0.20562930405139923, 0.23270021378993988, 0.25977110862731934, 0.28684201836586, 0.31391292810440063, 0.3409838378429413, 0.36805474758148193, 0.3951256275177002, 0.42219656705856323, 0.4492674469947815, 0.47633838653564453]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 9.0, 2.0, 0.0, 3.0, 5.0, 9.0, 5.0, 6.0, 4.0, 16.0, 13.0, 13.0, 12.0, 22.0, 12.0, 21.0, 44.0, 33.0, 41.0, 33.0, 29.0, 32.0, 49.0, 36.0, 66.0, 29.0, 54.0, 42.0, 47.0, 48.0, 35.0, 29.0, 36.0, 22.0, 13.0, 18.0, 21.0, 26.0, 15.0, 13.0, 13.0, 8.0, 8.0, 4.0, 6.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.12559539079666138, -0.12173214554786682, -0.11786890029907227, -0.11400565505027771, -0.11014240980148315, -0.1062791645526886, -0.10241591930389404, -0.09855267405509949, -0.09468942880630493, -0.09082618355751038, -0.08696293830871582, -0.08309969305992126, -0.07923644781112671, -0.07537320256233215, -0.0715099573135376, -0.06764671206474304, -0.06378346681594849, -0.05992022156715393, -0.056056976318359375, -0.05219373106956482, -0.048330485820770264, -0.04446724057197571, -0.04060399532318115, -0.0367407500743866, -0.03287750482559204, -0.029014259576797485, -0.02515101432800293, -0.021287769079208374, -0.01742452383041382, -0.013561278581619263, -0.009698033332824707, -0.005834788084030151, -0.0019715428352355957, 0.00189170241355896, 0.005754947662353516, 0.009618192911148071, 0.013481438159942627, 0.017344683408737183, 0.02120792865753174, 0.025071173906326294, 0.02893441915512085, 0.032797664403915405, 0.03666090965270996, 0.04052415490150452, 0.04438740015029907, 0.04825064539909363, 0.052113890647888184, 0.05597713589668274, 0.059840381145477295, 0.06370362639427185, 0.0675668716430664, 0.07143011689186096, 0.07529336214065552, 0.07915660738945007, 0.08301985263824463, 0.08688309788703918, 0.09074634313583374, 0.0946095883846283, 0.09847283363342285, 0.10233607888221741, 0.10619932413101196, 0.11006256937980652, 0.11392581462860107, 0.11778905987739563, 0.12165230512619019]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 10.0, 12.0, 20.0, 20.0, 22.0, 50.0, 77.0, 133.0, 213.0, 389.0, 698.0, 1182.0, 2302.0, 4781.0, 9938.0, 22600.0, 54874.0, 144223.0, 384357.0, 262352.0, 92685.0, 37247.0, 15795.0, 7141.0, 3549.0, 1694.0, 881.0, 501.0, 293.0, 197.0, 96.0, 85.0, 45.0, 26.0, 20.0, 12.0, 8.0, 6.0, 6.0, 3.0, 2.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0833740234375, -0.08090591430664062, -0.07843780517578125, -0.07596969604492188, -0.0735015869140625, -0.07103347778320312, -0.06856536865234375, -0.06609725952148438, -0.063629150390625, -0.061161041259765625, -0.05869293212890625, -0.056224822998046875, -0.0537567138671875, -0.051288604736328125, -0.04882049560546875, -0.046352386474609375, -0.04388427734375, -0.041416168212890625, -0.03894805908203125, -0.036479949951171875, -0.0340118408203125, -0.031543731689453125, -0.02907562255859375, -0.026607513427734375, -0.024139404296875, -0.021671295166015625, -0.01920318603515625, -0.016735076904296875, -0.0142669677734375, -0.011798858642578125, -0.00933074951171875, -0.006862640380859375, -0.00439453125, -0.001926422119140625, 0.00054168701171875, 0.003009796142578125, 0.0054779052734375, 0.007946014404296875, 0.01041412353515625, 0.012882232666015625, 0.015350341796875, 0.017818450927734375, 0.02028656005859375, 0.022754669189453125, 0.0252227783203125, 0.027690887451171875, 0.03015899658203125, 0.032627105712890625, 0.03509521484375, 0.037563323974609375, 0.04003143310546875, 0.042499542236328125, 0.0449676513671875, 0.047435760498046875, 0.04990386962890625, 0.052371978759765625, 0.054840087890625, 0.057308197021484375, 0.05977630615234375, 0.062244415283203125, 0.0647125244140625, 0.06718063354492188, 0.06964874267578125, 0.07211685180664062, 0.0745849609375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 0.0, 7.0, 2.0, 6.0, 8.0, 15.0, 8.0, 9.0, 27.0, 16.0, 30.0, 45.0, 36.0, 50.0, 59.0, 54.0, 57.0, 67.0, 62.0, 74.0, 69.0, 46.0, 46.0, 32.0, 37.0, 33.0, 15.0, 23.0, 19.0, 16.0, 10.0, 5.0, 6.0, 6.0, 3.0, 1.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0177764892578125, -0.01718282699584961, -0.01658916473388672, -0.015995502471923828, -0.015401840209960938, -0.014808177947998047, -0.014214515686035156, -0.013620853424072266, -0.013027191162109375, -0.012433528900146484, -0.011839866638183594, -0.011246204376220703, -0.010652542114257812, -0.010058879852294922, -0.009465217590332031, -0.00887155532836914, -0.00827789306640625, -0.007684230804443359, -0.007090568542480469, -0.006496906280517578, -0.0059032440185546875, -0.005309581756591797, -0.004715919494628906, -0.004122257232666016, -0.003528594970703125, -0.0029349327087402344, -0.0023412704467773438, -0.0017476081848144531, -0.0011539459228515625, -0.0005602836608886719, 3.337860107421875e-05, 0.0006270408630371094, 0.001220703125, 0.0018143653869628906, 0.0024080276489257812, 0.003001689910888672, 0.0035953521728515625, 0.004189014434814453, 0.004782676696777344, 0.005376338958740234, 0.005970001220703125, 0.006563663482666016, 0.007157325744628906, 0.007750988006591797, 0.008344650268554688, 0.008938312530517578, 0.009531974792480469, 0.01012563705444336, 0.01071929931640625, 0.01131296157836914, 0.011906623840332031, 0.012500286102294922, 0.013093948364257812, 0.013687610626220703, 0.014281272888183594, 0.014874935150146484, 0.015468597412109375, 0.016062259674072266, 0.016655921936035156, 0.017249584197998047, 0.017843246459960938, 0.018436908721923828, 0.01903057098388672, 0.01962423324584961, 0.0202178955078125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 5.0, 4.0, 5.0, 10.0, 14.0, 28.0, 35.0, 46.0, 72.0, 108.0, 208.0, 301.0, 496.0, 907.0, 1654.0, 3553.0, 7945.0, 20558.0, 60520.0, 186049.0, 425891.0, 225195.0, 72996.0, 24486.0, 9325.0, 3903.0, 1896.0, 927.0, 504.0, 323.0, 206.0, 118.0, 88.0, 55.0, 36.0, 24.0, 21.0, 16.0, 12.0, 6.0, 4.0, 6.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.070068359375, -0.06785011291503906, -0.06563186645507812, -0.06341361999511719, -0.06119537353515625, -0.05897712707519531, -0.056758880615234375, -0.05454063415527344, -0.0523223876953125, -0.05010414123535156, -0.047885894775390625, -0.04566764831542969, -0.04344940185546875, -0.04123115539550781, -0.039012908935546875, -0.03679466247558594, -0.034576416015625, -0.03235816955566406, -0.030139923095703125, -0.027921676635742188, -0.02570343017578125, -0.023485183715820312, -0.021266937255859375, -0.019048690795898438, -0.0168304443359375, -0.014612197875976562, -0.012393951416015625, -0.010175704956054688, -0.00795745849609375, -0.0057392120361328125, -0.003520965576171875, -0.0013027191162109375, 0.00091552734375, 0.0031337738037109375, 0.005352020263671875, 0.0075702667236328125, 0.00978851318359375, 0.012006759643554688, 0.014225006103515625, 0.016443252563476562, 0.0186614990234375, 0.020879745483398438, 0.023097991943359375, 0.025316238403320312, 0.02753448486328125, 0.029752731323242188, 0.031970977783203125, 0.03418922424316406, 0.036407470703125, 0.03862571716308594, 0.040843963623046875, 0.04306221008300781, 0.04528045654296875, 0.04749870300292969, 0.049716949462890625, 0.05193519592285156, 0.0541534423828125, 0.05637168884277344, 0.058589935302734375, 0.06080818176269531, 0.06302642822265625, 0.06524467468261719, 0.06746292114257812, 0.06968116760253906, 0.0718994140625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 0.0, 4.0, 6.0, 7.0, 8.0, 8.0, 17.0, 14.0, 15.0, 23.0, 16.0, 24.0, 27.0, 28.0, 39.0, 40.0, 33.0, 39.0, 50.0, 41.0, 44.0, 33.0, 48.0, 48.0, 42.0, 30.0, 37.0, 41.0, 27.0, 31.0, 34.0, 24.0, 22.0, 19.0, 14.0, 12.0, 10.0, 5.0, 8.0, 8.0, 3.0, 8.0, 7.0, 0.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06646728515625, -0.06432056427001953, -0.06217384338378906, -0.060027122497558594, -0.057880401611328125, -0.055733680725097656, -0.05358695983886719, -0.05144023895263672, -0.04929351806640625, -0.04714679718017578, -0.04500007629394531, -0.042853355407714844, -0.040706634521484375, -0.038559913635253906, -0.03641319274902344, -0.03426647186279297, -0.0321197509765625, -0.02997303009033203, -0.027826309204101562, -0.025679588317871094, -0.023532867431640625, -0.021386146545410156, -0.019239425659179688, -0.01709270477294922, -0.01494598388671875, -0.012799263000488281, -0.010652542114257812, -0.008505821228027344, -0.006359100341796875, -0.004212379455566406, -0.0020656585693359375, 8.106231689453125e-05, 0.002227783203125, 0.004374504089355469, 0.0065212249755859375, 0.008667945861816406, 0.010814666748046875, 0.012961387634277344, 0.015108108520507812, 0.01725482940673828, 0.01940155029296875, 0.02154827117919922, 0.023694992065429688, 0.025841712951660156, 0.027988433837890625, 0.030135154724121094, 0.03228187561035156, 0.03442859649658203, 0.0365753173828125, 0.03872203826904297, 0.04086875915527344, 0.043015480041503906, 0.045162200927734375, 0.047308921813964844, 0.04945564270019531, 0.05160236358642578, 0.05374908447265625, 0.05589580535888672, 0.05804252624511719, 0.060189247131347656, 0.062335968017578125, 0.0644826889038086, 0.06662940979003906, 0.06877613067626953, 0.0709228515625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 7.0, 6.0, 8.0, 12.0, 15.0, 19.0, 41.0, 59.0, 131.0, 258.0, 527.0, 1017.0, 2567.0, 6846.0, 22209.0, 94465.0, 536496.0, 307505.0, 53914.0, 14344.0, 4678.0, 1846.0, 749.0, 401.0, 195.0, 101.0, 61.0, 34.0, 20.0, 12.0, 6.0, 8.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061614990234375, -0.05954885482788086, -0.05748271942138672, -0.05541658401489258, -0.05335044860839844, -0.0512843132019043, -0.049218177795410156, -0.047152042388916016, -0.045085906982421875, -0.043019771575927734, -0.040953636169433594, -0.03888750076293945, -0.03682136535644531, -0.03475522994995117, -0.03268909454345703, -0.03062295913696289, -0.02855682373046875, -0.02649068832397461, -0.02442455291748047, -0.022358417510986328, -0.020292282104492188, -0.018226146697998047, -0.016160011291503906, -0.014093875885009766, -0.012027740478515625, -0.009961605072021484, -0.007895469665527344, -0.005829334259033203, -0.0037631988525390625, -0.0016970634460449219, 0.00036907196044921875, 0.0024352073669433594, 0.0045013427734375, 0.006567478179931641, 0.008633613586425781, 0.010699748992919922, 0.012765884399414062, 0.014832019805908203, 0.016898155212402344, 0.018964290618896484, 0.021030426025390625, 0.023096561431884766, 0.025162696838378906, 0.027228832244873047, 0.029294967651367188, 0.03136110305786133, 0.03342723846435547, 0.03549337387084961, 0.03755950927734375, 0.03962564468383789, 0.04169178009033203, 0.04375791549682617, 0.04582405090332031, 0.04789018630981445, 0.049956321716308594, 0.052022457122802734, 0.054088592529296875, 0.056154727935791016, 0.058220863342285156, 0.0602869987487793, 0.06235313415527344, 0.06441926956176758, 0.06648540496826172, 0.06855154037475586, 0.07061767578125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 4.0, 11.0, 22.0, 26.0, 43.0, 59.0, 81.0, 113.0, 151.0, 146.0, 129.0, 77.0, 48.0, 39.0, 28.0, 10.0, 8.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5418739318847656e-05, -4.372932016849518e-05, -4.20399010181427e-05, -4.035048186779022e-05, -3.8661062717437744e-05, -3.6971643567085266e-05, -3.528222441673279e-05, -3.359280526638031e-05, -3.190338611602783e-05, -3.0213966965675354e-05, -2.8524547815322876e-05, -2.6835128664970398e-05, -2.514570951461792e-05, -2.3456290364265442e-05, -2.1766871213912964e-05, -2.0077452063560486e-05, -1.8388032913208008e-05, -1.669861376285553e-05, -1.5009194612503052e-05, -1.3319775462150574e-05, -1.1630356311798096e-05, -9.940937161445618e-06, -8.25151801109314e-06, -6.562098860740662e-06, -4.872679710388184e-06, -3.1832605600357056e-06, -1.4938414096832275e-06, 1.955777406692505e-07, 1.8849968910217285e-06, 3.5744160413742065e-06, 5.2638351917266846e-06, 6.953254342079163e-06, 8.64267349243164e-06, 1.0332092642784119e-05, 1.2021511793136597e-05, 1.3710930943489075e-05, 1.5400350093841553e-05, 1.708976924419403e-05, 1.877918839454651e-05, 2.0468607544898987e-05, 2.2158026695251465e-05, 2.3847445845603943e-05, 2.553686499595642e-05, 2.72262841463089e-05, 2.8915703296661377e-05, 3.0605122447013855e-05, 3.229454159736633e-05, 3.398396074771881e-05, 3.567337989807129e-05, 3.736279904842377e-05, 3.9052218198776245e-05, 4.074163734912872e-05, 4.24310564994812e-05, 4.412047564983368e-05, 4.580989480018616e-05, 4.7499313950538635e-05, 4.918873310089111e-05, 5.087815225124359e-05, 5.256757140159607e-05, 5.425699055194855e-05, 5.5946409702301025e-05, 5.7635828852653503e-05, 5.932524800300598e-05, 6.101466715335846e-05, 6.270408630371094e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 1.0, 8.0, 12.0, 12.0, 21.0, 25.0, 39.0, 81.0, 123.0, 195.0, 306.0, 572.0, 1096.0, 2334.0, 5581.0, 15525.0, 51111.0, 221162.0, 549411.0, 144456.0, 36221.0, 11901.0, 4314.0, 1894.0, 913.0, 486.0, 275.0, 182.0, 96.0, 70.0, 48.0, 25.0, 19.0, 13.0, 8.0, 5.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.056732177734375, -0.05512809753417969, -0.053524017333984375, -0.05191993713378906, -0.05031585693359375, -0.04871177673339844, -0.047107696533203125, -0.04550361633300781, -0.0438995361328125, -0.04229545593261719, -0.040691375732421875, -0.03908729553222656, -0.03748321533203125, -0.03587913513183594, -0.034275054931640625, -0.03267097473144531, -0.03106689453125, -0.029462814331054688, -0.027858734130859375, -0.026254653930664062, -0.02465057373046875, -0.023046493530273438, -0.021442413330078125, -0.019838333129882812, -0.0182342529296875, -0.016630172729492188, -0.015026092529296875, -0.013422012329101562, -0.01181793212890625, -0.010213851928710938, -0.008609771728515625, -0.0070056915283203125, -0.005401611328125, -0.0037975311279296875, -0.002193450927734375, -0.0005893707275390625, 0.00101470947265625, 0.0026187896728515625, 0.004222869873046875, 0.0058269500732421875, 0.0074310302734375, 0.009035110473632812, 0.010639190673828125, 0.012243270874023438, 0.01384735107421875, 0.015451431274414062, 0.017055511474609375, 0.018659591674804688, 0.020263671875, 0.021867752075195312, 0.023471832275390625, 0.025075912475585938, 0.02667999267578125, 0.028284072875976562, 0.029888153076171875, 0.03149223327636719, 0.0330963134765625, 0.03470039367675781, 0.036304473876953125, 0.03790855407714844, 0.03951263427734375, 0.04111671447753906, 0.042720794677734375, 0.04432487487792969, 0.045928955078125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 8.0, 1.0, 4.0, 8.0, 4.0, 10.0, 14.0, 22.0, 18.0, 22.0, 32.0, 34.0, 42.0, 51.0, 92.0, 97.0, 96.0, 87.0, 76.0, 61.0, 43.0, 33.0, 39.0, 22.0, 20.0, 22.0, 15.0, 12.0, 3.0, 4.0, 4.0, 4.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.042999267578125, -0.041748046875, -0.040496826171875, -0.03924560546875, -0.037994384765625, -0.0367431640625, -0.035491943359375, -0.03424072265625, -0.032989501953125, -0.03173828125, -0.030487060546875, -0.02923583984375, -0.027984619140625, -0.0267333984375, -0.025482177734375, -0.02423095703125, -0.022979736328125, -0.021728515625, -0.020477294921875, -0.01922607421875, -0.017974853515625, -0.0167236328125, -0.015472412109375, -0.01422119140625, -0.012969970703125, -0.01171875, -0.010467529296875, -0.00921630859375, -0.007965087890625, -0.0067138671875, -0.005462646484375, -0.00421142578125, -0.002960205078125, -0.001708984375, -0.000457763671875, 0.00079345703125, 0.002044677734375, 0.0032958984375, 0.004547119140625, 0.00579833984375, 0.007049560546875, 0.00830078125, 0.009552001953125, 0.01080322265625, 0.012054443359375, 0.0133056640625, 0.014556884765625, 0.01580810546875, 0.017059326171875, 0.018310546875, 0.019561767578125, 0.02081298828125, 0.022064208984375, 0.0233154296875, 0.024566650390625, 0.02581787109375, 0.027069091796875, 0.0283203125, 0.029571533203125, 0.03082275390625, 0.032073974609375, 0.0333251953125, 0.034576416015625, 0.03582763671875, 0.037078857421875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 9.0, 42.0, 72.0, 138.0, 179.0, 187.0, 177.0, 98.0, 52.0, 23.0, 12.0, 8.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6950697302818298, -0.6665341258049011, -0.6379985213279724, -0.6094629764556885, -0.5809273719787598, -0.552391767501831, -0.5238561630249023, -0.49532055854797363, -0.4667849838733673, -0.4382493793964386, -0.4097138047218323, -0.38117820024490356, -0.35264259576797485, -0.32410702109336853, -0.2955714166164398, -0.2670358419418335, -0.23850023746490479, -0.20996464788913727, -0.18142905831336975, -0.15289345383644104, -0.12435786426067352, -0.095822274684906, -0.0672866702079773, -0.03875108063220978, -0.01021549105644226, 0.018320102244615555, 0.04685569554567337, 0.07539129257202148, 0.103926882147789, 0.13246247172355652, 0.16099807620048523, 0.18953366577625275, 0.21806931495666504, 0.24660490453243256, 0.2751404941082001, 0.3036760985851288, 0.3322116732597351, 0.3607472777366638, 0.38928288221359253, 0.41781848669052124, 0.44635406136512756, 0.4748896658420563, 0.5034252405166626, 0.5319608449935913, 0.56049644947052, 0.5890320539474487, 0.6175676584243774, 0.6461032032966614, 0.6746388077735901, 0.7031744122505188, 0.7317100167274475, 0.7602455615997314, 0.7887811660766602, 0.8173167705535889, 0.8458523750305176, 0.8743879795074463, 0.902923583984375, 0.9314591884613037, 0.9599947929382324, 0.9885303974151611, 1.0170660018920898, 1.0456016063690186, 1.0741372108459473, 1.1026726961135864, 1.1312083005905151]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 0.0, 1.0, 6.0, 6.0, 3.0, 6.0, 17.0, 19.0, 17.0, 19.0, 30.0, 30.0, 32.0, 39.0, 33.0, 47.0, 39.0, 52.0, 46.0, 60.0, 55.0, 50.0, 48.0, 57.0, 48.0, 38.0, 43.0, 36.0, 24.0, 27.0, 16.0, 15.0, 11.0, 10.0, 3.0, 8.0, 4.0, 7.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43116235733032227, -0.4161853790283203, -0.40120840072631836, -0.3862314224243164, -0.37125447392463684, -0.3562774956226349, -0.34130051732063293, -0.326323539018631, -0.3113465905189514, -0.29636961221694946, -0.2813926339149475, -0.26641565561294556, -0.251438707113266, -0.23646172881126404, -0.22148475050926208, -0.20650777220726013, -0.19153079390525818, -0.17655381560325623, -0.16157685220241547, -0.1465998739004135, -0.13162291049957275, -0.1166459321975708, -0.10166895389556885, -0.08669198304414749, -0.07171501219272614, -0.05673804134130478, -0.041761066764593124, -0.02678409218788147, -0.011807121336460114, 0.0031698495149612427, 0.018146827816963196, 0.03312379866838455, 0.04810076951980591, 0.06307774037122726, 0.07805471122264862, 0.09303168952465057, 0.10800866037607193, 0.12298563122749329, 0.13796260952949524, 0.1529395878314972, 0.16791655123233795, 0.1828935295343399, 0.19787049293518066, 0.21284747123718262, 0.22782444953918457, 0.24280141294002533, 0.2577784061431885, 0.27275535464286804, 0.28773233294487, 0.30270931124687195, 0.3176862895488739, 0.33266323804855347, 0.3476402163505554, 0.3626171946525574, 0.3775941729545593, 0.3925711512565613, 0.40754812955856323, 0.4225251078605652, 0.43750208616256714, 0.4524790644645691, 0.46745601296424866, 0.4824329912662506, 0.49740996956825256, 0.5123869180679321, 0.5273638963699341]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 5.0, 8.0, 8.0, 16.0, 26.0, 37.0, 53.0, 108.0, 158.0, 234.0, 397.0, 677.0, 1250.0, 2270.0, 4771.0, 11174.0, 29903.0, 112532.0, 3425749.0, 504155.0, 64729.0, 19988.0, 7844.0, 3713.0, 1841.0, 1062.0, 571.0, 362.0, 215.0, 137.0, 111.0, 58.0, 40.0, 28.0, 12.0, 9.0, 9.0, 6.0, 3.0, 5.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07421875, -0.07145118713378906, -0.06868362426757812, -0.06591606140136719, -0.06314849853515625, -0.06038093566894531, -0.057613372802734375, -0.05484580993652344, -0.0520782470703125, -0.04931068420410156, -0.046543121337890625, -0.04377555847167969, -0.04100799560546875, -0.03824043273925781, -0.035472869873046875, -0.03270530700683594, -0.029937744140625, -0.027170181274414062, -0.024402618408203125, -0.021635055541992188, -0.01886749267578125, -0.016099929809570312, -0.013332366943359375, -0.010564804077148438, -0.0077972412109375, -0.0050296783447265625, -0.002262115478515625, 0.0005054473876953125, 0.00327301025390625, 0.0060405731201171875, 0.008808135986328125, 0.011575698852539062, 0.01434326171875, 0.017110824584960938, 0.019878387451171875, 0.022645950317382812, 0.02541351318359375, 0.028181076049804688, 0.030948638916015625, 0.03371620178222656, 0.0364837646484375, 0.03925132751464844, 0.042018890380859375, 0.04478645324707031, 0.04755401611328125, 0.05032157897949219, 0.053089141845703125, 0.05585670471191406, 0.058624267578125, 0.06139183044433594, 0.06415939331054688, 0.06692695617675781, 0.06969451904296875, 0.07246208190917969, 0.07522964477539062, 0.07799720764160156, 0.0807647705078125, 0.08353233337402344, 0.08629989624023438, 0.08906745910644531, 0.09183502197265625, 0.09460258483886719, 0.09737014770507812, 0.10013771057128906, 0.1029052734375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 10.0, 4.0, 9.0, 9.0, 11.0, 18.0, 25.0, 43.0, 38.0, 48.0, 67.0, 57.0, 78.0, 53.0, 69.0, 72.0, 65.0, 64.0, 52.0, 44.0, 44.0, 29.0, 14.0, 32.0, 10.0, 11.0, 7.0, 2.0, 4.0, 6.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0169219970703125, -0.016196012496948242, -0.015470027923583984, -0.014744043350219727, -0.014018058776855469, -0.013292074203491211, -0.012566089630126953, -0.011840105056762695, -0.011114120483398438, -0.01038813591003418, -0.009662151336669922, -0.008936166763305664, -0.008210182189941406, -0.0074841976165771484, -0.006758213043212891, -0.006032228469848633, -0.005306243896484375, -0.004580259323120117, -0.0038542747497558594, -0.0031282901763916016, -0.0024023056030273438, -0.001676321029663086, -0.0009503364562988281, -0.0002243518829345703, 0.0005016326904296875, 0.0012276172637939453, 0.001953601837158203, 0.002679586410522461, 0.0034055709838867188, 0.0041315555572509766, 0.004857540130615234, 0.005583524703979492, 0.00630950927734375, 0.007035493850708008, 0.007761478424072266, 0.008487462997436523, 0.009213447570800781, 0.009939432144165039, 0.010665416717529297, 0.011391401290893555, 0.012117385864257812, 0.01284337043762207, 0.013569355010986328, 0.014295339584350586, 0.015021324157714844, 0.0157473087310791, 0.01647329330444336, 0.017199277877807617, 0.017925262451171875, 0.018651247024536133, 0.01937723159790039, 0.02010321617126465, 0.020829200744628906, 0.021555185317993164, 0.022281169891357422, 0.02300715446472168, 0.023733139038085938, 0.024459123611450195, 0.025185108184814453, 0.02591109275817871, 0.02663707733154297, 0.027363061904907227, 0.028089046478271484, 0.028815031051635742, 0.029541015625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 5.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 6.0, 13.0, 12.0, 23.0, 44.0, 46.0, 80.0, 100.0, 162.0, 235.0, 337.0, 501.0, 725.0, 1105.0, 1742.0, 2813.0, 4485.0, 7744.0, 13434.0, 25155.0, 52981.0, 135021.0, 644599.0, 2866360.0, 266990.0, 85334.0, 37628.0, 19226.0, 10745.0, 6177.0, 3777.0, 2313.0, 1460.0, 972.0, 580.0, 459.0, 287.0, 175.0, 111.0, 112.0, 80.0, 48.0, 20.0, 27.0, 16.0, 8.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.053863525390625, -0.05214071273803711, -0.05041790008544922, -0.04869508743286133, -0.04697227478027344, -0.04524946212768555, -0.043526649475097656, -0.041803836822509766, -0.040081024169921875, -0.038358211517333984, -0.036635398864746094, -0.0349125862121582, -0.03318977355957031, -0.03146696090698242, -0.02974414825439453, -0.02802133560180664, -0.02629852294921875, -0.02457571029663086, -0.02285289764404297, -0.021130084991455078, -0.019407272338867188, -0.017684459686279297, -0.015961647033691406, -0.014238834381103516, -0.012516021728515625, -0.010793209075927734, -0.009070396423339844, -0.007347583770751953, -0.0056247711181640625, -0.003901958465576172, -0.0021791458129882812, -0.0004563331604003906, 0.0012664794921875, 0.0029892921447753906, 0.004712104797363281, 0.006434917449951172, 0.008157730102539062, 0.009880542755126953, 0.011603355407714844, 0.013326168060302734, 0.015048980712890625, 0.016771793365478516, 0.018494606018066406, 0.020217418670654297, 0.021940231323242188, 0.023663043975830078, 0.02538585662841797, 0.02710866928100586, 0.02883148193359375, 0.03055429458618164, 0.03227710723876953, 0.03399991989135742, 0.03572273254394531, 0.0374455451965332, 0.039168357849121094, 0.040891170501708984, 0.042613983154296875, 0.044336795806884766, 0.046059608459472656, 0.04778242111206055, 0.04950523376464844, 0.05122804641723633, 0.05295085906982422, 0.05467367172241211, 0.056396484375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 6.0, 8.0, 10.0, 8.0, 17.0, 21.0, 19.0, 38.0, 64.0, 85.0, 168.0, 361.0, 1660.0, 849.0, 295.0, 138.0, 96.0, 56.0, 43.0, 32.0, 26.0, 20.0, 18.0, 9.0, 12.0, 5.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034942626953125, -0.03368806838989258, -0.032433509826660156, -0.031178951263427734, -0.029924392700195312, -0.02866983413696289, -0.02741527557373047, -0.026160717010498047, -0.024906158447265625, -0.023651599884033203, -0.02239704132080078, -0.02114248275756836, -0.019887924194335938, -0.018633365631103516, -0.017378807067871094, -0.016124248504638672, -0.01486968994140625, -0.013615131378173828, -0.012360572814941406, -0.011106014251708984, -0.009851455688476562, -0.00859689712524414, -0.007342338562011719, -0.006087779998779297, -0.004833221435546875, -0.003578662872314453, -0.0023241043090820312, -0.0010695457458496094, 0.0001850128173828125, 0.0014395713806152344, 0.0026941299438476562, 0.003948688507080078, 0.0052032470703125, 0.006457805633544922, 0.007712364196777344, 0.008966922760009766, 0.010221481323242188, 0.01147603988647461, 0.012730598449707031, 0.013985157012939453, 0.015239715576171875, 0.016494274139404297, 0.01774883270263672, 0.01900339126586914, 0.020257949829101562, 0.021512508392333984, 0.022767066955566406, 0.024021625518798828, 0.02527618408203125, 0.026530742645263672, 0.027785301208496094, 0.029039859771728516, 0.030294418334960938, 0.03154897689819336, 0.03280353546142578, 0.0340580940246582, 0.035312652587890625, 0.03656721115112305, 0.03782176971435547, 0.03907632827758789, 0.04033088684082031, 0.041585445404052734, 0.042840003967285156, 0.04409456253051758, 0.04534912109375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 11.0, 20.0, 37.0, 67.0, 115.0, 168.0, 169.0, 165.0, 110.0, 62.0, 34.0, 24.0, 14.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17778435349464417, -0.16735491156578064, -0.15692545473575592, -0.1464960128068924, -0.13606657087802887, -0.12563711404800415, -0.11520767211914062, -0.1047782301902771, -0.09434878081083298, -0.08391933143138885, -0.07348988950252533, -0.06306044012308121, -0.05263099446892738, -0.04220154881477356, -0.03177209943532944, -0.021342657506465912, -0.01091320812702179, -0.0004837615415453911, 0.009945685043931007, 0.02037513256072998, 0.030804578214883804, 0.04123402386903763, 0.05166347324848175, 0.062092915177345276, 0.0725223645567894, 0.08295181393623352, 0.09338125586509705, 0.10381070524454117, 0.11424015462398529, 0.12466959655284882, 0.13509905338287354, 0.14552849531173706, 0.15595793724060059, 0.1663873791694641, 0.17681683599948883, 0.18724627792835236, 0.19767571985721588, 0.2081051766872406, 0.21853461861610413, 0.22896406054496765, 0.23939350247383118, 0.2498229444026947, 0.2602523863315582, 0.27068185806274414, 0.28111129999160767, 0.2915407419204712, 0.3019701838493347, 0.31239962577819824, 0.32282906770706177, 0.3332585096359253, 0.3436879515647888, 0.35411739349365234, 0.36454686522483826, 0.3749763071537018, 0.3854057490825653, 0.39583519101142883, 0.40626466274261475, 0.41669410467147827, 0.4271235466003418, 0.4375529885292053, 0.44798246026039124, 0.45841190218925476, 0.4688413441181183, 0.4792707860469818, 0.48970022797584534]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 5.0, 5.0, 2.0, 10.0, 10.0, 7.0, 15.0, 11.0, 16.0, 14.0, 20.0, 20.0, 27.0, 27.0, 18.0, 39.0, 39.0, 27.0, 35.0, 29.0, 45.0, 25.0, 48.0, 48.0, 35.0, 47.0, 40.0, 35.0, 30.0, 37.0, 29.0, 32.0, 28.0, 14.0, 14.0, 18.0, 17.0, 10.0, 21.0, 11.0, 10.0, 8.0, 10.0, 3.0, 4.0, 3.0, 1.0, 1.0, 5.0, 2.0], "bins": [-0.1448119878768921, -0.14098496735095978, -0.13715794682502747, -0.13333092629909515, -0.12950390577316284, -0.12567687034606934, -0.12184984982013702, -0.11802282929420471, -0.1141958087682724, -0.11036878824234009, -0.10654176771640778, -0.10271473973989487, -0.09888771921396255, -0.09506069868803024, -0.09123367071151733, -0.08740665018558502, -0.08357962965965271, -0.0797526091337204, -0.07592558860778809, -0.07209856063127518, -0.06827154010534286, -0.06444451957941055, -0.06061749532818794, -0.05679047107696533, -0.05296345055103302, -0.04913643002510071, -0.0453094057738781, -0.04148238152265549, -0.037655360996723175, -0.03382834047079086, -0.030001316219568253, -0.02617429383099079, -0.02234727144241333, -0.01852024905383587, -0.014693226665258408, -0.010866204276680946, -0.007039181888103485, -0.003212159499526024, 0.0006148628890514374, 0.004441885277628899, 0.00826890766620636, 0.012095930054783821, 0.015922952443361282, 0.019749974831938744, 0.023576997220516205, 0.027404019609093666, 0.031231041997671127, 0.03505806624889374, 0.03888508677482605, 0.04271210730075836, 0.04653913155198097, 0.05036615580320358, 0.054193176329135895, 0.05802019685506821, 0.06184722110629082, 0.06567424535751343, 0.06950126588344574, 0.07332828640937805, 0.07715530693531036, 0.08098233491182327, 0.08480935543775558, 0.0886363759636879, 0.0924634039402008, 0.09629042446613312, 0.10011744499206543]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 8.0, 3.0, 5.0, 4.0, 9.0, 9.0, 18.0, 31.0, 47.0, 57.0, 72.0, 113.0, 145.0, 256.0, 374.0, 525.0, 851.0, 1359.0, 2296.0, 3776.0, 6470.0, 11826.0, 22424.0, 44515.0, 93869.0, 208800.0, 322422.0, 170001.0, 77334.0, 37447.0, 18991.0, 10211.0, 5571.0, 3276.0, 1976.0, 1232.0, 813.0, 482.0, 326.0, 207.0, 134.0, 84.0, 58.0, 42.0, 27.0, 24.0, 16.0, 8.0, 10.0, 2.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.056488037109375, -0.0545649528503418, -0.052641868591308594, -0.05071878433227539, -0.04879570007324219, -0.046872615814208984, -0.04494953155517578, -0.04302644729614258, -0.041103363037109375, -0.03918027877807617, -0.03725719451904297, -0.035334110260009766, -0.03341102600097656, -0.03148794174194336, -0.029564857482910156, -0.027641773223876953, -0.02571868896484375, -0.023795604705810547, -0.021872520446777344, -0.01994943618774414, -0.018026351928710938, -0.016103267669677734, -0.014180183410644531, -0.012257099151611328, -0.010334014892578125, -0.008410930633544922, -0.006487846374511719, -0.004564762115478516, -0.0026416778564453125, -0.0007185935974121094, 0.0012044906616210938, 0.003127574920654297, 0.0050506591796875, 0.006973743438720703, 0.008896827697753906, 0.01081991195678711, 0.012742996215820312, 0.014666080474853516, 0.01658916473388672, 0.018512248992919922, 0.020435333251953125, 0.022358417510986328, 0.02428150177001953, 0.026204586029052734, 0.028127670288085938, 0.03005075454711914, 0.031973838806152344, 0.03389692306518555, 0.03582000732421875, 0.03774309158325195, 0.039666175842285156, 0.04158926010131836, 0.04351234436035156, 0.045435428619384766, 0.04735851287841797, 0.04928159713745117, 0.051204681396484375, 0.05312776565551758, 0.05505084991455078, 0.056973934173583984, 0.05889701843261719, 0.06082010269165039, 0.0627431869506836, 0.0646662712097168, 0.06658935546875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 6.0, 5.0, 7.0, 2.0, 5.0, 8.0, 11.0, 5.0, 11.0, 26.0, 34.0, 37.0, 47.0, 41.0, 57.0, 55.0, 55.0, 58.0, 56.0, 62.0, 73.0, 83.0, 40.0, 31.0, 39.0, 33.0, 29.0, 18.0, 20.0, 12.0, 15.0, 6.0, 5.0, 7.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01824951171875, -0.01758432388305664, -0.01691913604736328, -0.016253948211669922, -0.015588760375976562, -0.014923572540283203, -0.014258384704589844, -0.013593196868896484, -0.012928009033203125, -0.012262821197509766, -0.011597633361816406, -0.010932445526123047, -0.010267257690429688, -0.009602069854736328, -0.008936882019042969, -0.00827169418334961, -0.00760650634765625, -0.006941318511962891, -0.006276130676269531, -0.005610942840576172, -0.0049457550048828125, -0.004280567169189453, -0.0036153793334960938, -0.0029501914978027344, -0.002285003662109375, -0.0016198158264160156, -0.0009546279907226562, -0.0002894401550292969, 0.0003757476806640625, 0.0010409355163574219, 0.0017061233520507812, 0.0023713111877441406, 0.0030364990234375, 0.0037016868591308594, 0.004366874694824219, 0.005032062530517578, 0.0056972503662109375, 0.006362438201904297, 0.007027626037597656, 0.007692813873291016, 0.008358001708984375, 0.009023189544677734, 0.009688377380371094, 0.010353565216064453, 0.011018753051757812, 0.011683940887451172, 0.012349128723144531, 0.01301431655883789, 0.01367950439453125, 0.01434469223022461, 0.015009880065917969, 0.015675067901611328, 0.016340255737304688, 0.017005443572998047, 0.017670631408691406, 0.018335819244384766, 0.019001007080078125, 0.019666194915771484, 0.020331382751464844, 0.020996570587158203, 0.021661758422851562, 0.022326946258544922, 0.02299213409423828, 0.02365732192993164, 0.024322509765625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 9.0, 5.0, 8.0, 7.0, 7.0, 23.0, 35.0, 42.0, 69.0, 89.0, 124.0, 159.0, 243.0, 421.0, 550.0, 1054.0, 2137.0, 5378.0, 13835.0, 41200.0, 130828.0, 391507.0, 313058.0, 97694.0, 31067.0, 10612.0, 4074.0, 1843.0, 953.0, 494.0, 312.0, 229.0, 139.0, 94.0, 58.0, 58.0, 38.0, 25.0, 23.0, 20.0, 16.0, 8.0, 4.0, 4.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0694580078125, -0.06713294982910156, -0.06480789184570312, -0.06248283386230469, -0.06015777587890625, -0.05783271789550781, -0.055507659912109375, -0.05318260192871094, -0.0508575439453125, -0.04853248596191406, -0.046207427978515625, -0.04388236999511719, -0.04155731201171875, -0.03923225402832031, -0.036907196044921875, -0.03458213806152344, -0.032257080078125, -0.029932022094726562, -0.027606964111328125, -0.025281906127929688, -0.02295684814453125, -0.020631790161132812, -0.018306732177734375, -0.015981674194335938, -0.0136566162109375, -0.011331558227539062, -0.009006500244140625, -0.0066814422607421875, -0.00435638427734375, -0.0020313262939453125, 0.000293731689453125, 0.0026187896728515625, 0.00494384765625, 0.0072689056396484375, 0.009593963623046875, 0.011919021606445312, 0.01424407958984375, 0.016569137573242188, 0.018894195556640625, 0.021219253540039062, 0.0235443115234375, 0.025869369506835938, 0.028194427490234375, 0.030519485473632812, 0.03284454345703125, 0.03516960144042969, 0.037494659423828125, 0.03981971740722656, 0.042144775390625, 0.04446983337402344, 0.046794891357421875, 0.04911994934082031, 0.05144500732421875, 0.05377006530761719, 0.056095123291015625, 0.05842018127441406, 0.0607452392578125, 0.06307029724121094, 0.06539535522460938, 0.06772041320800781, 0.07004547119140625, 0.07237052917480469, 0.07469558715820312, 0.07702064514160156, 0.079345703125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 5.0, 4.0, 3.0, 5.0, 9.0, 7.0, 13.0, 9.0, 16.0, 13.0, 16.0, 20.0, 27.0, 21.0, 32.0, 33.0, 32.0, 40.0, 32.0, 50.0, 38.0, 42.0, 40.0, 64.0, 26.0, 23.0, 34.0, 29.0, 42.0, 35.0, 31.0, 34.0, 25.0, 24.0, 24.0, 25.0, 18.0, 16.0, 9.0, 5.0, 7.0, 8.0, 5.0, 4.0, 5.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.06695556640625, -0.06477832794189453, -0.06260108947753906, -0.060423851013183594, -0.058246612548828125, -0.056069374084472656, -0.05389213562011719, -0.05171489715576172, -0.04953765869140625, -0.04736042022705078, -0.04518318176269531, -0.043005943298339844, -0.040828704833984375, -0.038651466369628906, -0.03647422790527344, -0.03429698944091797, -0.0321197509765625, -0.02994251251220703, -0.027765274047851562, -0.025588035583496094, -0.023410797119140625, -0.021233558654785156, -0.019056320190429688, -0.01687908172607422, -0.01470184326171875, -0.012524604797363281, -0.010347366333007812, -0.008170127868652344, -0.005992889404296875, -0.0038156509399414062, -0.0016384124755859375, 0.0005388259887695312, 0.002716064453125, 0.004893302917480469, 0.0070705413818359375, 0.009247779846191406, 0.011425018310546875, 0.013602256774902344, 0.015779495239257812, 0.01795673370361328, 0.02013397216796875, 0.02231121063232422, 0.024488449096679688, 0.026665687561035156, 0.028842926025390625, 0.031020164489746094, 0.03319740295410156, 0.03537464141845703, 0.0375518798828125, 0.03972911834716797, 0.04190635681152344, 0.044083595275878906, 0.046260833740234375, 0.048438072204589844, 0.05061531066894531, 0.05279254913330078, 0.05496978759765625, 0.05714702606201172, 0.05932426452636719, 0.061501502990722656, 0.06367874145507812, 0.0658559799194336, 0.06803321838378906, 0.07021045684814453, 0.0723876953125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 8.0, 12.0, 15.0, 21.0, 41.0, 52.0, 81.0, 135.0, 227.0, 387.0, 697.0, 1286.0, 2446.0, 5103.0, 11898.0, 30100.0, 87626.0, 286990.0, 408766.0, 137465.0, 44516.0, 16661.0, 7025.0, 3212.0, 1630.0, 874.0, 500.0, 289.0, 168.0, 106.0, 59.0, 53.0, 39.0, 17.0, 9.0, 9.0, 6.0, 10.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03887939453125, -0.03763294219970703, -0.03638648986816406, -0.035140037536621094, -0.033893585205078125, -0.032647132873535156, -0.03140068054199219, -0.03015422821044922, -0.02890777587890625, -0.02766132354736328, -0.026414871215820312, -0.025168418884277344, -0.023921966552734375, -0.022675514221191406, -0.021429061889648438, -0.02018260955810547, -0.0189361572265625, -0.01768970489501953, -0.016443252563476562, -0.015196800231933594, -0.013950347900390625, -0.012703895568847656, -0.011457443237304688, -0.010210990905761719, -0.00896453857421875, -0.007718086242675781, -0.0064716339111328125, -0.005225181579589844, -0.003978729248046875, -0.0027322769165039062, -0.0014858245849609375, -0.00023937225341796875, 0.001007080078125, 0.0022535324096679688, 0.0034999847412109375, 0.004746437072753906, 0.005992889404296875, 0.007239341735839844, 0.008485794067382812, 0.009732246398925781, 0.01097869873046875, 0.012225151062011719, 0.013471603393554688, 0.014718055725097656, 0.015964508056640625, 0.017210960388183594, 0.018457412719726562, 0.01970386505126953, 0.0209503173828125, 0.02219676971435547, 0.023443222045898438, 0.024689674377441406, 0.025936126708984375, 0.027182579040527344, 0.028429031372070312, 0.02967548370361328, 0.03092193603515625, 0.03216838836669922, 0.03341484069824219, 0.034661293029785156, 0.035907745361328125, 0.037154197692871094, 0.03840065002441406, 0.03964710235595703, 0.0408935546875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 6.0, 12.0, 12.0, 15.0, 24.0, 20.0, 46.0, 68.0, 67.0, 84.0, 96.0, 106.0, 91.0, 86.0, 65.0, 57.0, 36.0, 29.0, 26.0, 22.0, 5.0, 11.0, 1.0, 5.0, 8.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5822391510009766e-05, -3.46088781952858e-05, -3.339536488056183e-05, -3.218185156583786e-05, -3.096833825111389e-05, -2.9754824936389923e-05, -2.8541311621665955e-05, -2.7327798306941986e-05, -2.6114284992218018e-05, -2.490077167749405e-05, -2.368725836277008e-05, -2.2473745048046112e-05, -2.1260231733322144e-05, -2.0046718418598175e-05, -1.8833205103874207e-05, -1.7619691789150238e-05, -1.640617847442627e-05, -1.5192665159702301e-05, -1.3979151844978333e-05, -1.2765638530254364e-05, -1.1552125215530396e-05, -1.0338611900806427e-05, -9.125098586082458e-06, -7.91158527135849e-06, -6.6980719566345215e-06, -5.484558641910553e-06, -4.2710453271865845e-06, -3.057532012462616e-06, -1.8440186977386475e-06, -6.30505383014679e-07, 5.830079317092896e-07, 1.796521246433258e-06, 3.0100345611572266e-06, 4.223547875881195e-06, 5.4370611906051636e-06, 6.650574505329132e-06, 7.8640878200531e-06, 9.077601134777069e-06, 1.0291114449501038e-05, 1.1504627764225006e-05, 1.2718141078948975e-05, 1.3931654393672943e-05, 1.5145167708396912e-05, 1.635868102312088e-05, 1.757219433784485e-05, 1.8785707652568817e-05, 1.9999220967292786e-05, 2.1212734282016754e-05, 2.2426247596740723e-05, 2.363976091146469e-05, 2.485327422618866e-05, 2.6066787540912628e-05, 2.7280300855636597e-05, 2.8493814170360565e-05, 2.9707327485084534e-05, 3.09208407998085e-05, 3.213435411453247e-05, 3.334786742925644e-05, 3.456138074398041e-05, 3.5774894058704376e-05, 3.6988407373428345e-05, 3.820192068815231e-05, 3.941543400287628e-05, 4.062894731760025e-05, 4.184246063232422e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 4.0, 6.0, 10.0, 11.0, 18.0, 20.0, 37.0, 51.0, 77.0, 114.0, 160.0, 308.0, 547.0, 995.0, 2022.0, 4057.0, 8856.0, 21707.0, 63537.0, 225624.0, 474423.0, 164985.0, 48794.0, 17735.0, 7199.0, 3478.0, 1708.0, 819.0, 489.0, 279.0, 158.0, 106.0, 73.0, 35.0, 31.0, 21.0, 18.0, 20.0, 3.0, 7.0, 4.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.041229248046875, -0.03991556167602539, -0.03860187530517578, -0.03728818893432617, -0.03597450256347656, -0.03466081619262695, -0.033347129821777344, -0.032033443450927734, -0.030719757080078125, -0.029406070709228516, -0.028092384338378906, -0.026778697967529297, -0.025465011596679688, -0.024151325225830078, -0.02283763885498047, -0.02152395248413086, -0.02021026611328125, -0.01889657974243164, -0.01758289337158203, -0.016269207000732422, -0.014955520629882812, -0.013641834259033203, -0.012328147888183594, -0.011014461517333984, -0.009700775146484375, -0.008387088775634766, -0.007073402404785156, -0.005759716033935547, -0.0044460296630859375, -0.003132343292236328, -0.0018186569213867188, -0.0005049705505371094, 0.0008087158203125, 0.0021224021911621094, 0.0034360885620117188, 0.004749774932861328, 0.0060634613037109375, 0.007377147674560547, 0.008690834045410156, 0.010004520416259766, 0.011318206787109375, 0.012631893157958984, 0.013945579528808594, 0.015259265899658203, 0.016572952270507812, 0.017886638641357422, 0.01920032501220703, 0.02051401138305664, 0.02182769775390625, 0.02314138412475586, 0.02445507049560547, 0.025768756866455078, 0.027082443237304688, 0.028396129608154297, 0.029709815979003906, 0.031023502349853516, 0.032337188720703125, 0.033650875091552734, 0.034964561462402344, 0.03627824783325195, 0.03759193420410156, 0.03890562057495117, 0.04021930694580078, 0.04153299331665039, 0.0428466796875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 8.0, 13.0, 15.0, 21.0, 21.0, 21.0, 36.0, 36.0, 65.0, 72.0, 69.0, 103.0, 78.0, 75.0, 60.0, 52.0, 36.0, 52.0, 30.0, 24.0, 28.0, 13.0, 14.0, 7.0, 14.0, 9.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0297698974609375, -0.02870965003967285, -0.027649402618408203, -0.026589155197143555, -0.025528907775878906, -0.024468660354614258, -0.02340841293334961, -0.02234816551208496, -0.021287918090820312, -0.020227670669555664, -0.019167423248291016, -0.018107175827026367, -0.01704692840576172, -0.01598668098449707, -0.014926433563232422, -0.013866186141967773, -0.012805938720703125, -0.011745691299438477, -0.010685443878173828, -0.00962519645690918, -0.008564949035644531, -0.007504701614379883, -0.006444454193115234, -0.005384206771850586, -0.0043239593505859375, -0.003263711929321289, -0.0022034645080566406, -0.0011432170867919922, -8.296966552734375e-05, 0.0009772777557373047, 0.002037525177001953, 0.0030977725982666016, 0.00415802001953125, 0.0052182674407958984, 0.006278514862060547, 0.007338762283325195, 0.008399009704589844, 0.009459257125854492, 0.01051950454711914, 0.011579751968383789, 0.012639999389648438, 0.013700246810913086, 0.014760494232177734, 0.015820741653442383, 0.01688098907470703, 0.01794123649597168, 0.019001483917236328, 0.020061731338500977, 0.021121978759765625, 0.022182226181030273, 0.023242473602294922, 0.02430272102355957, 0.02536296844482422, 0.026423215866088867, 0.027483463287353516, 0.028543710708618164, 0.029603958129882812, 0.03066420555114746, 0.03172445297241211, 0.03278470039367676, 0.033844947814941406, 0.034905195236206055, 0.0359654426574707, 0.03702569007873535, 0.0380859375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 8.0, 12.0, 20.0, 48.0, 64.0, 115.0, 168.0, 183.0, 153.0, 113.0, 67.0, 34.0, 13.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8925408124923706, -0.8664276003837585, -0.8403143882751465, -0.8142011165618896, -0.7880879044532776, -0.7619746923446655, -0.7358614802360535, -0.7097482681274414, -0.6836349964141846, -0.6575217843055725, -0.6314085721969604, -0.6052953004837036, -0.5791820883750916, -0.5530688762664795, -0.5269556641578674, -0.5008424520492554, -0.4747292101383209, -0.44861599802970886, -0.4225027561187744, -0.39638954401016235, -0.3702763020992279, -0.34416308999061584, -0.3180498480796814, -0.29193663597106934, -0.2658234238624573, -0.23971019685268402, -0.21359696984291077, -0.1874837577342987, -0.16137051582336426, -0.1352573037147522, -0.10914407670497894, -0.08303084969520569, -0.05691760778427124, -0.030804382637143135, -0.00469115749001503, 0.021422065794467926, 0.04753529280424118, 0.07364851236343384, 0.09976173937320709, 0.12587496638298035, 0.1519881933927536, 0.17810142040252686, 0.2042146474123001, 0.23032787442207336, 0.2564410865306854, 0.2825543284416199, 0.30866754055023193, 0.334780752658844, 0.36089399456977844, 0.3870072066783905, 0.41312044858932495, 0.439233660697937, 0.46534690260887146, 0.4914601147174835, 0.517573356628418, 0.54368656873703, 0.5697997808456421, 0.5959129929542542, 0.6220262050628662, 0.648139476776123, 0.6742526888847351, 0.7003659009933472, 0.7264791131019592, 0.7525923252105713, 0.7787055969238281]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 9.0, 10.0, 6.0, 11.0, 9.0, 8.0, 21.0, 24.0, 20.0, 35.0, 33.0, 34.0, 53.0, 31.0, 45.0, 41.0, 48.0, 47.0, 57.0, 36.0, 51.0, 43.0, 56.0, 39.0, 46.0, 32.0, 21.0, 17.0, 24.0, 11.0, 14.0, 9.0, 9.0, 11.0, 11.0, 13.0, 3.0, 3.0, 2.0, 1.0, 1.0, 6.0, 4.0, 1.0], "bins": [-0.551406741142273, -0.5369205474853516, -0.5224342942237854, -0.507948100566864, -0.49346187710762024, -0.47897568345069885, -0.4644894599914551, -0.4500032663345337, -0.4355170428752899, -0.42103081941604614, -0.40654462575912476, -0.392058402299881, -0.3775721788406372, -0.3630859851837158, -0.34859976172447205, -0.33411353826522827, -0.3196273446083069, -0.3051411211490631, -0.2906549274921417, -0.27616870403289795, -0.2616824805736542, -0.2471962869167328, -0.232710063457489, -0.21822385489940643, -0.20373761653900146, -0.18925140798091888, -0.1747651845216751, -0.16027897596359253, -0.14579276740550995, -0.13130655884742737, -0.1168203353881836, -0.10233412683010101, -0.08784791827201843, -0.07336170226335526, -0.058875493705272675, -0.0443892776966095, -0.029903065413236618, -0.015416853129863739, -0.0009306371212005615, 0.013555571436882019, 0.028041787445545197, 0.042527999728918076, 0.057014212012290955, 0.07150042802095413, 0.08598664402961731, 0.10047285258769989, 0.11495906859636307, 0.12944528460502625, 0.14393149316310883, 0.1584177017211914, 0.17290392518043518, 0.18739013373851776, 0.20187634229660034, 0.21636256575584412, 0.2308487743139267, 0.24533498287200928, 0.25982120633125305, 0.2743074297904968, 0.2887936234474182, 0.303279846906662, 0.31776607036590576, 0.33225226402282715, 0.3467384874820709, 0.3612247109413147, 0.3757109045982361]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 6.0, 13.0, 15.0, 17.0, 27.0, 39.0, 50.0, 92.0, 150.0, 213.0, 375.0, 679.0, 1127.0, 2288.0, 4617.0, 10707.0, 29043.0, 108291.0, 2983123.0, 928258.0, 82833.0, 24093.0, 9256.0, 4139.0, 1983.0, 1134.0, 614.0, 397.0, 214.0, 154.0, 105.0, 76.0, 45.0, 40.0, 19.0, 17.0, 9.0, 8.0, 5.0, 2.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0782470703125, -0.07544422149658203, -0.07264137268066406, -0.0698385238647461, -0.06703567504882812, -0.06423282623291016, -0.06142997741699219, -0.05862712860107422, -0.05582427978515625, -0.05302143096923828, -0.05021858215332031, -0.047415733337402344, -0.044612884521484375, -0.041810035705566406, -0.03900718688964844, -0.03620433807373047, -0.0334014892578125, -0.03059864044189453, -0.027795791625976562, -0.024992942810058594, -0.022190093994140625, -0.019387245178222656, -0.016584396362304688, -0.013781547546386719, -0.01097869873046875, -0.008175849914550781, -0.0053730010986328125, -0.0025701522827148438, 0.000232696533203125, 0.0030355453491210938, 0.0058383941650390625, 0.008641242980957031, 0.011444091796875, 0.014246940612792969, 0.017049789428710938, 0.019852638244628906, 0.022655487060546875, 0.025458335876464844, 0.028261184692382812, 0.03106403350830078, 0.03386688232421875, 0.03666973114013672, 0.03947257995605469, 0.042275428771972656, 0.045078277587890625, 0.047881126403808594, 0.05068397521972656, 0.05348682403564453, 0.0562896728515625, 0.05909252166748047, 0.06189537048339844, 0.0646982192993164, 0.06750106811523438, 0.07030391693115234, 0.07310676574707031, 0.07590961456298828, 0.07871246337890625, 0.08151531219482422, 0.08431816101074219, 0.08712100982666016, 0.08992385864257812, 0.0927267074584961, 0.09552955627441406, 0.09833240509033203, 0.10113525390625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 4.0, 6.0, 5.0, 3.0, 4.0, 4.0, 7.0, 8.0, 13.0, 16.0, 25.0, 47.0, 43.0, 47.0, 63.0, 66.0, 49.0, 67.0, 77.0, 68.0, 65.0, 65.0, 64.0, 41.0, 25.0, 25.0, 21.0, 20.0, 17.0, 14.0, 8.0, 6.0, 3.0, 4.0, 6.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01751708984375, -0.016731739044189453, -0.015946388244628906, -0.01516103744506836, -0.014375686645507812, -0.013590335845947266, -0.012804985046386719, -0.012019634246826172, -0.011234283447265625, -0.010448932647705078, -0.009663581848144531, -0.008878231048583984, -0.008092880249023438, -0.007307529449462891, -0.006522178649902344, -0.005736827850341797, -0.00495147705078125, -0.004166126251220703, -0.0033807754516601562, -0.0025954246520996094, -0.0018100738525390625, -0.0010247230529785156, -0.00023937225341796875, 0.0005459785461425781, 0.001331329345703125, 0.002116680145263672, 0.0029020309448242188, 0.0036873817443847656, 0.0044727325439453125, 0.005258083343505859, 0.006043434143066406, 0.006828784942626953, 0.0076141357421875, 0.008399486541748047, 0.009184837341308594, 0.00997018814086914, 0.010755538940429688, 0.011540889739990234, 0.012326240539550781, 0.013111591339111328, 0.013896942138671875, 0.014682292938232422, 0.015467643737792969, 0.016252994537353516, 0.017038345336914062, 0.01782369613647461, 0.018609046936035156, 0.019394397735595703, 0.02017974853515625, 0.020965099334716797, 0.021750450134277344, 0.02253580093383789, 0.023321151733398438, 0.024106502532958984, 0.02489185333251953, 0.025677204132080078, 0.026462554931640625, 0.027247905731201172, 0.02803325653076172, 0.028818607330322266, 0.029603958129882812, 0.03038930892944336, 0.031174659729003906, 0.03196001052856445, 0.032745361328125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 9.0, 14.0, 20.0, 30.0, 41.0, 73.0, 118.0, 178.0, 305.0, 471.0, 970.0, 1748.0, 3324.0, 6416.0, 14026.0, 32387.0, 88407.0, 356761.0, 3100699.0, 425053.0, 98352.0, 35132.0, 15211.0, 6930.0, 3565.0, 1788.0, 919.0, 547.0, 313.0, 178.0, 100.0, 69.0, 42.0, 30.0, 18.0, 14.0, 10.0, 9.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.07757568359375, -0.0753931999206543, -0.0732107162475586, -0.07102823257446289, -0.06884574890136719, -0.06666326522827148, -0.06448078155517578, -0.06229829788208008, -0.060115814208984375, -0.05793333053588867, -0.05575084686279297, -0.053568363189697266, -0.05138587951660156, -0.04920339584350586, -0.047020912170410156, -0.04483842849731445, -0.04265594482421875, -0.04047346115112305, -0.038290977478027344, -0.03610849380493164, -0.03392601013183594, -0.031743526458740234, -0.02956104278564453, -0.027378559112548828, -0.025196075439453125, -0.023013591766357422, -0.02083110809326172, -0.018648624420166016, -0.016466140747070312, -0.01428365707397461, -0.012101173400878906, -0.009918689727783203, -0.0077362060546875, -0.005553722381591797, -0.0033712387084960938, -0.0011887550354003906, 0.0009937286376953125, 0.0031762123107910156, 0.005358695983886719, 0.007541179656982422, 0.009723663330078125, 0.011906147003173828, 0.014088630676269531, 0.016271114349365234, 0.018453598022460938, 0.02063608169555664, 0.022818565368652344, 0.025001049041748047, 0.02718353271484375, 0.029366016387939453, 0.031548500061035156, 0.03373098373413086, 0.03591346740722656, 0.038095951080322266, 0.04027843475341797, 0.04246091842651367, 0.044643402099609375, 0.04682588577270508, 0.04900836944580078, 0.051190853118896484, 0.05337333679199219, 0.05555582046508789, 0.057738304138183594, 0.0599207878112793, 0.062103271484375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 4.0, 8.0, 13.0, 14.0, 15.0, 23.0, 29.0, 43.0, 57.0, 84.0, 109.0, 209.0, 469.0, 1376.0, 793.0, 291.0, 170.0, 102.0, 72.0, 49.0, 33.0, 26.0, 19.0, 14.0, 17.0, 11.0, 9.0, 7.0, 4.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036590576171875, -0.035320281982421875, -0.03404998779296875, -0.032779693603515625, -0.0315093994140625, -0.030239105224609375, -0.02896881103515625, -0.027698516845703125, -0.02642822265625, -0.025157928466796875, -0.02388763427734375, -0.022617340087890625, -0.0213470458984375, -0.020076751708984375, -0.01880645751953125, -0.017536163330078125, -0.016265869140625, -0.014995574951171875, -0.01372528076171875, -0.012454986572265625, -0.0111846923828125, -0.009914398193359375, -0.00864410400390625, -0.007373809814453125, -0.006103515625, -0.004833221435546875, -0.00356292724609375, -0.002292633056640625, -0.0010223388671875, 0.000247955322265625, 0.00151824951171875, 0.002788543701171875, 0.004058837890625, 0.005329132080078125, 0.00659942626953125, 0.007869720458984375, 0.0091400146484375, 0.010410308837890625, 0.01168060302734375, 0.012950897216796875, 0.01422119140625, 0.015491485595703125, 0.01676177978515625, 0.018032073974609375, 0.0193023681640625, 0.020572662353515625, 0.02184295654296875, 0.023113250732421875, 0.024383544921875, 0.025653839111328125, 0.02692413330078125, 0.028194427490234375, 0.0294647216796875, 0.030735015869140625, 0.03200531005859375, 0.033275604248046875, 0.0345458984375, 0.035816192626953125, 0.03708648681640625, 0.038356781005859375, 0.0396270751953125, 0.040897369384765625, 0.04216766357421875, 0.043437957763671875, 0.044708251953125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 8.0, 11.0, 12.0, 31.0, 38.0, 104.0, 127.0, 167.0, 177.0, 128.0, 101.0, 53.0, 29.0, 11.0, 7.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3000304102897644, -0.28862038254737854, -0.2772103548049927, -0.2658003270626068, -0.25439029932022095, -0.24298027157783508, -0.23157022893428802, -0.22016020119190216, -0.2087501734495163, -0.19734014570713043, -0.18593011796474457, -0.1745200753211975, -0.16311004757881165, -0.15170001983642578, -0.14028999209403992, -0.12887996435165405, -0.11746993660926819, -0.10605990886688232, -0.09464988112449646, -0.08323984593153, -0.07182981818914413, -0.06041979044675827, -0.04900975525379181, -0.037599727511405945, -0.02618969976902008, -0.014779670163989067, -0.0033696405589580536, 0.008040390908718109, 0.019450418651103973, 0.030860446393489838, 0.0422704815864563, 0.05368050932884216, 0.06509053707122803, 0.07650056481361389, 0.08791059255599976, 0.09932062774896622, 0.11073065549135208, 0.12214068323373795, 0.1335507184267044, 0.14496074616909027, 0.15637077391147614, 0.167780801653862, 0.17919082939624786, 0.19060087203979492, 0.2020108997821808, 0.21342092752456665, 0.22483095526695251, 0.23624098300933838, 0.24765101075172424, 0.2590610384941101, 0.27047106623649597, 0.28188109397888184, 0.2932911217212677, 0.30470114946365356, 0.3161112070083618, 0.3275212049484253, 0.33893126249313354, 0.3503412902355194, 0.3617513179779053, 0.37316134572029114, 0.384571373462677, 0.39598140120506287, 0.40739142894744873, 0.418801486492157, 0.43021148443222046]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 6.0, 5.0, 4.0, 5.0, 5.0, 8.0, 4.0, 8.0, 17.0, 18.0, 10.0, 21.0, 21.0, 26.0, 23.0, 34.0, 41.0, 33.0, 37.0, 46.0, 46.0, 45.0, 48.0, 36.0, 30.0, 48.0, 38.0, 37.0, 35.0, 33.0, 21.0, 28.0, 21.0, 29.0, 18.0, 14.0, 13.0, 15.0, 23.0, 10.0, 15.0, 7.0, 9.0, 1.0, 1.0, 7.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.14985984563827515, -0.14571259915828705, -0.14156536757946014, -0.13741812109947205, -0.13327087461948395, -0.12912362813949585, -0.12497639656066895, -0.12082915008068085, -0.11668191105127335, -0.11253467202186584, -0.10838742554187775, -0.10424018651247025, -0.10009294748306274, -0.09594570100307465, -0.09179846197366714, -0.08765122294425964, -0.08350397646427155, -0.07935673743486404, -0.07520949095487595, -0.07106225192546844, -0.06691500544548035, -0.06276776641607285, -0.058620527386665344, -0.054473284631967545, -0.050326041877269745, -0.046178799122571945, -0.042031556367874146, -0.037884317338466644, -0.033737074583768845, -0.029589831829071045, -0.025442590937018394, -0.021295350044965744, -0.017148107290267944, -0.01300086546689272, -0.008853623643517494, -0.004706381820142269, -0.0005591399967670441, 0.0035881027579307556, 0.007735343649983406, 0.011882584542036057, 0.016029827296733856, 0.020177070051431656, 0.024324310943484306, 0.028471551835536957, 0.032618794590234756, 0.036766037344932556, 0.04091327637434006, 0.04506051912903786, 0.04920776188373566, 0.053355004638433456, 0.057502247393131256, 0.06164948642253876, 0.06579673290252686, 0.06994397193193436, 0.07409121096134186, 0.07823845744132996, 0.08238569647073746, 0.08653293550014496, 0.09068018198013306, 0.09482742100954056, 0.09897466003894806, 0.10312190651893616, 0.10726914554834366, 0.11141638457775116, 0.11556363105773926]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 5.0, 11.0, 7.0, 11.0, 7.0, 16.0, 31.0, 64.0, 90.0, 133.0, 213.0, 350.0, 653.0, 1030.0, 2004.0, 3648.0, 7365.0, 15371.0, 36325.0, 100324.0, 486710.0, 275957.0, 67270.0, 26595.0, 11870.0, 5724.0, 2996.0, 1606.0, 869.0, 519.0, 275.0, 179.0, 111.0, 70.0, 57.0, 28.0, 22.0, 17.0, 14.0, 3.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.076416015625, -0.07376480102539062, -0.07111358642578125, -0.06846237182617188, -0.0658111572265625, -0.06315994262695312, -0.06050872802734375, -0.057857513427734375, -0.055206298828125, -0.052555084228515625, -0.04990386962890625, -0.047252655029296875, -0.0446014404296875, -0.041950225830078125, -0.03929901123046875, -0.036647796630859375, -0.03399658203125, -0.031345367431640625, -0.02869415283203125, -0.026042938232421875, -0.0233917236328125, -0.020740509033203125, -0.01808929443359375, -0.015438079833984375, -0.012786865234375, -0.010135650634765625, -0.00748443603515625, -0.004833221435546875, -0.0021820068359375, 0.000469207763671875, 0.00312042236328125, 0.005771636962890625, 0.0084228515625, 0.011074066162109375, 0.01372528076171875, 0.016376495361328125, 0.0190277099609375, 0.021678924560546875, 0.02433013916015625, 0.026981353759765625, 0.029632568359375, 0.032283782958984375, 0.03493499755859375, 0.037586212158203125, 0.0402374267578125, 0.042888641357421875, 0.04553985595703125, 0.048191070556640625, 0.05084228515625, 0.053493499755859375, 0.05614471435546875, 0.058795928955078125, 0.0614471435546875, 0.06409835815429688, 0.06674957275390625, 0.06940078735351562, 0.072052001953125, 0.07470321655273438, 0.07735443115234375, 0.08000564575195312, 0.0826568603515625, 0.08530807495117188, 0.08795928955078125, 0.09061050415039062, 0.09326171875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 0.0, 5.0, 8.0, 2.0, 3.0, 6.0, 2.0, 5.0, 13.0, 11.0, 21.0, 24.0, 22.0, 34.0, 32.0, 39.0, 40.0, 47.0, 43.0, 52.0, 71.0, 49.0, 53.0, 47.0, 51.0, 53.0, 40.0, 32.0, 32.0, 28.0, 28.0, 20.0, 18.0, 23.0, 7.0, 8.0, 11.0, 3.0, 3.0, 5.0, 2.0, 5.0, 5.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0175628662109375, -0.01695084571838379, -0.016338825225830078, -0.015726804733276367, -0.015114784240722656, -0.014502763748168945, -0.013890743255615234, -0.013278722763061523, -0.012666702270507812, -0.012054681777954102, -0.01144266128540039, -0.01083064079284668, -0.010218620300292969, -0.009606599807739258, -0.008994579315185547, -0.008382558822631836, -0.007770538330078125, -0.007158517837524414, -0.006546497344970703, -0.005934476852416992, -0.005322456359863281, -0.00471043586730957, -0.004098415374755859, -0.0034863948822021484, -0.0028743743896484375, -0.0022623538970947266, -0.0016503334045410156, -0.0010383129119873047, -0.00042629241943359375, 0.0001857280731201172, 0.0007977485656738281, 0.001409769058227539, 0.00202178955078125, 0.002633810043334961, 0.003245830535888672, 0.003857851028442383, 0.004469871520996094, 0.005081892013549805, 0.005693912506103516, 0.0063059329986572266, 0.0069179534912109375, 0.0075299739837646484, 0.00814199447631836, 0.00875401496887207, 0.009366035461425781, 0.009978055953979492, 0.010590076446533203, 0.011202096939086914, 0.011814117431640625, 0.012426137924194336, 0.013038158416748047, 0.013650178909301758, 0.014262199401855469, 0.01487421989440918, 0.01548624038696289, 0.0160982608795166, 0.016710281372070312, 0.017322301864624023, 0.017934322357177734, 0.018546342849731445, 0.019158363342285156, 0.019770383834838867, 0.020382404327392578, 0.02099442481994629, 0.0216064453125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 11.0, 9.0, 22.0, 29.0, 29.0, 32.0, 57.0, 96.0, 109.0, 197.0, 307.0, 487.0, 828.0, 1702.0, 4010.0, 11796.0, 42259.0, 194815.0, 638600.0, 110886.0, 27962.0, 8250.0, 2926.0, 1366.0, 665.0, 407.0, 213.0, 135.0, 100.0, 67.0, 43.0, 51.0, 26.0, 16.0, 9.0, 12.0, 9.0, 7.0, 2.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.08184814453125, -0.07885456085205078, -0.07586097717285156, -0.07286739349365234, -0.06987380981445312, -0.0668802261352539, -0.06388664245605469, -0.06089305877685547, -0.05789947509765625, -0.05490589141845703, -0.05191230773925781, -0.048918724060058594, -0.045925140380859375, -0.042931556701660156, -0.03993797302246094, -0.03694438934326172, -0.0339508056640625, -0.03095722198486328, -0.027963638305664062, -0.024970054626464844, -0.021976470947265625, -0.018982887268066406, -0.015989303588867188, -0.012995719909667969, -0.01000213623046875, -0.007008552551269531, -0.0040149688720703125, -0.0010213851928710938, 0.001972198486328125, 0.004965782165527344, 0.007959365844726562, 0.010952949523925781, 0.013946533203125, 0.01694011688232422, 0.019933700561523438, 0.022927284240722656, 0.025920867919921875, 0.028914451599121094, 0.03190803527832031, 0.03490161895751953, 0.03789520263671875, 0.04088878631591797, 0.04388236999511719, 0.046875953674316406, 0.049869537353515625, 0.052863121032714844, 0.05585670471191406, 0.05885028839111328, 0.0618438720703125, 0.06483745574951172, 0.06783103942871094, 0.07082462310791016, 0.07381820678710938, 0.0768117904663086, 0.07980537414550781, 0.08279895782470703, 0.08579254150390625, 0.08878612518310547, 0.09177970886230469, 0.0947732925415039, 0.09776687622070312, 0.10076045989990234, 0.10375404357910156, 0.10674762725830078, 0.1097412109375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 9.0, 9.0, 5.0, 6.0, 16.0, 15.0, 27.0, 14.0, 18.0, 23.0, 33.0, 27.0, 37.0, 40.0, 37.0, 51.0, 48.0, 58.0, 56.0, 51.0, 52.0, 51.0, 37.0, 35.0, 33.0, 31.0, 26.0, 24.0, 20.0, 18.0, 22.0, 14.0, 11.0, 6.0, 11.0, 9.0, 1.0, 3.0, 6.0, 4.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07958984375, -0.07706356048583984, -0.07453727722167969, -0.07201099395751953, -0.06948471069335938, -0.06695842742919922, -0.06443214416503906, -0.061905860900878906, -0.05937957763671875, -0.056853294372558594, -0.05432701110839844, -0.05180072784423828, -0.049274444580078125, -0.04674816131591797, -0.04422187805175781, -0.041695594787597656, -0.0391693115234375, -0.036643028259277344, -0.03411674499511719, -0.03159046173095703, -0.029064178466796875, -0.02653789520263672, -0.024011611938476562, -0.021485328674316406, -0.01895904541015625, -0.016432762145996094, -0.013906478881835938, -0.011380195617675781, -0.008853912353515625, -0.006327629089355469, -0.0038013458251953125, -0.0012750625610351562, 0.001251220703125, 0.0037775039672851562, 0.0063037872314453125, 0.008830070495605469, 0.011356353759765625, 0.013882637023925781, 0.016408920288085938, 0.018935203552246094, 0.02146148681640625, 0.023987770080566406, 0.026514053344726562, 0.02904033660888672, 0.031566619873046875, 0.03409290313720703, 0.03661918640136719, 0.039145469665527344, 0.0416717529296875, 0.044198036193847656, 0.04672431945800781, 0.04925060272216797, 0.051776885986328125, 0.05430316925048828, 0.05682945251464844, 0.059355735778808594, 0.06188201904296875, 0.0644083023071289, 0.06693458557128906, 0.06946086883544922, 0.07198715209960938, 0.07451343536376953, 0.07703971862792969, 0.07956600189208984, 0.08209228515625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 4.0, 4.0, 12.0, 11.0, 16.0, 15.0, 18.0, 36.0, 50.0, 58.0, 102.0, 166.0, 262.0, 416.0, 648.0, 1165.0, 2013.0, 3953.0, 8286.0, 19796.0, 56535.0, 376594.0, 472795.0, 65050.0, 21838.0, 9149.0, 4285.0, 2154.0, 1213.0, 695.0, 419.0, 245.0, 188.0, 113.0, 60.0, 53.0, 39.0, 22.0, 16.0, 17.0, 13.0, 8.0, 2.0, 9.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.055938720703125, -0.05424642562866211, -0.05255413055419922, -0.05086183547973633, -0.04916954040527344, -0.04747724533081055, -0.045784950256347656, -0.044092655181884766, -0.042400360107421875, -0.040708065032958984, -0.039015769958496094, -0.0373234748840332, -0.03563117980957031, -0.03393888473510742, -0.03224658966064453, -0.03055429458618164, -0.02886199951171875, -0.02716970443725586, -0.02547740936279297, -0.023785114288330078, -0.022092819213867188, -0.020400524139404297, -0.018708229064941406, -0.017015933990478516, -0.015323638916015625, -0.013631343841552734, -0.011939048767089844, -0.010246753692626953, -0.008554458618164062, -0.006862163543701172, -0.005169868469238281, -0.0034775733947753906, -0.0017852783203125, -9.298324584960938e-05, 0.0015993118286132812, 0.003291606903076172, 0.0049839019775390625, 0.006676197052001953, 0.008368492126464844, 0.010060787200927734, 0.011753082275390625, 0.013445377349853516, 0.015137672424316406, 0.016829967498779297, 0.018522262573242188, 0.020214557647705078, 0.02190685272216797, 0.02359914779663086, 0.02529144287109375, 0.02698373794555664, 0.02867603302001953, 0.030368328094482422, 0.03206062316894531, 0.0337529182434082, 0.035445213317871094, 0.037137508392333984, 0.038829803466796875, 0.040522098541259766, 0.042214393615722656, 0.04390668869018555, 0.04559898376464844, 0.04729127883911133, 0.04898357391357422, 0.05067586898803711, 0.0523681640625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 11.0, 8.0, 16.0, 37.0, 51.0, 118.0, 169.0, 198.0, 170.0, 88.0, 63.0, 28.0, 22.0, 11.0, 6.0, 4.0, 6.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.159875869750977e-05, -7.935706526041031e-05, -7.711537182331085e-05, -7.48736783862114e-05, -7.263198494911194e-05, -7.039029151201248e-05, -6.814859807491302e-05, -6.590690463781357e-05, -6.366521120071411e-05, -6.142351776361465e-05, -5.91818243265152e-05, -5.694013088941574e-05, -5.4698437452316284e-05, -5.245674401521683e-05, -5.021505057811737e-05, -4.7973357141017914e-05, -4.573166370391846e-05, -4.3489970266819e-05, -4.1248276829719543e-05, -3.900658339262009e-05, -3.676488995552063e-05, -3.452319651842117e-05, -3.2281503081321716e-05, -3.003980964422226e-05, -2.7798116207122803e-05, -2.5556422770023346e-05, -2.331472933292389e-05, -2.1073035895824432e-05, -1.8831342458724976e-05, -1.658964902162552e-05, -1.4347955584526062e-05, -1.2106262147426605e-05, -9.864568710327148e-06, -7.622875273227692e-06, -5.381181836128235e-06, -3.139488399028778e-06, -8.977949619293213e-07, 1.3438984751701355e-06, 3.5855919122695923e-06, 5.827285349369049e-06, 8.068978786468506e-06, 1.0310672223567963e-05, 1.255236566066742e-05, 1.4794059097766876e-05, 1.7035752534866333e-05, 1.927744597196579e-05, 2.1519139409065247e-05, 2.3760832846164703e-05, 2.600252628326416e-05, 2.8244219720363617e-05, 3.0485913157463074e-05, 3.272760659456253e-05, 3.496930003166199e-05, 3.7210993468761444e-05, 3.94526869058609e-05, 4.169438034296036e-05, 4.3936073780059814e-05, 4.617776721715927e-05, 4.841946065425873e-05, 5.0661154091358185e-05, 5.290284752845764e-05, 5.51445409655571e-05, 5.7386234402656555e-05, 5.962792783975601e-05, 6.186962127685547e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 3.0, 6.0, 8.0, 9.0, 14.0, 20.0, 37.0, 39.0, 83.0, 118.0, 197.0, 289.0, 454.0, 804.0, 1510.0, 2779.0, 6218.0, 16559.0, 57549.0, 568942.0, 325672.0, 43194.0, 13305.0, 5161.0, 2416.0, 1252.0, 711.0, 436.0, 251.0, 164.0, 121.0, 73.0, 41.0, 32.0, 24.0, 16.0, 12.0, 11.0, 8.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0545654296875, -0.05260944366455078, -0.05065345764160156, -0.048697471618652344, -0.046741485595703125, -0.044785499572753906, -0.04282951354980469, -0.04087352752685547, -0.03891754150390625, -0.03696155548095703, -0.03500556945800781, -0.033049583435058594, -0.031093597412109375, -0.029137611389160156, -0.027181625366210938, -0.02522563934326172, -0.0232696533203125, -0.02131366729736328, -0.019357681274414062, -0.017401695251464844, -0.015445709228515625, -0.013489723205566406, -0.011533737182617188, -0.009577751159667969, -0.00762176513671875, -0.005665779113769531, -0.0037097930908203125, -0.0017538070678710938, 0.000202178955078125, 0.0021581649780273438, 0.0041141510009765625, 0.006070137023925781, 0.008026123046875, 0.009982109069824219, 0.011938095092773438, 0.013894081115722656, 0.015850067138671875, 0.017806053161621094, 0.019762039184570312, 0.02171802520751953, 0.02367401123046875, 0.02562999725341797, 0.027585983276367188, 0.029541969299316406, 0.031497955322265625, 0.033453941345214844, 0.03540992736816406, 0.03736591339111328, 0.0393218994140625, 0.04127788543701172, 0.04323387145996094, 0.045189857482910156, 0.047145843505859375, 0.049101829528808594, 0.05105781555175781, 0.05301380157470703, 0.05496978759765625, 0.05692577362060547, 0.05888175964355469, 0.060837745666503906, 0.06279373168945312, 0.06474971771240234, 0.06670570373535156, 0.06866168975830078, 0.07061767578125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 4.0, 8.0, 9.0, 7.0, 10.0, 12.0, 25.0, 23.0, 38.0, 46.0, 75.0, 127.0, 187.0, 131.0, 87.0, 48.0, 36.0, 29.0, 24.0, 10.0, 7.0, 9.0, 8.0, 10.0, 6.0, 2.0, 3.0, 1.0, 2.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.045379638671875, -0.0439448356628418, -0.042510032653808594, -0.04107522964477539, -0.03964042663574219, -0.038205623626708984, -0.03677082061767578, -0.03533601760864258, -0.033901214599609375, -0.03246641159057617, -0.03103160858154297, -0.029596805572509766, -0.028162002563476562, -0.02672719955444336, -0.025292396545410156, -0.023857593536376953, -0.02242279052734375, -0.020987987518310547, -0.019553184509277344, -0.01811838150024414, -0.016683578491210938, -0.015248775482177734, -0.013813972473144531, -0.012379169464111328, -0.010944366455078125, -0.009509563446044922, -0.008074760437011719, -0.006639957427978516, -0.0052051544189453125, -0.0037703514099121094, -0.0023355484008789062, -0.0009007453918457031, 0.0005340576171875, 0.001968860626220703, 0.0034036636352539062, 0.004838466644287109, 0.0062732696533203125, 0.007708072662353516, 0.009142875671386719, 0.010577678680419922, 0.012012481689453125, 0.013447284698486328, 0.014882087707519531, 0.016316890716552734, 0.017751693725585938, 0.01918649673461914, 0.020621299743652344, 0.022056102752685547, 0.02349090576171875, 0.024925708770751953, 0.026360511779785156, 0.02779531478881836, 0.029230117797851562, 0.030664920806884766, 0.03209972381591797, 0.03353452682495117, 0.034969329833984375, 0.03640413284301758, 0.03783893585205078, 0.039273738861083984, 0.04070854187011719, 0.04214334487915039, 0.043578147888183594, 0.0450129508972168, 0.04644775390625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 9.0, 9.0, 54.0, 154.0, 294.0, 287.0, 149.0, 39.0, 10.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.5535879135131836, -2.5014238357543945, -2.4492597579956055, -2.3970954418182373, -2.3449313640594482, -2.292767286300659, -2.24060320854187, -2.188438892364502, -2.136274814605713, -2.084110736846924, -2.0319466590881348, -1.9797824621200562, -1.9276182651519775, -1.8754541873931885, -1.8232901096343994, -1.7711259126663208, -1.7189618349075317, -1.6667977571487427, -1.614633560180664, -1.562469482421875, -1.5103052854537964, -1.4581412076950073, -1.4059770107269287, -1.3538129329681396, -1.3016488552093506, -1.2494847774505615, -1.197320580482483, -1.1451565027236938, -1.0929923057556152, -1.0408282279968262, -0.9886640906333923, -0.9364999532699585, -0.8843357563018799, -0.832171618938446, -0.7800074815750122, -0.7278434038162231, -0.6756792068481445, -0.6235151290893555, -0.5713509917259216, -0.5191868543624878, -0.46702271699905396, -0.4148585796356201, -0.3626944422721863, -0.31053033471107483, -0.258366197347641, -0.20620205998420715, -0.1540379524230957, -0.10187381505966187, -0.04970967769622803, 0.0024544522166252136, 0.054618582129478455, 0.1067827045917511, 0.15894684195518494, 0.21111097931861877, 0.2632750868797302, 0.31543922424316406, 0.3676033616065979, 0.41976749897003174, 0.4719316363334656, 0.5240957736968994, 0.5762598514556885, 0.6284240484237671, 0.6805881261825562, 0.73275226354599, 0.7849164009094238]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 1.0, 4.0, 6.0, 4.0, 8.0, 8.0, 16.0, 17.0, 20.0, 21.0, 18.0, 35.0, 21.0, 40.0, 41.0, 38.0, 41.0, 41.0, 36.0, 42.0, 35.0, 46.0, 41.0, 51.0, 55.0, 45.0, 35.0, 43.0, 27.0, 25.0, 19.0, 21.0, 15.0, 18.0, 14.0, 10.0, 13.0, 7.0, 7.0, 6.0, 4.0, 3.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36976349353790283, -0.3567947745323181, -0.3438260555267334, -0.3308573365211487, -0.31788861751556396, -0.30491989850997925, -0.29195117950439453, -0.2789824604988098, -0.2660137414932251, -0.2530450224876404, -0.24007630348205566, -0.22710758447647095, -0.21413886547088623, -0.2011701464653015, -0.1882014274597168, -0.17523270845413208, -0.16226397454738617, -0.14929525554180145, -0.13632653653621674, -0.12335781753063202, -0.1103890985250473, -0.09742037206888199, -0.08445165306329727, -0.07148293405771255, -0.05851421505212784, -0.04554549604654312, -0.032576777040958405, -0.01960805431008339, -0.0066393353044986725, 0.006329387426376343, 0.01929810643196106, 0.032266825437545776, 0.04523554444313049, 0.05820426344871521, 0.07117298245429993, 0.08414170145988464, 0.09711042046546936, 0.11007914692163467, 0.12304786592721939, 0.1360165774822235, 0.14898529648780823, 0.16195401549339294, 0.17492273449897766, 0.18789145350456238, 0.2008601725101471, 0.2138288915157318, 0.22679761052131653, 0.23976632952690125, 0.25273507833480835, 0.26570379734039307, 0.2786725163459778, 0.2916412353515625, 0.3046099543571472, 0.31757867336273193, 0.33054739236831665, 0.34351611137390137, 0.3564848303794861, 0.3694535493850708, 0.3824222683906555, 0.39539098739624023, 0.40835970640182495, 0.42132842540740967, 0.4342971444129944, 0.4472658634185791, 0.4602345824241638]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 7.0, 4.0, 12.0, 14.0, 24.0, 31.0, 58.0, 94.0, 110.0, 175.0, 302.0, 426.0, 725.0, 1201.0, 1877.0, 3351.0, 6361.0, 12574.0, 29478.0, 88837.0, 628344.0, 3208204.0, 137802.0, 40268.0, 15863.0, 7774.0, 4062.0, 2296.0, 1425.0, 878.0, 569.0, 378.0, 258.0, 144.0, 115.0, 72.0, 58.0, 31.0, 25.0, 17.0, 13.0, 7.0, 9.0, 6.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06707763671875, -0.06477737426757812, -0.06247711181640625, -0.060176849365234375, -0.0578765869140625, -0.055576324462890625, -0.05327606201171875, -0.050975799560546875, -0.048675537109375, -0.046375274658203125, -0.04407501220703125, -0.041774749755859375, -0.0394744873046875, -0.037174224853515625, -0.03487396240234375, -0.032573699951171875, -0.0302734375, -0.027973175048828125, -0.02567291259765625, -0.023372650146484375, -0.0210723876953125, -0.018772125244140625, -0.01647186279296875, -0.014171600341796875, -0.011871337890625, -0.009571075439453125, -0.00727081298828125, -0.004970550537109375, -0.0026702880859375, -0.000370025634765625, 0.00193023681640625, 0.004230499267578125, 0.00653076171875, 0.008831024169921875, 0.01113128662109375, 0.013431549072265625, 0.0157318115234375, 0.018032073974609375, 0.02033233642578125, 0.022632598876953125, 0.024932861328125, 0.027233123779296875, 0.02953338623046875, 0.031833648681640625, 0.0341339111328125, 0.036434173583984375, 0.03873443603515625, 0.041034698486328125, 0.0433349609375, 0.045635223388671875, 0.04793548583984375, 0.050235748291015625, 0.0525360107421875, 0.054836273193359375, 0.05713653564453125, 0.059436798095703125, 0.061737060546875, 0.06403732299804688, 0.06633758544921875, 0.06863784790039062, 0.0709381103515625, 0.07323837280273438, 0.07553863525390625, 0.07783889770507812, 0.08013916015625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 7.0, 2.0, 2.0, 7.0, 6.0, 8.0, 6.0, 17.0, 14.0, 21.0, 25.0, 41.0, 35.0, 39.0, 49.0, 61.0, 39.0, 56.0, 71.0, 54.0, 57.0, 45.0, 48.0, 52.0, 44.0, 33.0, 35.0, 28.0, 18.0, 23.0, 14.0, 12.0, 11.0, 4.0, 9.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015869140625, -0.015159845352172852, -0.014450550079345703, -0.013741254806518555, -0.013031959533691406, -0.012322664260864258, -0.01161336898803711, -0.010904073715209961, -0.010194778442382812, -0.009485483169555664, -0.008776187896728516, -0.008066892623901367, -0.007357597351074219, -0.00664830207824707, -0.005939006805419922, -0.0052297115325927734, -0.004520416259765625, -0.0038111209869384766, -0.003101825714111328, -0.0023925304412841797, -0.0016832351684570312, -0.0009739398956298828, -0.0002646446228027344, 0.00044465065002441406, 0.0011539459228515625, 0.001863241195678711, 0.0025725364685058594, 0.003281831741333008, 0.003991127014160156, 0.004700422286987305, 0.005409717559814453, 0.0061190128326416016, 0.00682830810546875, 0.0075376033782958984, 0.008246898651123047, 0.008956193923950195, 0.009665489196777344, 0.010374784469604492, 0.01108407974243164, 0.011793375015258789, 0.012502670288085938, 0.013211965560913086, 0.013921260833740234, 0.014630556106567383, 0.015339851379394531, 0.01604914665222168, 0.016758441925048828, 0.017467737197875977, 0.018177032470703125, 0.018886327743530273, 0.019595623016357422, 0.02030491828918457, 0.02101421356201172, 0.021723508834838867, 0.022432804107666016, 0.023142099380493164, 0.023851394653320312, 0.02456068992614746, 0.02526998519897461, 0.025979280471801758, 0.026688575744628906, 0.027397871017456055, 0.028107166290283203, 0.02881646156311035, 0.0295257568359375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 8.0, 9.0, 20.0, 14.0, 27.0, 44.0, 59.0, 133.0, 163.0, 257.0, 449.0, 749.0, 1354.0, 2465.0, 4679.0, 9077.0, 19332.0, 47862.0, 159069.0, 2491786.0, 1240920.0, 136003.0, 42958.0, 18162.0, 8776.0, 4342.0, 2344.0, 1294.0, 765.0, 429.0, 272.0, 190.0, 76.0, 66.0, 47.0, 29.0, 21.0, 15.0, 8.0, 7.0, 0.0, 5.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.063720703125, -0.061440467834472656, -0.05916023254394531, -0.05687999725341797, -0.054599761962890625, -0.05231952667236328, -0.05003929138183594, -0.047759056091308594, -0.04547882080078125, -0.043198585510253906, -0.04091835021972656, -0.03863811492919922, -0.036357879638671875, -0.03407764434814453, -0.03179740905761719, -0.029517173767089844, -0.0272369384765625, -0.024956703186035156, -0.022676467895507812, -0.02039623260498047, -0.018115997314453125, -0.01583576202392578, -0.013555526733398438, -0.011275291442871094, -0.00899505615234375, -0.006714820861816406, -0.0044345855712890625, -0.0021543502807617188, 0.000125885009765625, 0.0024061203002929688, 0.0046863555908203125, 0.006966590881347656, 0.009246826171875, 0.011527061462402344, 0.013807296752929688, 0.01608753204345703, 0.018367767333984375, 0.02064800262451172, 0.022928237915039062, 0.025208473205566406, 0.02748870849609375, 0.029768943786621094, 0.03204917907714844, 0.03432941436767578, 0.036609649658203125, 0.03888988494873047, 0.04117012023925781, 0.043450355529785156, 0.0457305908203125, 0.048010826110839844, 0.05029106140136719, 0.05257129669189453, 0.054851531982421875, 0.05713176727294922, 0.05941200256347656, 0.061692237854003906, 0.06397247314453125, 0.0662527084350586, 0.06853294372558594, 0.07081317901611328, 0.07309341430664062, 0.07537364959716797, 0.07765388488769531, 0.07993412017822266, 0.08221435546875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 7.0, 8.0, 13.0, 15.0, 24.0, 31.0, 43.0, 65.0, 123.0, 246.0, 690.0, 1881.0, 426.0, 193.0, 91.0, 66.0, 37.0, 30.0, 21.0, 15.0, 14.0, 12.0, 8.0, 6.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.047454833984375, -0.04602956771850586, -0.04460430145263672, -0.04317903518676758, -0.04175376892089844, -0.0403285026550293, -0.038903236389160156, -0.037477970123291016, -0.036052703857421875, -0.034627437591552734, -0.033202171325683594, -0.03177690505981445, -0.030351638793945312, -0.028926372528076172, -0.02750110626220703, -0.02607583999633789, -0.02465057373046875, -0.02322530746459961, -0.02180004119873047, -0.020374774932861328, -0.018949508666992188, -0.017524242401123047, -0.016098976135253906, -0.014673709869384766, -0.013248443603515625, -0.011823177337646484, -0.010397911071777344, -0.008972644805908203, -0.0075473785400390625, -0.006122112274169922, -0.004696846008300781, -0.0032715797424316406, -0.0018463134765625, -0.0004210472106933594, 0.0010042190551757812, 0.002429485321044922, 0.0038547515869140625, 0.005280017852783203, 0.006705284118652344, 0.008130550384521484, 0.009555816650390625, 0.010981082916259766, 0.012406349182128906, 0.013831615447998047, 0.015256881713867188, 0.016682147979736328, 0.01810741424560547, 0.01953268051147461, 0.02095794677734375, 0.02238321304321289, 0.02380847930908203, 0.025233745574951172, 0.026659011840820312, 0.028084278106689453, 0.029509544372558594, 0.030934810638427734, 0.032360076904296875, 0.033785343170166016, 0.035210609436035156, 0.0366358757019043, 0.03806114196777344, 0.03948640823364258, 0.04091167449951172, 0.04233694076538086, 0.04376220703125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 10.0, 10.0, 36.0, 70.0, 130.0, 181.0, 193.0, 153.0, 111.0, 61.0, 25.0, 17.0, 5.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.14869078993797302, -0.13735340535640717, -0.1260160207748413, -0.11467864364385605, -0.10334125906229019, -0.09200387448072433, -0.08066649734973907, -0.06932911276817322, -0.05799172818660736, -0.046654343605041504, -0.035316962748765945, -0.023979581892490387, -0.01264219731092453, -0.001304812729358673, 0.010032564401626587, 0.021369948983192444, 0.0327073335647583, 0.04404471814632416, 0.055382099002599716, 0.06671947985887527, 0.07805686444044113, 0.08939424902200699, 0.10073162615299225, 0.1120690107345581, 0.12340639531612396, 0.13474377989768982, 0.14608116447925568, 0.15741854906082153, 0.1687559187412262, 0.18009331822395325, 0.1914306879043579, 0.20276807248592377, 0.21410542726516724, 0.2254428118467331, 0.23678019642829895, 0.2481175661087036, 0.25945496559143066, 0.2707923352718353, 0.28212970495224, 0.29346710443496704, 0.3048045039176941, 0.31614187359809875, 0.3274792730808258, 0.33881664276123047, 0.3501540422439575, 0.3614914119243622, 0.37282878160476685, 0.3841661810874939, 0.39550355076789856, 0.4068409204483032, 0.4181783199310303, 0.42951568961143494, 0.440853089094162, 0.45219045877456665, 0.4635278582572937, 0.47486522793769836, 0.486202597618103, 0.4975399672985077, 0.5088773369789124, 0.5202147364616394, 0.5315521359443665, 0.5428895354270935, 0.5542268753051758, 0.5655642747879028, 0.5769016742706299]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 5.0, 7.0, 8.0, 11.0, 16.0, 27.0, 34.0, 29.0, 33.0, 28.0, 35.0, 36.0, 45.0, 35.0, 52.0, 55.0, 51.0, 53.0, 62.0, 44.0, 51.0, 42.0, 45.0, 32.0, 24.0, 28.0, 23.0, 28.0, 13.0, 16.0, 10.0, 7.0, 5.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11925679445266724, -0.11501452326774597, -0.11077225208282471, -0.10652998089790344, -0.10228770971298218, -0.09804543852806091, -0.09380317479372025, -0.08956090360879898, -0.08531863242387772, -0.08107636123895645, -0.07683409005403519, -0.07259181886911392, -0.06834955513477325, -0.06410728394985199, -0.059865012764930725, -0.05562274158000946, -0.051380470395088196, -0.04713819921016693, -0.042895928025245667, -0.0386536605656147, -0.034411389380693436, -0.03016911819577217, -0.025926848873496056, -0.02168457955121994, -0.017442308366298676, -0.013200038112699986, -0.008957767859101295, -0.0047154976055026054, -0.0004732273519039154, 0.0037690438330173492, 0.008011313155293465, 0.01225358247756958, 0.016495853662490845, 0.02073812484741211, 0.024980394169688225, 0.02922266349196434, 0.033464934676885605, 0.03770720586180687, 0.041949473321437836, 0.0461917445063591, 0.050434015691280365, 0.05467628687620163, 0.058918558061122894, 0.06316082924604416, 0.06740309298038483, 0.07164536416530609, 0.07588763535022736, 0.08012990653514862, 0.08437217772006989, 0.08861444890499115, 0.09285672008991241, 0.09709899127483368, 0.10134126245975494, 0.10558353364467621, 0.10982579737901688, 0.11406806856393814, 0.1183103397488594, 0.12255261093378067, 0.12679487466812134, 0.1310371458530426, 0.13527941703796387, 0.13952168822288513, 0.1437639594078064, 0.14800623059272766, 0.15224850177764893]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 1.0, 4.0, 7.0, 9.0, 17.0, 14.0, 38.0, 38.0, 65.0, 135.0, 237.0, 476.0, 1029.0, 2567.0, 6415.0, 17366.0, 50876.0, 229459.0, 577964.0, 110242.0, 32394.0, 11485.0, 4345.0, 1759.0, 778.0, 357.0, 183.0, 99.0, 63.0, 49.0, 32.0, 14.0, 15.0, 7.0, 4.0, 3.0, 8.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07135009765625, -0.06863689422607422, -0.06592369079589844, -0.06321048736572266, -0.060497283935546875, -0.057784080505371094, -0.05507087707519531, -0.05235767364501953, -0.04964447021484375, -0.04693126678466797, -0.04421806335449219, -0.041504859924316406, -0.038791656494140625, -0.036078453063964844, -0.03336524963378906, -0.03065204620361328, -0.0279388427734375, -0.02522563934326172, -0.022512435913085938, -0.019799232482910156, -0.017086029052734375, -0.014372825622558594, -0.011659622192382812, -0.008946418762207031, -0.00623321533203125, -0.0035200119018554688, -0.0008068084716796875, 0.0019063949584960938, 0.004619598388671875, 0.007332801818847656, 0.010046005249023438, 0.012759208679199219, 0.015472412109375, 0.01818561553955078, 0.020898818969726562, 0.023612022399902344, 0.026325225830078125, 0.029038429260253906, 0.03175163269042969, 0.03446483612060547, 0.03717803955078125, 0.03989124298095703, 0.04260444641113281, 0.045317649841308594, 0.048030853271484375, 0.050744056701660156, 0.05345726013183594, 0.05617046356201172, 0.0588836669921875, 0.06159687042236328, 0.06431007385253906, 0.06702327728271484, 0.06973648071289062, 0.0724496841430664, 0.07516288757324219, 0.07787609100341797, 0.08058929443359375, 0.08330249786376953, 0.08601570129394531, 0.0887289047241211, 0.09144210815429688, 0.09415531158447266, 0.09686851501464844, 0.09958171844482422, 0.102294921875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 7.0, 4.0, 4.0, 4.0, 6.0, 4.0, 11.0, 18.0, 24.0, 17.0, 37.0, 22.0, 26.0, 37.0, 46.0, 52.0, 38.0, 49.0, 67.0, 57.0, 49.0, 49.0, 49.0, 40.0, 46.0, 32.0, 38.0, 25.0, 28.0, 17.0, 22.0, 11.0, 10.0, 16.0, 8.0, 9.0, 5.0, 7.0, 4.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0184173583984375, -0.017778873443603516, -0.01714038848876953, -0.016501903533935547, -0.015863418579101562, -0.015224933624267578, -0.014586448669433594, -0.01394796371459961, -0.013309478759765625, -0.01267099380493164, -0.012032508850097656, -0.011394023895263672, -0.010755538940429688, -0.010117053985595703, -0.009478569030761719, -0.008840084075927734, -0.00820159912109375, -0.007563114166259766, -0.006924629211425781, -0.006286144256591797, -0.0056476593017578125, -0.005009174346923828, -0.004370689392089844, -0.0037322044372558594, -0.003093719482421875, -0.0024552345275878906, -0.0018167495727539062, -0.0011782646179199219, -0.0005397796630859375, 9.870529174804688e-05, 0.0007371902465820312, 0.0013756752014160156, 0.00201416015625, 0.0026526451110839844, 0.0032911300659179688, 0.003929615020751953, 0.0045680999755859375, 0.005206584930419922, 0.005845069885253906, 0.006483554840087891, 0.007122039794921875, 0.007760524749755859, 0.008399009704589844, 0.009037494659423828, 0.009675979614257812, 0.010314464569091797, 0.010952949523925781, 0.011591434478759766, 0.01222991943359375, 0.012868404388427734, 0.013506889343261719, 0.014145374298095703, 0.014783859252929688, 0.015422344207763672, 0.016060829162597656, 0.01669931411743164, 0.017337799072265625, 0.01797628402709961, 0.018614768981933594, 0.019253253936767578, 0.019891738891601562, 0.020530223846435547, 0.02116870880126953, 0.021807193756103516, 0.0224456787109375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 5.0, 3.0, 3.0, 4.0, 7.0, 5.0, 5.0, 14.0, 11.0, 16.0, 31.0, 37.0, 58.0, 93.0, 145.0, 256.0, 464.0, 844.0, 1947.0, 4356.0, 10931.0, 29395.0, 96361.0, 629253.0, 204077.0, 43211.0, 15706.0, 6100.0, 2628.0, 1132.0, 591.0, 321.0, 186.0, 112.0, 71.0, 55.0, 34.0, 21.0, 16.0, 15.0, 10.0, 11.0, 1.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.09130859375, -0.08859825134277344, -0.08588790893554688, -0.08317756652832031, -0.08046722412109375, -0.07775688171386719, -0.07504653930664062, -0.07233619689941406, -0.0696258544921875, -0.06691551208496094, -0.06420516967773438, -0.06149482727050781, -0.05878448486328125, -0.05607414245605469, -0.053363800048828125, -0.05065345764160156, -0.047943115234375, -0.04523277282714844, -0.042522430419921875, -0.03981208801269531, -0.03710174560546875, -0.03439140319824219, -0.031681060791015625, -0.028970718383789062, -0.0262603759765625, -0.023550033569335938, -0.020839691162109375, -0.018129348754882812, -0.01541900634765625, -0.012708663940429688, -0.009998321533203125, -0.0072879791259765625, -0.00457763671875, -0.0018672943115234375, 0.000843048095703125, 0.0035533905029296875, 0.00626373291015625, 0.008974075317382812, 0.011684417724609375, 0.014394760131835938, 0.0171051025390625, 0.019815444946289062, 0.022525787353515625, 0.025236129760742188, 0.02794647216796875, 0.030656814575195312, 0.033367156982421875, 0.03607749938964844, 0.038787841796875, 0.04149818420410156, 0.044208526611328125, 0.04691886901855469, 0.04962921142578125, 0.05233955383300781, 0.055049896240234375, 0.05776023864746094, 0.0604705810546875, 0.06318092346191406, 0.06589126586914062, 0.06860160827636719, 0.07131195068359375, 0.07402229309082031, 0.07673263549804688, 0.07944297790527344, 0.0821533203125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 6.0, 7.0, 5.0, 13.0, 8.0, 16.0, 19.0, 23.0, 31.0, 46.0, 58.0, 57.0, 58.0, 66.0, 68.0, 73.0, 45.0, 57.0, 61.0, 62.0, 37.0, 38.0, 30.0, 24.0, 15.0, 22.0, 12.0, 10.0, 10.0, 6.0, 4.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11737060546875, -0.1137704849243164, -0.11017036437988281, -0.10657024383544922, -0.10297012329101562, -0.09937000274658203, -0.09576988220214844, -0.09216976165771484, -0.08856964111328125, -0.08496952056884766, -0.08136940002441406, -0.07776927947998047, -0.07416915893554688, -0.07056903839111328, -0.06696891784667969, -0.0633687973022461, -0.0597686767578125, -0.056168556213378906, -0.05256843566894531, -0.04896831512451172, -0.045368194580078125, -0.04176807403564453, -0.03816795349121094, -0.034567832946777344, -0.03096771240234375, -0.027367591857910156, -0.023767471313476562, -0.02016735076904297, -0.016567230224609375, -0.012967109680175781, -0.009366989135742188, -0.005766868591308594, -0.002166748046875, 0.0014333724975585938, 0.0050334930419921875, 0.008633613586425781, 0.012233734130859375, 0.01583385467529297, 0.019433975219726562, 0.023034095764160156, 0.02663421630859375, 0.030234336853027344, 0.03383445739746094, 0.03743457794189453, 0.041034698486328125, 0.04463481903076172, 0.04823493957519531, 0.051835060119628906, 0.0554351806640625, 0.059035301208496094, 0.06263542175292969, 0.06623554229736328, 0.06983566284179688, 0.07343578338623047, 0.07703590393066406, 0.08063602447509766, 0.08423614501953125, 0.08783626556396484, 0.09143638610839844, 0.09503650665283203, 0.09863662719726562, 0.10223674774169922, 0.10583686828613281, 0.1094369888305664, 0.113037109375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 8.0, 5.0, 16.0, 14.0, 29.0, 31.0, 61.0, 67.0, 93.0, 128.0, 217.0, 301.0, 431.0, 752.0, 1166.0, 2052.0, 3795.0, 8838.0, 23927.0, 96725.0, 689110.0, 165999.0, 32836.0, 11130.0, 4804.0, 2371.0, 1335.0, 765.0, 559.0, 333.0, 188.0, 140.0, 106.0, 71.0, 44.0, 34.0, 30.0, 18.0, 10.0, 4.0, 2.0, 8.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048675537109375, -0.047086238861083984, -0.04549694061279297, -0.04390764236450195, -0.04231834411621094, -0.04072904586791992, -0.039139747619628906, -0.03755044937133789, -0.035961151123046875, -0.03437185287475586, -0.032782554626464844, -0.031193256378173828, -0.029603958129882812, -0.028014659881591797, -0.02642536163330078, -0.024836063385009766, -0.02324676513671875, -0.021657466888427734, -0.02006816864013672, -0.018478870391845703, -0.016889572143554688, -0.015300273895263672, -0.013710975646972656, -0.01212167739868164, -0.010532379150390625, -0.00894308090209961, -0.007353782653808594, -0.005764484405517578, -0.0041751861572265625, -0.002585887908935547, -0.0009965896606445312, 0.0005927085876464844, 0.0021820068359375, 0.0037713050842285156, 0.005360603332519531, 0.006949901580810547, 0.008539199829101562, 0.010128498077392578, 0.011717796325683594, 0.01330709457397461, 0.014896392822265625, 0.01648569107055664, 0.018074989318847656, 0.019664287567138672, 0.021253585815429688, 0.022842884063720703, 0.02443218231201172, 0.026021480560302734, 0.02761077880859375, 0.029200077056884766, 0.03078937530517578, 0.0323786735534668, 0.03396797180175781, 0.03555727005004883, 0.037146568298339844, 0.03873586654663086, 0.040325164794921875, 0.04191446304321289, 0.043503761291503906, 0.04509305953979492, 0.04668235778808594, 0.04827165603637695, 0.04986095428466797, 0.051450252532958984, 0.05303955078125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 8.0, 6.0, 13.0, 17.0, 29.0, 55.0, 77.0, 111.0, 177.0, 142.0, 143.0, 91.0, 55.0, 25.0, 15.0, 7.0, 11.0, 7.0, 8.0, 8.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.036592483520508e-05, -4.874635487794876e-05, -4.7126784920692444e-05, -4.550721496343613e-05, -4.388764500617981e-05, -4.226807504892349e-05, -4.0648505091667175e-05, -3.902893513441086e-05, -3.740936517715454e-05, -3.5789795219898224e-05, -3.417022526264191e-05, -3.255065530538559e-05, -3.093108534812927e-05, -2.9311515390872955e-05, -2.7691945433616638e-05, -2.607237547636032e-05, -2.4452805519104004e-05, -2.2833235561847687e-05, -2.121366560459137e-05, -1.9594095647335052e-05, -1.7974525690078735e-05, -1.6354955732822418e-05, -1.4735385775566101e-05, -1.3115815818309784e-05, -1.1496245861053467e-05, -9.87667590379715e-06, -8.257105946540833e-06, -6.637535989284515e-06, -5.017966032028198e-06, -3.398396074771881e-06, -1.778826117515564e-06, -1.5925616025924683e-07, 1.4603137969970703e-06, 3.0798837542533875e-06, 4.699453711509705e-06, 6.319023668766022e-06, 7.938593626022339e-06, 9.558163583278656e-06, 1.1177733540534973e-05, 1.279730349779129e-05, 1.4416873455047607e-05, 1.6036443412303925e-05, 1.7656013369560242e-05, 1.927558332681656e-05, 2.0895153284072876e-05, 2.2514723241329193e-05, 2.413429319858551e-05, 2.5753863155841827e-05, 2.7373433113098145e-05, 2.899300307035446e-05, 3.061257302761078e-05, 3.2232142984867096e-05, 3.385171294212341e-05, 3.547128289937973e-05, 3.709085285663605e-05, 3.8710422813892365e-05, 4.032999277114868e-05, 4.1949562728405e-05, 4.3569132685661316e-05, 4.518870264291763e-05, 4.680827260017395e-05, 4.842784255743027e-05, 5.0047412514686584e-05, 5.16669824719429e-05, 5.328655242919922e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 10.0, 5.0, 8.0, 17.0, 22.0, 23.0, 38.0, 79.0, 114.0, 207.0, 389.0, 902.0, 2444.0, 7322.0, 34522.0, 718804.0, 254899.0, 20190.0, 5154.0, 1879.0, 792.0, 325.0, 148.0, 91.0, 58.0, 39.0, 24.0, 21.0, 7.0, 13.0, 4.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08721923828125, -0.08448123931884766, -0.08174324035644531, -0.07900524139404297, -0.07626724243164062, -0.07352924346923828, -0.07079124450683594, -0.0680532455444336, -0.06531524658203125, -0.0625772476196289, -0.05983924865722656, -0.05710124969482422, -0.054363250732421875, -0.05162525177001953, -0.04888725280761719, -0.046149253845214844, -0.0434112548828125, -0.040673255920410156, -0.03793525695800781, -0.03519725799560547, -0.032459259033203125, -0.02972126007080078, -0.026983261108398438, -0.024245262145996094, -0.02150726318359375, -0.018769264221191406, -0.016031265258789062, -0.013293266296386719, -0.010555267333984375, -0.007817268371582031, -0.0050792694091796875, -0.0023412704467773438, 0.000396728515625, 0.0031347274780273438, 0.0058727264404296875, 0.008610725402832031, 0.011348724365234375, 0.014086723327636719, 0.016824722290039062, 0.019562721252441406, 0.02230072021484375, 0.025038719177246094, 0.027776718139648438, 0.03051471710205078, 0.033252716064453125, 0.03599071502685547, 0.03872871398925781, 0.041466712951660156, 0.0442047119140625, 0.046942710876464844, 0.04968070983886719, 0.05241870880126953, 0.055156707763671875, 0.05789470672607422, 0.06063270568847656, 0.0633707046508789, 0.06610870361328125, 0.0688467025756836, 0.07158470153808594, 0.07432270050048828, 0.07706069946289062, 0.07979869842529297, 0.08253669738769531, 0.08527469635009766, 0.0880126953125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 4.0, 4.0, 9.0, 6.0, 16.0, 14.0, 22.0, 47.0, 88.0, 147.0, 211.0, 172.0, 89.0, 67.0, 32.0, 15.0, 8.0, 11.0, 4.0, 6.0, 7.0, 5.0, 1.0, 1.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.072265625, -0.07039642333984375, -0.0685272216796875, -0.06665802001953125, -0.064788818359375, -0.06291961669921875, -0.0610504150390625, -0.05918121337890625, -0.05731201171875, -0.05544281005859375, -0.0535736083984375, -0.05170440673828125, -0.049835205078125, -0.04796600341796875, -0.0460968017578125, -0.04422760009765625, -0.0423583984375, -0.04048919677734375, -0.0386199951171875, -0.03675079345703125, -0.034881591796875, -0.03301239013671875, -0.0311431884765625, -0.02927398681640625, -0.02740478515625, -0.02553558349609375, -0.0236663818359375, -0.02179718017578125, -0.019927978515625, -0.01805877685546875, -0.0161895751953125, -0.01432037353515625, -0.012451171875, -0.01058197021484375, -0.0087127685546875, -0.00684356689453125, -0.004974365234375, -0.00310516357421875, -0.0012359619140625, 0.00063323974609375, 0.00250244140625, 0.00437164306640625, 0.0062408447265625, 0.00811004638671875, 0.009979248046875, 0.01184844970703125, 0.0137176513671875, 0.01558685302734375, 0.0174560546875, 0.01932525634765625, 0.0211944580078125, 0.02306365966796875, 0.024932861328125, 0.02680206298828125, 0.0286712646484375, 0.03054046630859375, 0.03240966796875, 0.03427886962890625, 0.0361480712890625, 0.03801727294921875, 0.039886474609375, 0.04175567626953125, 0.0436248779296875, 0.04549407958984375, 0.04736328125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 7.0, 28.0, 38.0, 87.0, 158.0, 237.0, 203.0, 113.0, 84.0, 33.0, 13.0, 6.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9615683555603027, -0.9269771575927734, -0.8923859596252441, -0.8577947616577148, -0.8232035636901855, -0.7886123657226562, -0.754021167755127, -0.7194299697875977, -0.6848387718200684, -0.6502475738525391, -0.6156563758850098, -0.5810651779174805, -0.5464739799499512, -0.5118827819824219, -0.4772915840148926, -0.4427003860473633, -0.408109188079834, -0.3735179901123047, -0.3389267921447754, -0.3043355941772461, -0.2697443962097168, -0.2351531982421875, -0.2005620002746582, -0.1659708023071289, -0.1313796043395996, -0.09678840637207031, -0.062197208404541016, -0.02760601043701172, 0.006985187530517578, 0.041576385498046875, 0.07616758346557617, 0.11075878143310547, 0.14534986019134521, 0.1799410581588745, 0.2145322561264038, 0.2491234540939331, 0.2837146520614624, 0.3183058500289917, 0.352897047996521, 0.3874882459640503, 0.4220794439315796, 0.4566706418991089, 0.4912618398666382, 0.5258530378341675, 0.5604442358016968, 0.5950354337692261, 0.6296266317367554, 0.6642178297042847, 0.698809027671814, 0.7334002256393433, 0.7679914236068726, 0.8025826215744019, 0.8371738195419312, 0.8717650175094604, 0.9063562154769897, 0.940947413444519, 0.9755386114120483, 1.0101298093795776, 1.044721007347107, 1.0793122053146362, 1.1139034032821655, 1.1484946012496948, 1.1830857992172241, 1.2176769971847534, 1.2522681951522827]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 4.0, 5.0, 2.0, 8.0, 9.0, 15.0, 10.0, 19.0, 9.0, 11.0, 21.0, 23.0, 23.0, 24.0, 24.0, 35.0, 32.0, 41.0, 34.0, 42.0, 40.0, 43.0, 34.0, 39.0, 47.0, 46.0, 33.0, 43.0, 34.0, 27.0, 25.0, 23.0, 22.0, 21.0, 20.0, 23.0, 13.0, 9.0, 15.0, 8.0, 8.0, 5.0, 9.0, 4.0, 6.0, 8.0, 3.0, 0.0, 1.0, 3.0, 3.0, 0.0, 2.0], "bins": [-0.3852055072784424, -0.37379270792007446, -0.36237990856170654, -0.350967139005661, -0.3395543396472931, -0.32814154028892517, -0.31672874093055725, -0.3053159713745117, -0.2939031720161438, -0.2824903726577759, -0.27107757329940796, -0.2596648037433624, -0.2482520043849945, -0.2368392050266266, -0.22542640566825867, -0.21401362121105194, -0.20260082185268402, -0.1911880224943161, -0.17977523803710938, -0.16836243867874146, -0.15694965422153473, -0.1455368548631668, -0.13412407040596008, -0.12271127104759216, -0.11129847913980484, -0.09988568723201752, -0.0884728953242302, -0.07706010341644287, -0.06564730405807495, -0.05423451587557793, -0.042821720242500305, -0.03140892833471298, -0.01999613642692566, -0.008583343587815762, 0.002829449251294136, 0.014242243021726608, 0.02565503492951393, 0.037067826837301254, 0.048480622470378876, 0.0598934143781662, 0.07130620628595352, 0.08271899819374084, 0.09413179010152817, 0.10554458200931549, 0.11695738136768341, 0.12837016582489014, 0.13978296518325806, 0.15119576454162598, 0.1626085489988327, 0.17402134835720062, 0.18543413281440735, 0.19684693217277527, 0.208259716629982, 0.21967251598834991, 0.23108530044555664, 0.24249809980392456, 0.2539108991622925, 0.2653236985206604, 0.2767364978790283, 0.28814926743507385, 0.2995620667934418, 0.3109748661518097, 0.3223876655101776, 0.33380043506622314, 0.34521323442459106]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 7.0, 5.0, 20.0, 23.0, 21.0, 48.0, 62.0, 92.0, 168.0, 223.0, 390.0, 722.0, 1101.0, 2141.0, 4268.0, 9189.0, 22546.0, 73230.0, 644900.0, 3277758.0, 106134.0, 28944.0, 11243.0, 5045.0, 2602.0, 1341.0, 789.0, 464.0, 255.0, 189.0, 113.0, 72.0, 53.0, 33.0, 24.0, 16.0, 13.0, 6.0, 8.0, 7.0, 6.0, 4.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10296630859375, -0.09954833984375, -0.09613037109375, -0.09271240234375, -0.08929443359375, -0.08587646484375, -0.08245849609375, -0.07904052734375, -0.07562255859375, -0.07220458984375, -0.06878662109375, -0.06536865234375, -0.06195068359375, -0.05853271484375, -0.05511474609375, -0.05169677734375, -0.04827880859375, -0.04486083984375, -0.04144287109375, -0.03802490234375, -0.03460693359375, -0.03118896484375, -0.02777099609375, -0.02435302734375, -0.02093505859375, -0.01751708984375, -0.01409912109375, -0.01068115234375, -0.00726318359375, -0.00384521484375, -0.00042724609375, 0.00299072265625, 0.00640869140625, 0.00982666015625, 0.01324462890625, 0.01666259765625, 0.02008056640625, 0.02349853515625, 0.02691650390625, 0.03033447265625, 0.03375244140625, 0.03717041015625, 0.04058837890625, 0.04400634765625, 0.04742431640625, 0.05084228515625, 0.05426025390625, 0.05767822265625, 0.06109619140625, 0.06451416015625, 0.06793212890625, 0.07135009765625, 0.07476806640625, 0.07818603515625, 0.08160400390625, 0.08502197265625, 0.08843994140625, 0.09185791015625, 0.09527587890625, 0.09869384765625, 0.10211181640625, 0.10552978515625, 0.10894775390625, 0.11236572265625, 0.11578369140625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 6.0, 3.0, 10.0, 8.0, 9.0, 16.0, 14.0, 26.0, 16.0, 33.0, 28.0, 35.0, 50.0, 44.0, 56.0, 49.0, 56.0, 62.0, 53.0, 61.0, 39.0, 53.0, 49.0, 35.0, 31.0, 32.0, 29.0, 14.0, 15.0, 18.0, 4.0, 10.0, 8.0, 10.0, 8.0, 2.0, 4.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0175933837890625, -0.016881942749023438, -0.016170501708984375, -0.015459060668945312, -0.01474761962890625, -0.014036178588867188, -0.013324737548828125, -0.012613296508789062, -0.01190185546875, -0.011190414428710938, -0.010478973388671875, -0.009767532348632812, -0.00905609130859375, -0.008344650268554688, -0.007633209228515625, -0.0069217681884765625, -0.0062103271484375, -0.0054988861083984375, -0.004787445068359375, -0.0040760040283203125, -0.00336456298828125, -0.0026531219482421875, -0.001941680908203125, -0.0012302398681640625, -0.000518798828125, 0.0001926422119140625, 0.000904083251953125, 0.0016155242919921875, 0.00232696533203125, 0.0030384063720703125, 0.003749847412109375, 0.0044612884521484375, 0.0051727294921875, 0.0058841705322265625, 0.006595611572265625, 0.0073070526123046875, 0.00801849365234375, 0.008729934692382812, 0.009441375732421875, 0.010152816772460938, 0.0108642578125, 0.011575698852539062, 0.012287139892578125, 0.012998580932617188, 0.01371002197265625, 0.014421463012695312, 0.015132904052734375, 0.015844345092773438, 0.0165557861328125, 0.017267227172851562, 0.017978668212890625, 0.018690109252929688, 0.01940155029296875, 0.020112991333007812, 0.020824432373046875, 0.021535873413085938, 0.022247314453125, 0.022958755493164062, 0.023670196533203125, 0.024381637573242188, 0.02509307861328125, 0.025804519653320312, 0.026515960693359375, 0.027227401733398438, 0.0279388427734375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 7.0, 2.0, 6.0, 6.0, 12.0, 14.0, 25.0, 25.0, 31.0, 55.0, 75.0, 106.0, 162.0, 226.0, 359.0, 638.0, 1054.0, 1990.0, 3982.0, 8114.0, 18702.0, 52059.0, 209444.0, 3370290.0, 405085.0, 75245.0, 25433.0, 10554.0, 4977.0, 2340.0, 1346.0, 731.0, 445.0, 253.0, 154.0, 104.0, 67.0, 48.0, 35.0, 27.0, 17.0, 8.0, 8.0, 8.0, 9.0, 4.0, 1.0, 4.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10577392578125, -0.10232353210449219, -0.09887313842773438, -0.09542274475097656, -0.09197235107421875, -0.08852195739746094, -0.08507156372070312, -0.08162117004394531, -0.0781707763671875, -0.07472038269042969, -0.07126998901367188, -0.06781959533691406, -0.06436920166015625, -0.06091880798339844, -0.057468414306640625, -0.05401802062988281, -0.050567626953125, -0.04711723327636719, -0.043666839599609375, -0.04021644592285156, -0.03676605224609375, -0.03331565856933594, -0.029865264892578125, -0.026414871215820312, -0.0229644775390625, -0.019514083862304688, -0.016063690185546875, -0.012613296508789062, -0.00916290283203125, -0.0057125091552734375, -0.002262115478515625, 0.0011882781982421875, 0.004638671875, 0.008089065551757812, 0.011539459228515625, 0.014989852905273438, 0.01844024658203125, 0.021890640258789062, 0.025341033935546875, 0.028791427612304688, 0.0322418212890625, 0.03569221496582031, 0.039142608642578125, 0.04259300231933594, 0.04604339599609375, 0.04949378967285156, 0.052944183349609375, 0.05639457702636719, 0.059844970703125, 0.06329536437988281, 0.06674575805664062, 0.07019615173339844, 0.07364654541015625, 0.07709693908691406, 0.08054733276367188, 0.08399772644042969, 0.0874481201171875, 0.09089851379394531, 0.09434890747070312, 0.09779930114746094, 0.10124969482421875, 0.10470008850097656, 0.10815048217773438, 0.11160087585449219, 0.11505126953125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 1.0, 4.0, 6.0, 10.0, 16.0, 19.0, 41.0, 38.0, 65.0, 83.0, 134.0, 301.0, 1821.0, 895.0, 245.0, 126.0, 71.0, 50.0, 50.0, 24.0, 18.0, 8.0, 10.0, 12.0, 7.0, 2.0, 6.0, 3.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049835205078125, -0.04822063446044922, -0.04660606384277344, -0.044991493225097656, -0.043376922607421875, -0.041762351989746094, -0.04014778137207031, -0.03853321075439453, -0.03691864013671875, -0.03530406951904297, -0.03368949890136719, -0.032074928283691406, -0.030460357666015625, -0.028845787048339844, -0.027231216430664062, -0.02561664581298828, -0.0240020751953125, -0.02238750457763672, -0.020772933959960938, -0.019158363342285156, -0.017543792724609375, -0.015929222106933594, -0.014314651489257812, -0.012700080871582031, -0.01108551025390625, -0.009470939636230469, -0.007856369018554688, -0.006241798400878906, -0.004627227783203125, -0.0030126571655273438, -0.0013980865478515625, 0.00021648406982421875, 0.0018310546875, 0.0034456253051757812, 0.0050601959228515625, 0.006674766540527344, 0.008289337158203125, 0.009903907775878906, 0.011518478393554688, 0.013133049011230469, 0.01474761962890625, 0.01636219024658203, 0.017976760864257812, 0.019591331481933594, 0.021205902099609375, 0.022820472717285156, 0.024435043334960938, 0.02604961395263672, 0.0276641845703125, 0.02927875518798828, 0.030893325805664062, 0.032507896423339844, 0.034122467041015625, 0.035737037658691406, 0.03735160827636719, 0.03896617889404297, 0.04058074951171875, 0.04219532012939453, 0.04380989074707031, 0.045424461364746094, 0.047039031982421875, 0.048653602600097656, 0.05026817321777344, 0.05188274383544922, 0.053497314453125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 7.0, 5.0, 7.0, 15.0, 20.0, 53.0, 63.0, 100.0, 124.0, 144.0, 125.0, 113.0, 96.0, 51.0, 36.0, 19.0, 9.0, 14.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34678295254707336, -0.33577069640159607, -0.3247584104537964, -0.3137461543083191, -0.3027338981628418, -0.2917216420173645, -0.2807093858718872, -0.2696970999240875, -0.25868484377861023, -0.24767258763313293, -0.23666031658649445, -0.22564804553985596, -0.21463578939437866, -0.20362353324890137, -0.19261126220226288, -0.1815989911556244, -0.1705867350101471, -0.1595744788646698, -0.1485622078180313, -0.13754993677139282, -0.12653768062591553, -0.11552541702985764, -0.10451315343379974, -0.09350088983774185, -0.08248862624168396, -0.07147636264562607, -0.060464099049568176, -0.049451835453510284, -0.03843957185745239, -0.0274273082613945, -0.01641504466533661, -0.005402781069278717, 0.0056095123291015625, 0.016621775925159454, 0.027634039521217346, 0.03864630311727524, 0.04965856671333313, 0.06067083030939102, 0.07168309390544891, 0.0826953575015068, 0.0937076210975647, 0.10471988469362259, 0.11573214828968048, 0.12674441933631897, 0.13775667548179626, 0.14876893162727356, 0.15978120267391205, 0.17079347372055054, 0.18180572986602783, 0.19281798601150513, 0.20383025705814362, 0.2148425281047821, 0.2258547842502594, 0.2368670403957367, 0.24787931144237518, 0.25889158248901367, 0.26990383863449097, 0.28091609477996826, 0.29192835092544556, 0.30294063687324524, 0.31395289301872253, 0.32496514916419983, 0.3359774351119995, 0.3469896912574768, 0.3580019474029541]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 8.0, 5.0, 11.0, 8.0, 12.0, 12.0, 15.0, 13.0, 27.0, 24.0, 22.0, 22.0, 28.0, 17.0, 40.0, 29.0, 35.0, 31.0, 50.0, 41.0, 46.0, 37.0, 49.0, 33.0, 36.0, 46.0, 35.0, 27.0, 26.0, 25.0, 26.0, 28.0, 24.0, 14.0, 14.0, 13.0, 6.0, 9.0, 11.0, 5.0, 8.0, 6.0, 7.0, 7.0, 7.0, 1.0, 4.0, 0.0, 2.0], "bins": [-0.155536949634552, -0.15125305950641632, -0.14696915447711945, -0.14268526434898376, -0.1384013593196869, -0.1341174691915512, -0.12983357906341553, -0.12554967403411865, -0.12126578390598297, -0.1169818863272667, -0.11269798874855042, -0.10841409862041473, -0.10413020104169846, -0.09984630346298218, -0.0955624133348465, -0.09127851575613022, -0.08699461817741394, -0.08271072059869766, -0.07842682301998138, -0.0741429328918457, -0.06985903531312943, -0.06557513773441315, -0.06129124388098717, -0.05700735002756119, -0.05272345244884491, -0.04843955487012863, -0.04415566101670265, -0.03987176716327667, -0.035587869584560394, -0.031303972005844116, -0.027020078152418137, -0.022736182436347008, -0.01845228672027588, -0.01416839100420475, -0.009884495288133621, -0.005600599572062492, -0.0013167038559913635, 0.0029671918600797653, 0.007251087576150894, 0.011534983292222023, 0.015818879008293152, 0.02010277472436428, 0.02438667044043541, 0.02867056615650654, 0.03295446187257767, 0.037238359451293945, 0.041522253304719925, 0.045806147158145905, 0.05009004473686218, 0.05437394231557846, 0.05865783616900444, 0.06294173002243042, 0.0672256276011467, 0.07150952517986298, 0.07579341530799866, 0.08007731288671494, 0.08436121046543121, 0.08864510804414749, 0.09292900562286377, 0.09721289575099945, 0.10149679332971573, 0.105780690908432, 0.11006458103656769, 0.11434847861528397, 0.11863237619400024]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 2.0, 7.0, 5.0, 17.0, 15.0, 17.0, 29.0, 58.0, 60.0, 114.0, 142.0, 247.0, 367.0, 634.0, 1094.0, 1857.0, 3454.0, 6297.0, 11836.0, 22768.0, 43621.0, 85845.0, 183577.0, 322907.0, 184358.0, 86831.0, 43383.0, 22349.0, 11887.0, 6429.0, 3556.0, 1921.0, 1166.0, 635.0, 375.0, 266.0, 131.0, 90.0, 62.0, 46.0, 26.0, 22.0, 20.0, 14.0, 5.0, 3.0, 6.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.065673828125, -0.06371355056762695, -0.061753273010253906, -0.05979299545288086, -0.05783271789550781, -0.055872440338134766, -0.05391216278076172, -0.05195188522338867, -0.049991607666015625, -0.04803133010864258, -0.04607105255126953, -0.044110774993896484, -0.04215049743652344, -0.04019021987915039, -0.038229942321777344, -0.0362696647644043, -0.03430938720703125, -0.0323491096496582, -0.030388832092285156, -0.02842855453491211, -0.026468276977539062, -0.024507999420166016, -0.02254772186279297, -0.020587444305419922, -0.018627166748046875, -0.016666889190673828, -0.014706611633300781, -0.012746334075927734, -0.010786056518554688, -0.00882577896118164, -0.006865501403808594, -0.004905223846435547, -0.0029449462890625, -0.0009846687316894531, 0.0009756088256835938, 0.0029358863830566406, 0.0048961639404296875, 0.006856441497802734, 0.008816719055175781, 0.010776996612548828, 0.012737274169921875, 0.014697551727294922, 0.01665782928466797, 0.018618106842041016, 0.020578384399414062, 0.02253866195678711, 0.024498939514160156, 0.026459217071533203, 0.02841949462890625, 0.030379772186279297, 0.032340049743652344, 0.03430032730102539, 0.03626060485839844, 0.038220882415771484, 0.04018115997314453, 0.04214143753051758, 0.044101715087890625, 0.04606199264526367, 0.04802227020263672, 0.049982547760009766, 0.05194282531738281, 0.05390310287475586, 0.055863380432128906, 0.05782365798950195, 0.059783935546875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 8.0, 6.0, 9.0, 7.0, 13.0, 9.0, 8.0, 16.0, 23.0, 21.0, 25.0, 16.0, 30.0, 28.0, 30.0, 42.0, 52.0, 48.0, 47.0, 36.0, 49.0, 42.0, 33.0, 41.0, 28.0, 45.0, 31.0, 33.0, 34.0, 21.0, 18.0, 24.0, 24.0, 19.0, 9.0, 11.0, 12.0, 10.0, 12.0, 6.0, 2.0, 3.0, 4.0, 3.0, 3.0, 3.0, 3.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.01678466796875, -0.016205310821533203, -0.015625953674316406, -0.01504659652709961, -0.014467239379882812, -0.013887882232666016, -0.013308525085449219, -0.012729167938232422, -0.012149810791015625, -0.011570453643798828, -0.010991096496582031, -0.010411739349365234, -0.009832382202148438, -0.00925302505493164, -0.008673667907714844, -0.008094310760498047, -0.00751495361328125, -0.006935596466064453, -0.006356239318847656, -0.005776882171630859, -0.0051975250244140625, -0.004618167877197266, -0.004038810729980469, -0.003459453582763672, -0.002880096435546875, -0.002300739288330078, -0.0017213821411132812, -0.0011420249938964844, -0.0005626678466796875, 1.6689300537109375e-05, 0.0005960464477539062, 0.0011754035949707031, 0.0017547607421875, 0.002334117889404297, 0.0029134750366210938, 0.0034928321838378906, 0.0040721893310546875, 0.004651546478271484, 0.005230903625488281, 0.005810260772705078, 0.006389617919921875, 0.006968975067138672, 0.007548332214355469, 0.008127689361572266, 0.008707046508789062, 0.00928640365600586, 0.009865760803222656, 0.010445117950439453, 0.01102447509765625, 0.011603832244873047, 0.012183189392089844, 0.01276254653930664, 0.013341903686523438, 0.013921260833740234, 0.014500617980957031, 0.015079975128173828, 0.015659332275390625, 0.016238689422607422, 0.01681804656982422, 0.017397403717041016, 0.017976760864257812, 0.01855611801147461, 0.019135475158691406, 0.019714832305908203, 0.020294189453125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 8.0, 9.0, 7.0, 14.0, 21.0, 18.0, 41.0, 62.0, 69.0, 94.0, 131.0, 160.0, 267.0, 379.0, 582.0, 1014.0, 1747.0, 3596.0, 8250.0, 20084.0, 52175.0, 142129.0, 438034.0, 244519.0, 80789.0, 30855.0, 12358.0, 5111.0, 2496.0, 1252.0, 741.0, 469.0, 285.0, 201.0, 161.0, 97.0, 95.0, 66.0, 49.0, 36.0, 16.0, 25.0, 11.0, 9.0, 6.0, 10.0, 0.0, 1.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.06939697265625, -0.06698131561279297, -0.06456565856933594, -0.062150001525878906, -0.059734344482421875, -0.057318687438964844, -0.05490303039550781, -0.05248737335205078, -0.05007171630859375, -0.04765605926513672, -0.04524040222167969, -0.042824745178222656, -0.040409088134765625, -0.037993431091308594, -0.03557777404785156, -0.03316211700439453, -0.0307464599609375, -0.02833080291748047, -0.025915145874023438, -0.023499488830566406, -0.021083831787109375, -0.018668174743652344, -0.016252517700195312, -0.013836860656738281, -0.01142120361328125, -0.009005546569824219, -0.0065898895263671875, -0.004174232482910156, -0.001758575439453125, 0.0006570816040039062, 0.0030727386474609375, 0.005488395690917969, 0.007904052734375, 0.010319709777832031, 0.012735366821289062, 0.015151023864746094, 0.017566680908203125, 0.019982337951660156, 0.022397994995117188, 0.02481365203857422, 0.02722930908203125, 0.02964496612548828, 0.03206062316894531, 0.034476280212402344, 0.036891937255859375, 0.039307594299316406, 0.04172325134277344, 0.04413890838623047, 0.0465545654296875, 0.04897022247314453, 0.05138587951660156, 0.053801536560058594, 0.056217193603515625, 0.058632850646972656, 0.06104850769042969, 0.06346416473388672, 0.06587982177734375, 0.06829547882080078, 0.07071113586425781, 0.07312679290771484, 0.07554244995117188, 0.0779581069946289, 0.08037376403808594, 0.08278942108154297, 0.085205078125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 3.0, 6.0, 6.0, 11.0, 12.0, 10.0, 8.0, 18.0, 18.0, 33.0, 39.0, 31.0, 46.0, 25.0, 44.0, 44.0, 37.0, 46.0, 44.0, 46.0, 38.0, 48.0, 54.0, 21.0, 46.0, 47.0, 39.0, 29.0, 20.0, 27.0, 17.0, 10.0, 13.0, 13.0, 14.0, 9.0, 4.0, 5.0, 7.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1044921875, -0.10136032104492188, -0.09822845458984375, -0.09509658813476562, -0.0919647216796875, -0.08883285522460938, -0.08570098876953125, -0.08256912231445312, -0.079437255859375, -0.07630538940429688, -0.07317352294921875, -0.07004165649414062, -0.0669097900390625, -0.06377792358398438, -0.06064605712890625, -0.057514190673828125, -0.05438232421875, -0.051250457763671875, -0.04811859130859375, -0.044986724853515625, -0.0418548583984375, -0.038722991943359375, -0.03559112548828125, -0.032459259033203125, -0.029327392578125, -0.026195526123046875, -0.02306365966796875, -0.019931793212890625, -0.0167999267578125, -0.013668060302734375, -0.01053619384765625, -0.007404327392578125, -0.0042724609375, -0.001140594482421875, 0.00199127197265625, 0.005123138427734375, 0.0082550048828125, 0.011386871337890625, 0.01451873779296875, 0.017650604248046875, 0.020782470703125, 0.023914337158203125, 0.02704620361328125, 0.030178070068359375, 0.0333099365234375, 0.036441802978515625, 0.03957366943359375, 0.042705535888671875, 0.04583740234375, 0.048969268798828125, 0.05210113525390625, 0.055233001708984375, 0.0583648681640625, 0.061496734619140625, 0.06462860107421875, 0.06776046752929688, 0.070892333984375, 0.07402420043945312, 0.07715606689453125, 0.08028793334960938, 0.0834197998046875, 0.08655166625976562, 0.08968353271484375, 0.09281539916992188, 0.095947265625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 5.0, 3.0, 6.0, 12.0, 13.0, 23.0, 33.0, 57.0, 109.0, 238.0, 507.0, 1266.0, 3743.0, 13626.0, 68414.0, 421708.0, 446997.0, 71331.0, 14383.0, 3790.0, 1331.0, 487.0, 220.0, 104.0, 69.0, 39.0, 20.0, 7.0, 9.0, 6.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07391357421875, -0.07160472869873047, -0.06929588317871094, -0.0669870376586914, -0.06467819213867188, -0.062369346618652344, -0.06006050109863281, -0.05775165557861328, -0.05544281005859375, -0.05313396453857422, -0.05082511901855469, -0.048516273498535156, -0.046207427978515625, -0.043898582458496094, -0.04158973693847656, -0.03928089141845703, -0.0369720458984375, -0.03466320037841797, -0.03235435485839844, -0.030045509338378906, -0.027736663818359375, -0.025427818298339844, -0.023118972778320312, -0.02081012725830078, -0.01850128173828125, -0.01619243621826172, -0.013883590698242188, -0.011574745178222656, -0.009265899658203125, -0.006957054138183594, -0.0046482086181640625, -0.0023393630981445312, -3.0517578125e-05, 0.0022783279418945312, 0.0045871734619140625, 0.006896018981933594, 0.009204864501953125, 0.011513710021972656, 0.013822555541992188, 0.01613140106201172, 0.01844024658203125, 0.02074909210205078, 0.023057937622070312, 0.025366783142089844, 0.027675628662109375, 0.029984474182128906, 0.03229331970214844, 0.03460216522216797, 0.0369110107421875, 0.03921985626220703, 0.04152870178222656, 0.043837547302246094, 0.046146392822265625, 0.048455238342285156, 0.05076408386230469, 0.05307292938232422, 0.05538177490234375, 0.05769062042236328, 0.05999946594238281, 0.062308311462402344, 0.06461715698242188, 0.0669260025024414, 0.06923484802246094, 0.07154369354248047, 0.0738525390625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 9.0, 11.0, 14.0, 20.0, 14.0, 21.0, 30.0, 37.0, 56.0, 68.0, 98.0, 91.0, 87.0, 94.0, 69.0, 61.0, 66.0, 36.0, 24.0, 22.0, 16.0, 14.0, 8.0, 9.0, 6.0, 9.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.170967102050781e-05, -3.06982547044754e-05, -2.9686838388442993e-05, -2.8675422072410583e-05, -2.7664005756378174e-05, -2.6652589440345764e-05, -2.5641173124313354e-05, -2.4629756808280945e-05, -2.3618340492248535e-05, -2.2606924176216125e-05, -2.1595507860183716e-05, -2.0584091544151306e-05, -1.9572675228118896e-05, -1.8561258912086487e-05, -1.7549842596054077e-05, -1.6538426280021667e-05, -1.5527009963989258e-05, -1.4515593647956848e-05, -1.3504177331924438e-05, -1.2492761015892029e-05, -1.1481344699859619e-05, -1.046992838382721e-05, -9.4585120677948e-06, -8.44709575176239e-06, -7.4356794357299805e-06, -6.424263119697571e-06, -5.412846803665161e-06, -4.4014304876327515e-06, -3.390014171600342e-06, -2.378597855567932e-06, -1.3671815395355225e-06, -3.557652235031128e-07, 6.556510925292969e-07, 1.6670674085617065e-06, 2.678483724594116e-06, 3.689900040626526e-06, 4.7013163566589355e-06, 5.712732672691345e-06, 6.724148988723755e-06, 7.735565304756165e-06, 8.746981620788574e-06, 9.758397936820984e-06, 1.0769814252853394e-05, 1.1781230568885803e-05, 1.2792646884918213e-05, 1.3804063200950623e-05, 1.4815479516983032e-05, 1.5826895833015442e-05, 1.683831214904785e-05, 1.784972846508026e-05, 1.886114478111267e-05, 1.987256109714508e-05, 2.088397741317749e-05, 2.18953937292099e-05, 2.290681004524231e-05, 2.391822636127472e-05, 2.492964267730713e-05, 2.594105899333954e-05, 2.6952475309371948e-05, 2.7963891625404358e-05, 2.8975307941436768e-05, 2.9986724257469177e-05, 3.099814057350159e-05, 3.2009556889533997e-05, 3.3020973205566406e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 6.0, 6.0, 9.0, 20.0, 42.0, 88.0, 210.0, 497.0, 1423.0, 5322.0, 36800.0, 470600.0, 487388.0, 38337.0, 5493.0, 1454.0, 502.0, 193.0, 74.0, 36.0, 21.0, 15.0, 9.0, 7.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12078857421875, -0.11733818054199219, -0.11388778686523438, -0.11043739318847656, -0.10698699951171875, -0.10353660583496094, -0.10008621215820312, -0.09663581848144531, -0.0931854248046875, -0.08973503112792969, -0.08628463745117188, -0.08283424377441406, -0.07938385009765625, -0.07593345642089844, -0.07248306274414062, -0.06903266906738281, -0.065582275390625, -0.06213188171386719, -0.058681488037109375, -0.05523109436035156, -0.05178070068359375, -0.04833030700683594, -0.044879913330078125, -0.04142951965332031, -0.0379791259765625, -0.03452873229980469, -0.031078338623046875, -0.027627944946289062, -0.02417755126953125, -0.020727157592773438, -0.017276763916015625, -0.013826370239257812, -0.0103759765625, -0.0069255828857421875, -0.003475189208984375, -2.47955322265625e-05, 0.00342559814453125, 0.0068759918212890625, 0.010326385498046875, 0.013776779174804688, 0.0172271728515625, 0.020677566528320312, 0.024127960205078125, 0.027578353881835938, 0.03102874755859375, 0.03447914123535156, 0.037929534912109375, 0.04137992858886719, 0.044830322265625, 0.04828071594238281, 0.051731109619140625, 0.05518150329589844, 0.05863189697265625, 0.06208229064941406, 0.06553268432617188, 0.06898307800292969, 0.0724334716796875, 0.07588386535644531, 0.07933425903320312, 0.08278465270996094, 0.08623504638671875, 0.08968544006347656, 0.09313583374023438, 0.09658622741699219, 0.10003662109375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 4.0, 5.0, 11.0, 8.0, 15.0, 17.0, 29.0, 30.0, 45.0, 48.0, 67.0, 98.0, 119.0, 132.0, 100.0, 55.0, 46.0, 43.0, 39.0, 22.0, 13.0, 13.0, 15.0, 13.0, 7.0, 3.0, 7.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.07861328125, -0.07664871215820312, -0.07468414306640625, -0.07271957397460938, -0.0707550048828125, -0.06879043579101562, -0.06682586669921875, -0.06486129760742188, -0.062896728515625, -0.060932159423828125, -0.05896759033203125, -0.057003021240234375, -0.0550384521484375, -0.053073883056640625, -0.05110931396484375, -0.049144744873046875, -0.04718017578125, -0.045215606689453125, -0.04325103759765625, -0.041286468505859375, -0.0393218994140625, -0.037357330322265625, -0.03539276123046875, -0.033428192138671875, -0.031463623046875, -0.029499053955078125, -0.02753448486328125, -0.025569915771484375, -0.0236053466796875, -0.021640777587890625, -0.01967620849609375, -0.017711639404296875, -0.0157470703125, -0.013782501220703125, -0.01181793212890625, -0.009853363037109375, -0.0078887939453125, -0.005924224853515625, -0.00395965576171875, -0.001995086669921875, -3.0517578125e-05, 0.001934051513671875, 0.00389862060546875, 0.005863189697265625, 0.0078277587890625, 0.009792327880859375, 0.01175689697265625, 0.013721466064453125, 0.01568603515625, 0.017650604248046875, 0.01961517333984375, 0.021579742431640625, 0.0235443115234375, 0.025508880615234375, 0.02747344970703125, 0.029438018798828125, 0.031402587890625, 0.033367156982421875, 0.03533172607421875, 0.037296295166015625, 0.0392608642578125, 0.041225433349609375, 0.04319000244140625, 0.045154571533203125, 0.047119140625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 16.0, 55.0, 169.0, 296.0, 288.0, 130.0, 39.0, 11.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9571785926818848, -2.8942370414733887, -2.8312954902648926, -2.7683537006378174, -2.7054121494293213, -2.642470598220825, -2.57952880859375, -2.516587257385254, -2.453645706176758, -2.3907041549682617, -2.3277626037597656, -2.2648208141326904, -2.2018792629241943, -2.1389377117156982, -2.075995922088623, -2.013054370880127, -1.9501128196716309, -1.8871712684631348, -1.8242295980453491, -1.7612879276275635, -1.6983463764190674, -1.6354048252105713, -1.5724631547927856, -1.509521484375, -1.446579933166504, -1.3836383819580078, -1.3206967115402222, -1.2577550411224365, -1.1948134899139404, -1.1318719387054443, -1.0689302682876587, -1.005988597869873, -0.9430468082427979, -0.880105197429657, -0.8171635866165161, -0.7542219758033752, -0.6912803649902344, -0.6283387541770935, -0.5653971433639526, -0.5024555325508118, -0.4395139217376709, -0.37657231092453003, -0.31363070011138916, -0.2506890892982483, -0.18774747848510742, -0.12480586767196655, -0.061864256858825684, 0.0010773539543151855, 0.06401896476745605, 0.12696057558059692, 0.1899021863937378, 0.25284379720687866, 0.31578540802001953, 0.3787270188331604, 0.44166862964630127, 0.5046102404594421, 0.567551851272583, 0.6304934620857239, 0.6934350728988647, 0.7563766837120056, 0.8193182945251465, 0.8822599053382874, 0.9452015161514282, 1.0081431865692139, 1.07108473777771]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 6.0, 9.0, 5.0, 14.0, 16.0, 14.0, 20.0, 19.0, 22.0, 31.0, 34.0, 38.0, 37.0, 23.0, 47.0, 40.0, 62.0, 64.0, 55.0, 30.0, 53.0, 41.0, 29.0, 38.0, 39.0, 28.0, 27.0, 24.0, 20.0, 13.0, 16.0, 13.0, 11.0, 12.0, 10.0, 6.0, 8.0, 4.0, 4.0, 6.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.5803826451301575, -0.5642767548561096, -0.548170804977417, -0.5320649147033691, -0.5159590244293213, -0.49985307455062866, -0.4837471842765808, -0.46764126420021057, -0.45153534412384033, -0.4354294240474701, -0.41932350397109985, -0.403217613697052, -0.38711169362068176, -0.3710057735443115, -0.35489988327026367, -0.33879396319389343, -0.3226880431175232, -0.30658212304115295, -0.2904762029647827, -0.27437031269073486, -0.2582643926143646, -0.24215847253799438, -0.22605256736278534, -0.2099466621875763, -0.19384074211120605, -0.17773482203483582, -0.16162891685962677, -0.14552301168441772, -0.12941709160804749, -0.11331117898225784, -0.0972052663564682, -0.08109935373067856, -0.06499338150024414, -0.0488874688744545, -0.032781556248664856, -0.016675643622875214, -0.0005697309970855713, 0.015536181628704071, 0.03164209425449371, 0.047748006880283356, 0.063853919506073, 0.07995983213186264, 0.09606574475765228, 0.11217165738344193, 0.12827757000923157, 0.1443834900856018, 0.16048939526081085, 0.1765953004360199, 0.19270122051239014, 0.20880714058876038, 0.22491304576396942, 0.24101895093917847, 0.2571248710155487, 0.27323079109191895, 0.2893366813659668, 0.30544260144233704, 0.3215485215187073, 0.3376544415950775, 0.35376036167144775, 0.3698662519454956, 0.38597217202186584, 0.4020780920982361, 0.41818398237228394, 0.4342899024486542, 0.4503958225250244]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 4.0, 6.0, 9.0, 13.0, 11.0, 18.0, 37.0, 54.0, 83.0, 122.0, 183.0, 295.0, 513.0, 961.0, 1773.0, 3700.0, 7951.0, 20058.0, 66287.0, 559884.0, 3360481.0, 120431.0, 29728.0, 11248.0, 5066.0, 2376.0, 1243.0, 664.0, 394.0, 228.0, 159.0, 78.0, 68.0, 54.0, 31.0, 15.0, 15.0, 10.0, 7.0, 7.0, 4.0, 4.0, 5.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.1329345703125, -0.12904644012451172, -0.12515830993652344, -0.12127017974853516, -0.11738204956054688, -0.1134939193725586, -0.10960578918457031, -0.10571765899658203, -0.10182952880859375, -0.09794139862060547, -0.09405326843261719, -0.0901651382446289, -0.08627700805664062, -0.08238887786865234, -0.07850074768066406, -0.07461261749267578, -0.0707244873046875, -0.06683635711669922, -0.06294822692871094, -0.059060096740722656, -0.055171966552734375, -0.051283836364746094, -0.04739570617675781, -0.04350757598876953, -0.03961944580078125, -0.03573131561279297, -0.03184318542480469, -0.027955055236816406, -0.024066925048828125, -0.020178794860839844, -0.016290664672851562, -0.012402534484863281, -0.008514404296875, -0.004626274108886719, -0.0007381439208984375, 0.0031499862670898438, 0.007038116455078125, 0.010926246643066406, 0.014814376831054688, 0.01870250701904297, 0.02259063720703125, 0.02647876739501953, 0.030366897583007812, 0.034255027770996094, 0.038143157958984375, 0.042031288146972656, 0.04591941833496094, 0.04980754852294922, 0.0536956787109375, 0.05758380889892578, 0.06147193908691406, 0.06536006927490234, 0.06924819946289062, 0.0731363296508789, 0.07702445983886719, 0.08091259002685547, 0.08480072021484375, 0.08868885040283203, 0.09257698059082031, 0.0964651107788086, 0.10035324096679688, 0.10424137115478516, 0.10812950134277344, 0.11201763153076172, 0.11590576171875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 6.0, 3.0, 1.0, 12.0, 7.0, 6.0, 14.0, 19.0, 19.0, 14.0, 19.0, 24.0, 26.0, 30.0, 29.0, 47.0, 40.0, 46.0, 46.0, 39.0, 46.0, 51.0, 46.0, 46.0, 49.0, 39.0, 36.0, 33.0, 28.0, 23.0, 19.0, 18.0, 22.0, 16.0, 15.0, 18.0, 10.0, 5.0, 11.0, 6.0, 6.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0202484130859375, -0.019598960876464844, -0.018949508666992188, -0.01830005645751953, -0.017650604248046875, -0.01700115203857422, -0.016351699829101562, -0.015702247619628906, -0.01505279541015625, -0.014403343200683594, -0.013753890991210938, -0.013104438781738281, -0.012454986572265625, -0.011805534362792969, -0.011156082153320312, -0.010506629943847656, -0.009857177734375, -0.009207725524902344, -0.008558273315429688, -0.007908821105957031, -0.007259368896484375, -0.006609916687011719, -0.0059604644775390625, -0.005311012268066406, -0.00466156005859375, -0.004012107849121094, -0.0033626556396484375, -0.0027132034301757812, -0.002063751220703125, -0.0014142990112304688, -0.0007648468017578125, -0.00011539459228515625, 0.0005340576171875, 0.0011835098266601562, 0.0018329620361328125, 0.0024824142456054688, 0.003131866455078125, 0.0037813186645507812, 0.0044307708740234375, 0.005080223083496094, 0.00572967529296875, 0.006379127502441406, 0.0070285797119140625, 0.007678031921386719, 0.008327484130859375, 0.008976936340332031, 0.009626388549804688, 0.010275840759277344, 0.01092529296875, 0.011574745178222656, 0.012224197387695312, 0.012873649597167969, 0.013523101806640625, 0.014172554016113281, 0.014822006225585938, 0.015471458435058594, 0.01612091064453125, 0.016770362854003906, 0.017419815063476562, 0.01806926727294922, 0.018718719482421875, 0.01936817169189453, 0.020017623901367188, 0.020667076110839844, 0.0213165283203125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 5.0, 4.0, 8.0, 8.0, 13.0, 11.0, 22.0, 30.0, 55.0, 84.0, 109.0, 167.0, 237.0, 383.0, 598.0, 929.0, 1514.0, 2777.0, 4890.0, 9556.0, 19342.0, 44536.0, 128447.0, 735094.0, 2885973.0, 235744.0, 68278.0, 27427.0, 12777.0, 6426.0, 3490.0, 2047.0, 1243.0, 689.0, 471.0, 296.0, 193.0, 139.0, 85.0, 70.0, 32.0, 29.0, 15.0, 15.0, 14.0, 4.0, 8.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.09649658203125, -0.09367656707763672, -0.09085655212402344, -0.08803653717041016, -0.08521652221679688, -0.0823965072631836, -0.07957649230957031, -0.07675647735595703, -0.07393646240234375, -0.07111644744873047, -0.06829643249511719, -0.0654764175415039, -0.06265640258789062, -0.059836387634277344, -0.05701637268066406, -0.05419635772705078, -0.0513763427734375, -0.04855632781982422, -0.04573631286621094, -0.042916297912597656, -0.040096282958984375, -0.037276268005371094, -0.03445625305175781, -0.03163623809814453, -0.02881622314453125, -0.02599620819091797, -0.023176193237304688, -0.020356178283691406, -0.017536163330078125, -0.014716148376464844, -0.011896133422851562, -0.009076118469238281, -0.006256103515625, -0.0034360885620117188, -0.0006160736083984375, 0.0022039413452148438, 0.005023956298828125, 0.007843971252441406, 0.010663986206054688, 0.013484001159667969, 0.01630401611328125, 0.01912403106689453, 0.021944046020507812, 0.024764060974121094, 0.027584075927734375, 0.030404090881347656, 0.03322410583496094, 0.03604412078857422, 0.0388641357421875, 0.04168415069580078, 0.04450416564941406, 0.047324180603027344, 0.050144195556640625, 0.052964210510253906, 0.05578422546386719, 0.05860424041748047, 0.06142425537109375, 0.06424427032470703, 0.06706428527832031, 0.0698843002319336, 0.07270431518554688, 0.07552433013916016, 0.07834434509277344, 0.08116436004638672, 0.083984375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 3.0, 10.0, 4.0, 11.0, 11.0, 16.0, 20.0, 25.0, 31.0, 44.0, 60.0, 100.0, 170.0, 296.0, 835.0, 1449.0, 369.0, 187.0, 121.0, 94.0, 53.0, 37.0, 30.0, 21.0, 12.0, 18.0, 7.0, 8.0, 6.0, 1.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.052764892578125, -0.05112457275390625, -0.0494842529296875, -0.04784393310546875, -0.04620361328125, -0.04456329345703125, -0.0429229736328125, -0.04128265380859375, -0.039642333984375, -0.03800201416015625, -0.0363616943359375, -0.03472137451171875, -0.0330810546875, -0.03144073486328125, -0.0298004150390625, -0.02816009521484375, -0.026519775390625, -0.02487945556640625, -0.0232391357421875, -0.02159881591796875, -0.01995849609375, -0.01831817626953125, -0.0166778564453125, -0.01503753662109375, -0.013397216796875, -0.01175689697265625, -0.0101165771484375, -0.00847625732421875, -0.0068359375, -0.00519561767578125, -0.0035552978515625, -0.00191497802734375, -0.000274658203125, 0.00136566162109375, 0.0030059814453125, 0.00464630126953125, 0.00628662109375, 0.00792694091796875, 0.0095672607421875, 0.01120758056640625, 0.012847900390625, 0.01448822021484375, 0.0161285400390625, 0.01776885986328125, 0.0194091796875, 0.02104949951171875, 0.0226898193359375, 0.02433013916015625, 0.025970458984375, 0.02761077880859375, 0.0292510986328125, 0.03089141845703125, 0.03253173828125, 0.03417205810546875, 0.0358123779296875, 0.03745269775390625, 0.039093017578125, 0.04073333740234375, 0.0423736572265625, 0.04401397705078125, 0.045654296875, 0.04729461669921875, 0.0489349365234375, 0.05057525634765625, 0.052215576171875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 6.0, 4.0, 10.0, 12.0, 25.0, 36.0, 32.0, 48.0, 65.0, 85.0, 98.0, 107.0, 90.0, 93.0, 76.0, 68.0, 51.0, 22.0, 20.0, 13.0, 13.0, 12.0, 7.0, 3.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34757858514785767, -0.33721330761909485, -0.32684803009033203, -0.3164827227592468, -0.306117445230484, -0.2957521677017212, -0.285386860370636, -0.27502158284187317, -0.26465630531311035, -0.25429102778434753, -0.24392573535442352, -0.2335604429244995, -0.2231951653957367, -0.21282988786697388, -0.20246459543704987, -0.19209930300712585, -0.18173402547836304, -0.17136874794960022, -0.1610034555196762, -0.1506381630897522, -0.14027288556098938, -0.12990760803222656, -0.11954231560230255, -0.10917703062295914, -0.09881174564361572, -0.08844646066427231, -0.0780811756849289, -0.06771589070558548, -0.057350605726242065, -0.04698532074689865, -0.03662003576755524, -0.026254750788211823, -0.015889465808868408, -0.005524180829524994, 0.00484110414981842, 0.015206389129161835, 0.02557167410850525, 0.03593695908784866, 0.04630224406719208, 0.05666752904653549, 0.0670328140258789, 0.07739809900522232, 0.08776338398456573, 0.09812866896390915, 0.10849395394325256, 0.11885923892259598, 0.1292245239019394, 0.1395898163318634, 0.14995509386062622, 0.16032037138938904, 0.17068566381931305, 0.18105095624923706, 0.19141623377799988, 0.2017815113067627, 0.2121468037366867, 0.22251209616661072, 0.23287737369537354, 0.24324265122413635, 0.25360792875289917, 0.2639732360839844, 0.2743385136127472, 0.28470379114151, 0.2950690984725952, 0.30543437600135803, 0.31579965353012085]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 5.0, 5.0, 8.0, 5.0, 14.0, 14.0, 13.0, 16.0, 18.0, 21.0, 21.0, 25.0, 23.0, 28.0, 43.0, 36.0, 43.0, 33.0, 48.0, 38.0, 45.0, 47.0, 46.0, 46.0, 40.0, 42.0, 38.0, 25.0, 41.0, 30.0, 23.0, 21.0, 27.0, 17.0, 11.0, 11.0, 7.0, 11.0, 9.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19329124689102173, -0.18715421855449677, -0.1810171753168106, -0.17488014698028564, -0.1687431037425995, -0.16260607540607452, -0.15646904706954956, -0.1503320038318634, -0.14419497549533844, -0.13805794715881348, -0.13192090392112732, -0.12578387558460236, -0.1196468397974968, -0.11350980401039124, -0.10737277567386627, -0.10123573988676071, -0.09509870409965515, -0.08896166831254959, -0.08282463252544403, -0.07668760418891907, -0.07055056840181351, -0.06441353261470795, -0.058276500552892685, -0.05213946849107742, -0.04600243270397186, -0.0398653969168663, -0.03372836485505104, -0.02759133093059063, -0.02145429700613022, -0.015317263081669807, -0.009180229157209396, -0.0030431970953941345, 0.0030938386917114258, 0.009230872616171837, 0.015367906540632248, 0.02150494046509266, 0.02764197438955307, 0.03377901017665863, 0.03991604223847389, 0.046053074300289154, 0.052190110087394714, 0.058327145874500275, 0.06446418166160583, 0.0706012099981308, 0.07673824578523636, 0.08287528157234192, 0.08901230990886688, 0.09514934569597244, 0.101286381483078, 0.10742341727018356, 0.11356045305728912, 0.11969748139381409, 0.12583452463150024, 0.1319715529680252, 0.13810858130455017, 0.14424562454223633, 0.1503826528787613, 0.15651968121528625, 0.1626567244529724, 0.16879375278949738, 0.17493078112602234, 0.1810678243637085, 0.18720485270023346, 0.19334188103675842, 0.19947892427444458]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 3.0, 11.0, 13.0, 21.0, 23.0, 32.0, 64.0, 55.0, 124.0, 178.0, 266.0, 336.0, 620.0, 957.0, 1557.0, 2701.0, 4777.0, 8416.0, 15406.0, 29094.0, 55342.0, 106444.0, 187080.0, 238217.0, 180998.0, 101298.0, 52842.0, 27695.0, 14829.0, 8051.0, 4467.0, 2536.0, 1538.0, 901.0, 555.0, 378.0, 241.0, 167.0, 101.0, 65.0, 50.0, 32.0, 30.0, 9.0, 8.0, 6.0, 7.0, 5.0, 4.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.051971435546875, -0.05026531219482422, -0.04855918884277344, -0.046853065490722656, -0.045146942138671875, -0.043440818786621094, -0.04173469543457031, -0.04002857208251953, -0.03832244873046875, -0.03661632537841797, -0.03491020202636719, -0.033204078674316406, -0.031497955322265625, -0.029791831970214844, -0.028085708618164062, -0.02637958526611328, -0.0246734619140625, -0.02296733856201172, -0.021261215209960938, -0.019555091857910156, -0.017848968505859375, -0.016142845153808594, -0.014436721801757812, -0.012730598449707031, -0.01102447509765625, -0.009318351745605469, -0.0076122283935546875, -0.005906105041503906, -0.004199981689453125, -0.0024938583374023438, -0.0007877349853515625, 0.0009183883666992188, 0.00262451171875, 0.004330635070800781, 0.0060367584228515625, 0.007742881774902344, 0.009449005126953125, 0.011155128479003906, 0.012861251831054688, 0.014567375183105469, 0.01627349853515625, 0.01797962188720703, 0.019685745239257812, 0.021391868591308594, 0.023097991943359375, 0.024804115295410156, 0.026510238647460938, 0.02821636199951172, 0.0299224853515625, 0.03162860870361328, 0.03333473205566406, 0.035040855407714844, 0.036746978759765625, 0.038453102111816406, 0.04015922546386719, 0.04186534881591797, 0.04357147216796875, 0.04527759552001953, 0.04698371887207031, 0.048689842224121094, 0.050395965576171875, 0.052102088928222656, 0.05380821228027344, 0.05551433563232422, 0.057220458984375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 3.0, 6.0, 15.0, 9.0, 13.0, 22.0, 13.0, 19.0, 24.0, 17.0, 34.0, 31.0, 37.0, 44.0, 44.0, 47.0, 35.0, 46.0, 43.0, 42.0, 51.0, 42.0, 49.0, 40.0, 51.0, 34.0, 25.0, 25.0, 22.0, 19.0, 15.0, 18.0, 16.0, 11.0, 16.0, 6.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0222930908203125, -0.021569252014160156, -0.020845413208007812, -0.02012157440185547, -0.019397735595703125, -0.01867389678955078, -0.017950057983398438, -0.017226219177246094, -0.01650238037109375, -0.015778541564941406, -0.015054702758789062, -0.014330863952636719, -0.013607025146484375, -0.012883186340332031, -0.012159347534179688, -0.011435508728027344, -0.010711669921875, -0.009987831115722656, -0.009263992309570312, -0.008540153503417969, -0.007816314697265625, -0.007092475891113281, -0.0063686370849609375, -0.005644798278808594, -0.00492095947265625, -0.004197120666503906, -0.0034732818603515625, -0.0027494430541992188, -0.002025604248046875, -0.0013017654418945312, -0.0005779266357421875, 0.00014591217041015625, 0.0008697509765625, 0.0015935897827148438, 0.0023174285888671875, 0.0030412673950195312, 0.003765106201171875, 0.004488945007324219, 0.0052127838134765625, 0.005936622619628906, 0.00666046142578125, 0.007384300231933594, 0.008108139038085938, 0.008831977844238281, 0.009555816650390625, 0.010279655456542969, 0.011003494262695312, 0.011727333068847656, 0.012451171875, 0.013175010681152344, 0.013898849487304688, 0.014622688293457031, 0.015346527099609375, 0.01607036590576172, 0.016794204711914062, 0.017518043518066406, 0.01824188232421875, 0.018965721130371094, 0.019689559936523438, 0.02041339874267578, 0.021137237548828125, 0.02186107635498047, 0.022584915161132812, 0.023308753967285156, 0.0240325927734375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 8.0, 5.0, 7.0, 8.0, 16.0, 17.0, 32.0, 35.0, 53.0, 114.0, 179.0, 321.0, 570.0, 1306.0, 3688.0, 14089.0, 67398.0, 371853.0, 471403.0, 91228.0, 18330.0, 4734.0, 1641.0, 695.0, 326.0, 190.0, 118.0, 72.0, 36.0, 39.0, 16.0, 12.0, 6.0, 7.0, 2.0, 6.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1307373046875, -0.1266632080078125, -0.122589111328125, -0.1185150146484375, -0.11444091796875, -0.1103668212890625, -0.106292724609375, -0.1022186279296875, -0.09814453125, -0.0940704345703125, -0.089996337890625, -0.0859222412109375, -0.08184814453125, -0.0777740478515625, -0.073699951171875, -0.0696258544921875, -0.0655517578125, -0.0614776611328125, -0.057403564453125, -0.0533294677734375, -0.04925537109375, -0.0451812744140625, -0.041107177734375, -0.0370330810546875, -0.032958984375, -0.0288848876953125, -0.024810791015625, -0.0207366943359375, -0.01666259765625, -0.0125885009765625, -0.008514404296875, -0.0044403076171875, -0.0003662109375, 0.0037078857421875, 0.007781982421875, 0.0118560791015625, 0.01593017578125, 0.0200042724609375, 0.024078369140625, 0.0281524658203125, 0.0322265625, 0.0363006591796875, 0.040374755859375, 0.0444488525390625, 0.04852294921875, 0.0525970458984375, 0.056671142578125, 0.0607452392578125, 0.0648193359375, 0.0688934326171875, 0.072967529296875, 0.0770416259765625, 0.08111572265625, 0.0851898193359375, 0.089263916015625, 0.0933380126953125, 0.097412109375, 0.1014862060546875, 0.105560302734375, 0.1096343994140625, 0.11370849609375, 0.1177825927734375, 0.121856689453125, 0.1259307861328125, 0.1300048828125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 7.0, 3.0, 7.0, 11.0, 17.0, 22.0, 18.0, 32.0, 29.0, 36.0, 35.0, 48.0, 42.0, 40.0, 46.0, 39.0, 53.0, 58.0, 52.0, 46.0, 37.0, 44.0, 43.0, 32.0, 26.0, 41.0, 22.0, 24.0, 20.0, 15.0, 15.0, 8.0, 8.0, 10.0, 5.0, 0.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1512451171875, -0.14704227447509766, -0.1428394317626953, -0.13863658905029297, -0.13443374633789062, -0.13023090362548828, -0.12602806091308594, -0.1218252182006836, -0.11762237548828125, -0.1134195327758789, -0.10921669006347656, -0.10501384735107422, -0.10081100463867188, -0.09660816192626953, -0.09240531921386719, -0.08820247650146484, -0.0839996337890625, -0.07979679107666016, -0.07559394836425781, -0.07139110565185547, -0.06718826293945312, -0.06298542022705078, -0.05878257751464844, -0.054579734802246094, -0.05037689208984375, -0.046174049377441406, -0.04197120666503906, -0.03776836395263672, -0.033565521240234375, -0.02936267852783203, -0.025159835815429688, -0.020956993103027344, -0.016754150390625, -0.012551307678222656, -0.008348464965820312, -0.004145622253417969, 5.7220458984375e-05, 0.004260063171386719, 0.008462905883789062, 0.012665748596191406, 0.01686859130859375, 0.021071434020996094, 0.025274276733398438, 0.02947711944580078, 0.033679962158203125, 0.03788280487060547, 0.04208564758300781, 0.046288490295410156, 0.0504913330078125, 0.054694175720214844, 0.05889701843261719, 0.06309986114501953, 0.06730270385742188, 0.07150554656982422, 0.07570838928222656, 0.0799112319946289, 0.08411407470703125, 0.0883169174194336, 0.09251976013183594, 0.09672260284423828, 0.10092544555664062, 0.10512828826904297, 0.10933113098144531, 0.11353397369384766, 0.11773681640625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 2.0, 6.0, 10.0, 12.0, 26.0, 40.0, 106.0, 189.0, 482.0, 1344.0, 4262.0, 18926.0, 134164.0, 658803.0, 196743.0, 25275.0, 5512.0, 1666.0, 562.0, 215.0, 103.0, 53.0, 23.0, 13.0, 10.0, 7.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07818603515625, -0.07535171508789062, -0.07251739501953125, -0.06968307495117188, -0.0668487548828125, -0.06401443481445312, -0.06118011474609375, -0.058345794677734375, -0.055511474609375, -0.052677154541015625, -0.04984283447265625, -0.047008514404296875, -0.0441741943359375, -0.041339874267578125, -0.03850555419921875, -0.035671234130859375, -0.0328369140625, -0.030002593994140625, -0.02716827392578125, -0.024333953857421875, -0.0214996337890625, -0.018665313720703125, -0.01583099365234375, -0.012996673583984375, -0.010162353515625, -0.007328033447265625, -0.00449371337890625, -0.001659393310546875, 0.0011749267578125, 0.004009246826171875, 0.00684356689453125, 0.009677886962890625, 0.01251220703125, 0.015346527099609375, 0.01818084716796875, 0.021015167236328125, 0.0238494873046875, 0.026683807373046875, 0.02951812744140625, 0.032352447509765625, 0.035186767578125, 0.038021087646484375, 0.04085540771484375, 0.043689727783203125, 0.0465240478515625, 0.049358367919921875, 0.05219268798828125, 0.055027008056640625, 0.057861328125, 0.060695648193359375, 0.06352996826171875, 0.06636428833007812, 0.0691986083984375, 0.07203292846679688, 0.07486724853515625, 0.07770156860351562, 0.080535888671875, 0.08337020874023438, 0.08620452880859375, 0.08903884887695312, 0.0918731689453125, 0.09470748901367188, 0.09754180908203125, 0.10037612915039062, 0.10321044921875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 12.0, 14.0, 7.0, 12.0, 16.0, 23.0, 23.0, 28.0, 35.0, 50.0, 47.0, 68.0, 54.0, 56.0, 71.0, 68.0, 77.0, 56.0, 38.0, 47.0, 41.0, 28.0, 21.0, 18.0, 19.0, 15.0, 14.0, 12.0, 14.0, 7.0, 3.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.9981136322021484e-05, -2.9064714908599854e-05, -2.8148293495178223e-05, -2.7231872081756592e-05, -2.631545066833496e-05, -2.539902925491333e-05, -2.44826078414917e-05, -2.356618642807007e-05, -2.2649765014648438e-05, -2.1733343601226807e-05, -2.0816922187805176e-05, -1.9900500774383545e-05, -1.8984079360961914e-05, -1.8067657947540283e-05, -1.7151236534118652e-05, -1.623481512069702e-05, -1.531839370727539e-05, -1.440197229385376e-05, -1.3485550880432129e-05, -1.2569129467010498e-05, -1.1652708053588867e-05, -1.0736286640167236e-05, -9.819865226745605e-06, -8.903443813323975e-06, -7.987022399902344e-06, -7.070600986480713e-06, -6.154179573059082e-06, -5.237758159637451e-06, -4.32133674621582e-06, -3.4049153327941895e-06, -2.4884939193725586e-06, -1.5720725059509277e-06, -6.556510925292969e-07, 2.60770320892334e-07, 1.1771917343139648e-06, 2.0936131477355957e-06, 3.0100345611572266e-06, 3.926455974578857e-06, 4.842877388000488e-06, 5.759298801422119e-06, 6.67572021484375e-06, 7.592141628265381e-06, 8.508563041687012e-06, 9.424984455108643e-06, 1.0341405868530273e-05, 1.1257827281951904e-05, 1.2174248695373535e-05, 1.3090670108795166e-05, 1.4007091522216797e-05, 1.4923512935638428e-05, 1.583993434906006e-05, 1.675635576248169e-05, 1.767277717590332e-05, 1.858919858932495e-05, 1.9505620002746582e-05, 2.0422041416168213e-05, 2.1338462829589844e-05, 2.2254884243011475e-05, 2.3171305656433105e-05, 2.4087727069854736e-05, 2.5004148483276367e-05, 2.5920569896697998e-05, 2.683699131011963e-05, 2.775341272354126e-05, 2.866983413696289e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 5.0, 8.0, 21.0, 18.0, 23.0, 40.0, 56.0, 97.0, 124.0, 181.0, 304.0, 492.0, 952.0, 1949.0, 4039.0, 8983.0, 23889.0, 74084.0, 245071.0, 416149.0, 184057.0, 55253.0, 18364.0, 7284.0, 3443.0, 1598.0, 791.0, 483.0, 270.0, 174.0, 106.0, 85.0, 49.0, 37.0, 28.0, 16.0, 10.0, 4.0, 7.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.04931640625, -0.04769277572631836, -0.04606914520263672, -0.04444551467895508, -0.04282188415527344, -0.0411982536315918, -0.039574623107910156, -0.037950992584228516, -0.036327362060546875, -0.034703731536865234, -0.033080101013183594, -0.03145647048950195, -0.029832839965820312, -0.028209209442138672, -0.02658557891845703, -0.02496194839477539, -0.02333831787109375, -0.02171468734741211, -0.02009105682373047, -0.018467426300048828, -0.016843795776367188, -0.015220165252685547, -0.013596534729003906, -0.011972904205322266, -0.010349273681640625, -0.008725643157958984, -0.007102012634277344, -0.005478382110595703, -0.0038547515869140625, -0.002231121063232422, -0.0006074905395507812, 0.0010161399841308594, 0.0026397705078125, 0.004263401031494141, 0.005887031555175781, 0.007510662078857422, 0.009134292602539062, 0.010757923126220703, 0.012381553649902344, 0.014005184173583984, 0.015628814697265625, 0.017252445220947266, 0.018876075744628906, 0.020499706268310547, 0.022123336791992188, 0.023746967315673828, 0.02537059783935547, 0.02699422836303711, 0.02861785888671875, 0.03024148941040039, 0.03186511993408203, 0.03348875045776367, 0.03511238098144531, 0.03673601150512695, 0.038359642028808594, 0.039983272552490234, 0.041606903076171875, 0.043230533599853516, 0.044854164123535156, 0.0464777946472168, 0.04810142517089844, 0.04972505569458008, 0.05134868621826172, 0.05297231674194336, 0.054595947265625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 9.0, 6.0, 6.0, 9.0, 15.0, 11.0, 17.0, 17.0, 26.0, 28.0, 36.0, 48.0, 57.0, 59.0, 69.0, 86.0, 64.0, 57.0, 54.0, 59.0, 38.0, 39.0, 35.0, 30.0, 21.0, 18.0, 13.0, 15.0, 17.0, 9.0, 6.0, 5.0, 5.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.046783447265625, -0.045366764068603516, -0.04395008087158203, -0.04253339767456055, -0.04111671447753906, -0.03970003128051758, -0.038283348083496094, -0.03686666488647461, -0.035449981689453125, -0.03403329849243164, -0.032616615295410156, -0.031199932098388672, -0.029783248901367188, -0.028366565704345703, -0.02694988250732422, -0.025533199310302734, -0.02411651611328125, -0.022699832916259766, -0.02128314971923828, -0.019866466522216797, -0.018449783325195312, -0.017033100128173828, -0.015616416931152344, -0.01419973373413086, -0.012783050537109375, -0.01136636734008789, -0.009949684143066406, -0.008533000946044922, -0.0071163177490234375, -0.005699634552001953, -0.004282951354980469, -0.0028662681579589844, -0.0014495849609375, -3.2901763916015625e-05, 0.0013837814331054688, 0.002800464630126953, 0.0042171478271484375, 0.005633831024169922, 0.007050514221191406, 0.00846719741821289, 0.009883880615234375, 0.01130056381225586, 0.012717247009277344, 0.014133930206298828, 0.015550613403320312, 0.016967296600341797, 0.01838397979736328, 0.019800662994384766, 0.02121734619140625, 0.022634029388427734, 0.02405071258544922, 0.025467395782470703, 0.026884078979492188, 0.028300762176513672, 0.029717445373535156, 0.03113412857055664, 0.032550811767578125, 0.03396749496459961, 0.035384178161621094, 0.03680086135864258, 0.03821754455566406, 0.03963422775268555, 0.04105091094970703, 0.042467594146728516, 0.04388427734375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 8.0, 9.0, 11.0, 21.0, 30.0, 41.0, 70.0, 87.0, 122.0, 131.0, 127.0, 109.0, 76.0, 61.0, 30.0, 26.0, 13.0, 12.0, 5.0, 6.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6081541776657104, -0.5803227424621582, -0.552491307258606, -0.5246598720550537, -0.49682846665382385, -0.4689970314502716, -0.44116559624671936, -0.4133341908454895, -0.38550275564193726, -0.357671320438385, -0.32983988523483276, -0.3020084500312805, -0.27417704463005066, -0.2463456094264984, -0.21851417422294617, -0.19068275392055511, -0.16285130381584167, -0.13501986861228943, -0.10718844830989838, -0.07935701310634613, -0.05152558535337448, -0.023694157600402832, 0.004137277603149414, 0.031968697905540466, 0.05980013310909271, 0.08763156086206436, 0.11546298861503601, 0.14329442381858826, 0.1711258590221405, 0.19895727932453156, 0.2267887145280838, 0.25462013483047485, 0.2824515700340271, 0.31028300523757935, 0.3381144404411316, 0.36594587564468384, 0.3937772810459137, 0.42160871624946594, 0.4494401514530182, 0.47727155685424805, 0.5051029920578003, 0.5329344272613525, 0.5607658624649048, 0.588597297668457, 0.6164287328720093, 0.6442601680755615, 0.6720916032791138, 0.6999229788780212, 0.7277544736862183, 0.7555859088897705, 0.7834173440933228, 0.811248779296875, 0.8390802145004272, 0.8669116497039795, 0.8947430849075317, 0.9225744605064392, 0.9504058957099915, 0.9782373309135437, 1.0060687065124512, 1.0339001417160034, 1.0617315769195557, 1.089563012123108, 1.1173944473266602, 1.1452258825302124, 1.1730573177337646]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 8.0, 10.0, 11.0, 6.0, 12.0, 8.0, 19.0, 23.0, 18.0, 18.0, 26.0, 19.0, 39.0, 29.0, 31.0, 29.0, 33.0, 46.0, 42.0, 44.0, 51.0, 50.0, 50.0, 29.0, 39.0, 37.0, 38.0, 35.0, 34.0, 30.0, 26.0, 24.0, 8.0, 16.0, 6.0, 13.0, 6.0, 9.0, 10.0, 7.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5535398125648499, -0.5352002382278442, -0.5168606638908386, -0.4985211193561554, -0.48018157482147217, -0.46184200048446655, -0.44350242614746094, -0.4251628816127777, -0.4068233370780945, -0.38848376274108887, -0.37014421820640564, -0.3518046438694, -0.3334650993347168, -0.3151255249977112, -0.29678595066070557, -0.27844640612602234, -0.2601068317890167, -0.2417672723531723, -0.22342771291732788, -0.20508813858032227, -0.18674859404563904, -0.16840901970863342, -0.150069460272789, -0.13172990083694458, -0.11339034140110016, -0.09505078196525574, -0.07671122252941132, -0.0583716556429863, -0.040032096207141876, -0.021692536771297455, -0.0033529698848724365, 0.014986589550971985, 0.033326148986816406, 0.05166570842266083, 0.07000526785850525, 0.08834483474493027, 0.10668439418077469, 0.1250239610671997, 0.14336352050304413, 0.16170307993888855, 0.18004263937473297, 0.1983821988105774, 0.21672175824642181, 0.23506131768226624, 0.25340089201927185, 0.2717404365539551, 0.2900800108909607, 0.3084195852279663, 0.32675912976264954, 0.34509870409965515, 0.3634382486343384, 0.381777822971344, 0.4001173675060272, 0.41845694184303284, 0.43679648637771606, 0.4551360607147217, 0.4734756350517273, 0.4918152093887329, 0.5101547837257385, 0.5284942984580994, 0.546833872795105, 0.5651734471321106, 0.5835130214691162, 0.601852536201477, 0.6201921105384827]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 3.0, 7.0, 7.0, 4.0, 8.0, 10.0, 11.0, 25.0, 23.0, 38.0, 37.0, 46.0, 59.0, 74.0, 111.0, 164.0, 212.0, 376.0, 455.0, 772.0, 1373.0, 2770.0, 7238.0, 32811.0, 4052784.0, 75945.0, 10715.0, 3601.0, 1727.0, 955.0, 600.0, 391.0, 253.0, 173.0, 123.0, 89.0, 74.0, 34.0, 34.0, 36.0, 29.0, 12.0, 7.0, 15.0, 10.0, 13.0, 7.0, 8.0, 3.0, 6.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.2086181640625, -0.20223236083984375, -0.1958465576171875, -0.18946075439453125, -0.183074951171875, -0.17668914794921875, -0.1703033447265625, -0.16391754150390625, -0.15753173828125, -0.15114593505859375, -0.1447601318359375, -0.13837432861328125, -0.131988525390625, -0.12560272216796875, -0.1192169189453125, -0.11283111572265625, -0.1064453125, -0.10005950927734375, -0.0936737060546875, -0.08728790283203125, -0.080902099609375, -0.07451629638671875, -0.0681304931640625, -0.06174468994140625, -0.05535888671875, -0.04897308349609375, -0.0425872802734375, -0.03620147705078125, -0.029815673828125, -0.02342987060546875, -0.0170440673828125, -0.01065826416015625, -0.0042724609375, 0.00211334228515625, 0.0084991455078125, 0.01488494873046875, 0.021270751953125, 0.02765655517578125, 0.0340423583984375, 0.04042816162109375, 0.04681396484375, 0.05319976806640625, 0.0595855712890625, 0.06597137451171875, 0.072357177734375, 0.07874298095703125, 0.0851287841796875, 0.09151458740234375, 0.097900390625, 0.10428619384765625, 0.1106719970703125, 0.11705780029296875, 0.123443603515625, 0.12982940673828125, 0.1362152099609375, 0.14260101318359375, 0.14898681640625, 0.15537261962890625, 0.1617584228515625, 0.16814422607421875, 0.174530029296875, 0.18091583251953125, 0.1873016357421875, 0.19368743896484375, 0.2000732421875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 2.0, 7.0, 1.0, 8.0, 14.0, 10.0, 6.0, 13.0, 17.0, 17.0, 22.0, 13.0, 27.0, 29.0, 32.0, 34.0, 37.0, 40.0, 42.0, 32.0, 44.0, 38.0, 40.0, 38.0, 43.0, 35.0, 39.0, 31.0, 36.0, 38.0, 32.0, 34.0, 21.0, 17.0, 25.0, 10.0, 11.0, 13.0, 11.0, 8.0, 2.0, 14.0, 5.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.022979736328125, -0.022265195846557617, -0.021550655364990234, -0.02083611488342285, -0.02012157440185547, -0.019407033920288086, -0.018692493438720703, -0.01797795295715332, -0.017263412475585938, -0.016548871994018555, -0.015834331512451172, -0.015119791030883789, -0.014405250549316406, -0.013690710067749023, -0.01297616958618164, -0.012261629104614258, -0.011547088623046875, -0.010832548141479492, -0.01011800765991211, -0.009403467178344727, -0.008688926696777344, -0.007974386215209961, -0.007259845733642578, -0.006545305252075195, -0.0058307647705078125, -0.00511622428894043, -0.004401683807373047, -0.003687143325805664, -0.0029726028442382812, -0.0022580623626708984, -0.0015435218811035156, -0.0008289813995361328, -0.00011444091796875, 0.0006000995635986328, 0.0013146400451660156, 0.0020291805267333984, 0.0027437210083007812, 0.003458261489868164, 0.004172801971435547, 0.00488734245300293, 0.0056018829345703125, 0.006316423416137695, 0.007030963897705078, 0.007745504379272461, 0.008460044860839844, 0.009174585342407227, 0.00988912582397461, 0.010603666305541992, 0.011318206787109375, 0.012032747268676758, 0.01274728775024414, 0.013461828231811523, 0.014176368713378906, 0.014890909194946289, 0.015605449676513672, 0.016319990158081055, 0.017034530639648438, 0.01774907112121582, 0.018463611602783203, 0.019178152084350586, 0.01989269256591797, 0.02060723304748535, 0.021321773529052734, 0.022036314010620117, 0.0227508544921875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 1.0, 4.0, 2.0, 9.0, 5.0, 10.0, 13.0, 11.0, 26.0, 35.0, 51.0, 57.0, 83.0, 112.0, 152.0, 209.0, 320.0, 501.0, 763.0, 1225.0, 2353.0, 5280.0, 15446.0, 130337.0, 3982670.0, 37652.0, 8778.0, 3605.0, 1799.0, 882.0, 630.0, 354.0, 255.0, 193.0, 132.0, 82.0, 62.0, 45.0, 48.0, 30.0, 15.0, 15.0, 11.0, 6.0, 7.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.25244140625, -0.2452831268310547, -0.23812484741210938, -0.23096656799316406, -0.22380828857421875, -0.21665000915527344, -0.20949172973632812, -0.2023334503173828, -0.1951751708984375, -0.1880168914794922, -0.18085861206054688, -0.17370033264160156, -0.16654205322265625, -0.15938377380371094, -0.15222549438476562, -0.1450672149658203, -0.137908935546875, -0.1307506561279297, -0.12359237670898438, -0.11643409729003906, -0.10927581787109375, -0.10211753845214844, -0.09495925903320312, -0.08780097961425781, -0.0806427001953125, -0.07348442077636719, -0.06632614135742188, -0.05916786193847656, -0.05200958251953125, -0.04485130310058594, -0.037693023681640625, -0.030534744262695312, -0.02337646484375, -0.016218185424804688, -0.009059906005859375, -0.0019016265869140625, 0.00525665283203125, 0.012414932250976562, 0.019573211669921875, 0.026731491088867188, 0.0338897705078125, 0.04104804992675781, 0.048206329345703125, 0.05536460876464844, 0.06252288818359375, 0.06968116760253906, 0.07683944702148438, 0.08399772644042969, 0.091156005859375, 0.09831428527832031, 0.10547256469726562, 0.11263084411621094, 0.11978912353515625, 0.12694740295410156, 0.13410568237304688, 0.1412639617919922, 0.1484222412109375, 0.1555805206298828, 0.16273880004882812, 0.16989707946777344, 0.17705535888671875, 0.18421363830566406, 0.19137191772460938, 0.1985301971435547, 0.2056884765625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 2.0, 5.0, 0.0, 12.0, 9.0, 14.0, 34.0, 81.0, 463.0, 3227.0, 123.0, 47.0, 24.0, 10.0, 4.0, 6.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049774169921875, -0.04822492599487305, -0.046675682067871094, -0.04512643814086914, -0.04357719421386719, -0.042027950286865234, -0.04047870635986328, -0.03892946243286133, -0.037380218505859375, -0.03583097457885742, -0.03428173065185547, -0.032732486724853516, -0.031183242797851562, -0.02963399887084961, -0.028084754943847656, -0.026535511016845703, -0.02498626708984375, -0.023437023162841797, -0.021887779235839844, -0.02033853530883789, -0.018789291381835938, -0.017240047454833984, -0.01569080352783203, -0.014141559600830078, -0.012592315673828125, -0.011043071746826172, -0.009493827819824219, -0.007944583892822266, -0.0063953399658203125, -0.004846096038818359, -0.0032968521118164062, -0.0017476081848144531, -0.0001983642578125, 0.0013508796691894531, 0.0029001235961914062, 0.004449367523193359, 0.0059986114501953125, 0.007547855377197266, 0.009097099304199219, 0.010646343231201172, 0.012195587158203125, 0.013744831085205078, 0.015294075012207031, 0.016843318939208984, 0.018392562866210938, 0.01994180679321289, 0.021491050720214844, 0.023040294647216797, 0.02458953857421875, 0.026138782501220703, 0.027688026428222656, 0.02923727035522461, 0.030786514282226562, 0.032335758209228516, 0.03388500213623047, 0.03543424606323242, 0.036983489990234375, 0.03853273391723633, 0.04008197784423828, 0.041631221771240234, 0.04318046569824219, 0.04472970962524414, 0.046278953552246094, 0.04782819747924805, 0.04937744140625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 1.0, 4.0, 4.0, 13.0, 9.0, 12.0, 19.0, 36.0, 38.0, 69.0, 87.0, 101.0, 118.0, 110.0, 109.0, 71.0, 60.0, 59.0, 27.0, 22.0, 15.0, 8.0, 3.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14739945530891418, -0.14217491447925568, -0.13695037364959717, -0.13172583281993866, -0.12650129199028015, -0.12127675861120224, -0.11605222523212433, -0.11082768440246582, -0.10560314357280731, -0.1003786027431488, -0.0951540619134903, -0.08992952853441238, -0.08470498770475388, -0.07948044687509537, -0.07425591349601746, -0.06903137266635895, -0.06380683183670044, -0.05858229100704193, -0.05335775390267372, -0.04813321679830551, -0.042908675968647, -0.037684135138988495, -0.032459598034620285, -0.027235060930252075, -0.022010520100593567, -0.016785981133580208, -0.011561442166566849, -0.00633690319955349, -0.0011123642325401306, 0.0041121747344732285, 0.009336713701486588, 0.014561250805854797, 0.019785791635513306, 0.025010330602526665, 0.030234869569540024, 0.035459406673908234, 0.04068394750356674, 0.04590848833322525, 0.05113302543759346, 0.05635756254196167, 0.06158210337162018, 0.06680664420127869, 0.0720311850309372, 0.0772557184100151, 0.08248025923967361, 0.08770480006933212, 0.09292933344841003, 0.09815387427806854, 0.10337841510772705, 0.10860295593738556, 0.11382749676704407, 0.11905203014612198, 0.12427657097578049, 0.1295011043548584, 0.1347256451845169, 0.13995018601417542, 0.14517472684383392, 0.15039926767349243, 0.15562380850315094, 0.16084834933280945, 0.16607287526130676, 0.17129741609096527, 0.17652195692062378, 0.1817464977502823, 0.1869710385799408]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 6.0, 10.0, 6.0, 5.0, 4.0, 13.0, 15.0, 24.0, 13.0, 23.0, 28.0, 18.0, 26.0, 31.0, 47.0, 43.0, 44.0, 47.0, 50.0, 59.0, 53.0, 49.0, 35.0, 36.0, 52.0, 34.0, 34.0, 26.0, 33.0, 26.0, 26.0, 18.0, 14.0, 11.0, 9.0, 14.0, 10.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.08530747890472412, -0.08259212970733643, -0.07987678050994873, -0.07716142386198044, -0.07444607466459274, -0.07173072546720505, -0.06901536881923676, -0.06630001962184906, -0.06358467042446136, -0.06086932122707367, -0.058153968304395676, -0.05543861538171768, -0.05272326618432999, -0.05000791698694229, -0.0472925640642643, -0.044577211141586304, -0.04186186194419861, -0.03914651274681091, -0.03643115982413292, -0.033715806901454926, -0.03100045770406723, -0.028285106644034386, -0.02556975558400154, -0.022854404523968697, -0.020139053463935852, -0.017423702403903008, -0.014708351343870163, -0.011993000283837318, -0.009277649223804474, -0.006562298163771629, -0.003846947103738785, -0.0011315960437059402, 0.0015837550163269043, 0.004299106076359749, 0.007014457136392593, 0.009729808196425438, 0.012445159256458282, 0.015160510316491127, 0.01787586137652397, 0.020591212436556816, 0.02330656349658966, 0.026021914556622505, 0.02873726561665535, 0.031452618539333344, 0.03416796773672104, 0.036883316934108734, 0.03959866985678673, 0.04231402277946472, 0.04502937197685242, 0.04774472117424011, 0.050460074096918106, 0.0531754270195961, 0.055890776216983795, 0.05860612541437149, 0.061321478337049484, 0.06403683125972748, 0.06675218045711517, 0.06946752965450287, 0.07218287885189056, 0.07489823549985886, 0.07761358469724655, 0.08032893389463425, 0.08304429054260254, 0.08575963973999023, 0.08847498893737793]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 9.0, 11.0, 15.0, 26.0, 37.0, 45.0, 67.0, 102.0, 130.0, 252.0, 356.0, 521.0, 901.0, 1495.0, 2569.0, 4578.0, 8540.0, 16754.0, 34574.0, 71812.0, 147712.0, 249193.0, 239987.0, 137511.0, 66006.0, 31437.0, 15572.0, 7879.0, 4211.0, 2433.0, 1419.0, 868.0, 555.0, 328.0, 212.0, 142.0, 87.0, 66.0, 42.0, 26.0, 20.0, 20.0, 13.0, 3.0, 9.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052032470703125, -0.0501704216003418, -0.048308372497558594, -0.04644632339477539, -0.04458427429199219, -0.042722225189208984, -0.04086017608642578, -0.03899812698364258, -0.037136077880859375, -0.03527402877807617, -0.03341197967529297, -0.031549930572509766, -0.029687881469726562, -0.02782583236694336, -0.025963783264160156, -0.024101734161376953, -0.02223968505859375, -0.020377635955810547, -0.018515586853027344, -0.01665353775024414, -0.014791488647460938, -0.012929439544677734, -0.011067390441894531, -0.009205341339111328, -0.007343292236328125, -0.005481243133544922, -0.0036191940307617188, -0.0017571449279785156, 0.0001049041748046875, 0.0019669532775878906, 0.0038290023803710938, 0.005691051483154297, 0.0075531005859375, 0.009415149688720703, 0.011277198791503906, 0.01313924789428711, 0.015001296997070312, 0.016863346099853516, 0.01872539520263672, 0.020587444305419922, 0.022449493408203125, 0.024311542510986328, 0.02617359161376953, 0.028035640716552734, 0.029897689819335938, 0.03175973892211914, 0.033621788024902344, 0.03548383712768555, 0.03734588623046875, 0.03920793533325195, 0.041069984436035156, 0.04293203353881836, 0.04479408264160156, 0.046656131744384766, 0.04851818084716797, 0.05038022994995117, 0.052242279052734375, 0.05410432815551758, 0.05596637725830078, 0.057828426361083984, 0.05969047546386719, 0.06155252456665039, 0.0634145736694336, 0.0652766227722168, 0.067138671875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 0.0, 6.0, 11.0, 8.0, 6.0, 17.0, 16.0, 13.0, 25.0, 18.0, 21.0, 28.0, 20.0, 30.0, 34.0, 36.0, 38.0, 36.0, 38.0, 44.0, 46.0, 44.0, 53.0, 46.0, 42.0, 38.0, 44.0, 33.0, 27.0, 31.0, 32.0, 18.0, 24.0, 18.0, 15.0, 6.0, 7.0, 12.0, 5.0, 9.0, 6.0, 4.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.021697998046875, -0.020832061767578125, -0.01996612548828125, -0.019100189208984375, -0.0182342529296875, -0.017368316650390625, -0.01650238037109375, -0.015636444091796875, -0.0147705078125, -0.013904571533203125, -0.01303863525390625, -0.012172698974609375, -0.0113067626953125, -0.010440826416015625, -0.00957489013671875, -0.008708953857421875, -0.007843017578125, -0.006977081298828125, -0.00611114501953125, -0.005245208740234375, -0.0043792724609375, -0.003513336181640625, -0.00264739990234375, -0.001781463623046875, -0.00091552734375, -4.9591064453125e-05, 0.00081634521484375, 0.001682281494140625, 0.0025482177734375, 0.003414154052734375, 0.00428009033203125, 0.005146026611328125, 0.006011962890625, 0.006877899169921875, 0.00774383544921875, 0.008609771728515625, 0.0094757080078125, 0.010341644287109375, 0.01120758056640625, 0.012073516845703125, 0.012939453125, 0.013805389404296875, 0.01467132568359375, 0.015537261962890625, 0.0164031982421875, 0.017269134521484375, 0.01813507080078125, 0.019001007080078125, 0.019866943359375, 0.020732879638671875, 0.02159881591796875, 0.022464752197265625, 0.0233306884765625, 0.024196624755859375, 0.02506256103515625, 0.025928497314453125, 0.02679443359375, 0.027660369873046875, 0.02852630615234375, 0.029392242431640625, 0.0302581787109375, 0.031124114990234375, 0.03199005126953125, 0.032855987548828125, 0.033721923828125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 16.0, 8.0, 17.0, 26.0, 46.0, 87.0, 97.0, 175.0, 325.0, 559.0, 1076.0, 2345.0, 6668.0, 24314.0, 124864.0, 585610.0, 243485.0, 42056.0, 10336.0, 3379.0, 1413.0, 718.0, 363.0, 215.0, 126.0, 94.0, 50.0, 30.0, 19.0, 20.0, 8.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.15283203125, -0.14877605438232422, -0.14472007751464844, -0.14066410064697266, -0.13660812377929688, -0.1325521469116211, -0.1284961700439453, -0.12444019317626953, -0.12038421630859375, -0.11632823944091797, -0.11227226257324219, -0.1082162857055664, -0.10416030883789062, -0.10010433197021484, -0.09604835510253906, -0.09199237823486328, -0.0879364013671875, -0.08388042449951172, -0.07982444763183594, -0.07576847076416016, -0.07171249389648438, -0.0676565170288086, -0.06360054016113281, -0.05954456329345703, -0.05548858642578125, -0.05143260955810547, -0.04737663269042969, -0.043320655822753906, -0.039264678955078125, -0.035208702087402344, -0.031152725219726562, -0.02709674835205078, -0.023040771484375, -0.01898479461669922, -0.014928817749023438, -0.010872840881347656, -0.006816864013671875, -0.0027608871459960938, 0.0012950897216796875, 0.005351066589355469, 0.00940704345703125, 0.013463020324707031, 0.017518997192382812, 0.021574974060058594, 0.025630950927734375, 0.029686927795410156, 0.03374290466308594, 0.03779888153076172, 0.0418548583984375, 0.04591083526611328, 0.04996681213378906, 0.054022789001464844, 0.058078765869140625, 0.062134742736816406, 0.06619071960449219, 0.07024669647216797, 0.07430267333984375, 0.07835865020751953, 0.08241462707519531, 0.0864706039428711, 0.09052658081054688, 0.09458255767822266, 0.09863853454589844, 0.10269451141357422, 0.10675048828125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 6.0, 2.0, 6.0, 7.0, 8.0, 10.0, 9.0, 10.0, 10.0, 21.0, 17.0, 22.0, 18.0, 35.0, 33.0, 31.0, 39.0, 31.0, 41.0, 44.0, 51.0, 43.0, 39.0, 48.0, 38.0, 43.0, 33.0, 41.0, 30.0, 30.0, 30.0, 31.0, 19.0, 25.0, 16.0, 13.0, 15.0, 11.0, 8.0, 10.0, 5.0, 7.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.1290283203125, -0.12491607666015625, -0.1208038330078125, -0.11669158935546875, -0.112579345703125, -0.10846710205078125, -0.1043548583984375, -0.10024261474609375, -0.09613037109375, -0.09201812744140625, -0.0879058837890625, -0.08379364013671875, -0.079681396484375, -0.07556915283203125, -0.0714569091796875, -0.06734466552734375, -0.063232421875, -0.05912017822265625, -0.0550079345703125, -0.05089569091796875, -0.046783447265625, -0.04267120361328125, -0.0385589599609375, -0.03444671630859375, -0.03033447265625, -0.02622222900390625, -0.0221099853515625, -0.01799774169921875, -0.013885498046875, -0.00977325439453125, -0.0056610107421875, -0.00154876708984375, 0.0025634765625, 0.00667572021484375, 0.0107879638671875, 0.01490020751953125, 0.019012451171875, 0.02312469482421875, 0.0272369384765625, 0.03134918212890625, 0.03546142578125, 0.03957366943359375, 0.0436859130859375, 0.04779815673828125, 0.051910400390625, 0.05602264404296875, 0.0601348876953125, 0.06424713134765625, 0.068359375, 0.07247161865234375, 0.0765838623046875, 0.08069610595703125, 0.084808349609375, 0.08892059326171875, 0.0930328369140625, 0.09714508056640625, 0.10125732421875, 0.10536956787109375, 0.1094818115234375, 0.11359405517578125, 0.117706298828125, 0.12181854248046875, 0.1259307861328125, 0.13004302978515625, 0.1341552734375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 5.0, 4.0, 4.0, 26.0, 28.0, 40.0, 62.0, 91.0, 231.0, 525.0, 1617.0, 6515.0, 116863.0, 898852.0, 18976.0, 3064.0, 950.0, 320.0, 145.0, 92.0, 48.0, 22.0, 29.0, 12.0, 7.0, 10.0, 7.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.29150390625, -0.28426170349121094, -0.2770195007324219, -0.2697772979736328, -0.26253509521484375, -0.2552928924560547, -0.24805068969726562, -0.24080848693847656, -0.2335662841796875, -0.22632408142089844, -0.21908187866210938, -0.2118396759033203, -0.20459747314453125, -0.1973552703857422, -0.19011306762695312, -0.18287086486816406, -0.175628662109375, -0.16838645935058594, -0.16114425659179688, -0.1539020538330078, -0.14665985107421875, -0.1394176483154297, -0.13217544555664062, -0.12493324279785156, -0.1176910400390625, -0.11044883728027344, -0.10320663452148438, -0.09596443176269531, -0.08872222900390625, -0.08148002624511719, -0.07423782348632812, -0.06699562072753906, -0.05975341796875, -0.05251121520996094, -0.045269012451171875, -0.03802680969238281, -0.03078460693359375, -0.023542404174804688, -0.016300201416015625, -0.009057998657226562, -0.0018157958984375, 0.0054264068603515625, 0.012668609619140625, 0.019910812377929688, 0.02715301513671875, 0.03439521789550781, 0.041637420654296875, 0.04887962341308594, 0.056121826171875, 0.06336402893066406, 0.07060623168945312, 0.07784843444824219, 0.08509063720703125, 0.09233283996582031, 0.09957504272460938, 0.10681724548339844, 0.1140594482421875, 0.12130165100097656, 0.12854385375976562, 0.1357860565185547, 0.14302825927734375, 0.1502704620361328, 0.15751266479492188, 0.16475486755371094, 0.1719970703125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 7.0, 11.0, 12.0, 24.0, 33.0, 56.0, 57.0, 72.0, 101.0, 122.0, 109.0, 94.0, 75.0, 56.0, 48.0, 47.0, 27.0, 22.0, 10.0, 7.0, 5.0, 3.0, 5.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-5.835294723510742e-05, -5.705840885639191e-05, -5.576387047767639e-05, -5.4469332098960876e-05, -5.317479372024536e-05, -5.1880255341529846e-05, -5.058571696281433e-05, -4.9291178584098816e-05, -4.79966402053833e-05, -4.6702101826667786e-05, -4.540756344795227e-05, -4.4113025069236755e-05, -4.281848669052124e-05, -4.1523948311805725e-05, -4.022940993309021e-05, -3.8934871554374695e-05, -3.764033317565918e-05, -3.6345794796943665e-05, -3.505125641822815e-05, -3.3756718039512634e-05, -3.246217966079712e-05, -3.1167641282081604e-05, -2.987310290336609e-05, -2.8578564524650574e-05, -2.728402614593506e-05, -2.5989487767219543e-05, -2.469494938850403e-05, -2.3400411009788513e-05, -2.2105872631072998e-05, -2.0811334252357483e-05, -1.9516795873641968e-05, -1.8222257494926453e-05, -1.6927719116210938e-05, -1.5633180737495422e-05, -1.4338642358779907e-05, -1.3044103980064392e-05, -1.1749565601348877e-05, -1.0455027222633362e-05, -9.160488843917847e-06, -7.865950465202332e-06, -6.571412086486816e-06, -5.276873707771301e-06, -3.982335329055786e-06, -2.687796950340271e-06, -1.3932585716247559e-06, -9.872019290924072e-08, 1.1958181858062744e-06, 2.4903565645217896e-06, 3.7848949432373047e-06, 5.07943332195282e-06, 6.373971700668335e-06, 7.66851007938385e-06, 8.963048458099365e-06, 1.025758683681488e-05, 1.1552125215530396e-05, 1.284666359424591e-05, 1.4141201972961426e-05, 1.543574035167694e-05, 1.6730278730392456e-05, 1.802481710910797e-05, 1.9319355487823486e-05, 2.0613893866539e-05, 2.1908432245254517e-05, 2.3202970623970032e-05, 2.4497509002685547e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 4.0, 7.0, 4.0, 12.0, 17.0, 28.0, 25.0, 52.0, 73.0, 101.0, 153.0, 280.0, 398.0, 742.0, 1358.0, 2971.0, 8143.0, 35933.0, 418088.0, 521092.0, 43359.0, 8981.0, 3221.0, 1498.0, 789.0, 464.0, 256.0, 183.0, 93.0, 61.0, 51.0, 38.0, 32.0, 18.0, 7.0, 6.0, 4.0, 4.0, 1.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1060791015625, -0.1027688980102539, -0.09945869445800781, -0.09614849090576172, -0.09283828735351562, -0.08952808380126953, -0.08621788024902344, -0.08290767669677734, -0.07959747314453125, -0.07628726959228516, -0.07297706604003906, -0.06966686248779297, -0.06635665893554688, -0.06304645538330078, -0.05973625183105469, -0.056426048278808594, -0.0531158447265625, -0.049805641174316406, -0.04649543762207031, -0.04318523406982422, -0.039875030517578125, -0.03656482696533203, -0.03325462341308594, -0.029944419860839844, -0.02663421630859375, -0.023324012756347656, -0.020013809204101562, -0.01670360565185547, -0.013393402099609375, -0.010083198547363281, -0.0067729949951171875, -0.0034627914428710938, -0.000152587890625, 0.0031576156616210938, 0.0064678192138671875, 0.009778022766113281, 0.013088226318359375, 0.01639842987060547, 0.019708633422851562, 0.023018836975097656, 0.02632904052734375, 0.029639244079589844, 0.03294944763183594, 0.03625965118408203, 0.039569854736328125, 0.04288005828857422, 0.04619026184082031, 0.049500465393066406, 0.0528106689453125, 0.056120872497558594, 0.05943107604980469, 0.06274127960205078, 0.06605148315429688, 0.06936168670654297, 0.07267189025878906, 0.07598209381103516, 0.07929229736328125, 0.08260250091552734, 0.08591270446777344, 0.08922290802001953, 0.09253311157226562, 0.09584331512451172, 0.09915351867675781, 0.1024637222290039, 0.10577392578125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 0.0, 2.0, 3.0, 5.0, 9.0, 8.0, 13.0, 5.0, 17.0, 27.0, 26.0, 41.0, 45.0, 66.0, 90.0, 78.0, 84.0, 106.0, 89.0, 67.0, 48.0, 35.0, 33.0, 25.0, 19.0, 15.0, 17.0, 12.0, 5.0, 3.0, 1.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06634521484375, -0.06403923034667969, -0.061733245849609375, -0.05942726135253906, -0.05712127685546875, -0.05481529235839844, -0.052509307861328125, -0.05020332336425781, -0.0478973388671875, -0.04559135437011719, -0.043285369873046875, -0.04097938537597656, -0.03867340087890625, -0.03636741638183594, -0.034061431884765625, -0.03175544738769531, -0.029449462890625, -0.027143478393554688, -0.024837493896484375, -0.022531509399414062, -0.02022552490234375, -0.017919540405273438, -0.015613555908203125, -0.013307571411132812, -0.0110015869140625, -0.008695602416992188, -0.006389617919921875, -0.0040836334228515625, -0.00177764892578125, 0.0005283355712890625, 0.002834320068359375, 0.0051403045654296875, 0.0074462890625, 0.009752273559570312, 0.012058258056640625, 0.014364242553710938, 0.01667022705078125, 0.018976211547851562, 0.021282196044921875, 0.023588180541992188, 0.0258941650390625, 0.028200149536132812, 0.030506134033203125, 0.03281211853027344, 0.03511810302734375, 0.03742408752441406, 0.039730072021484375, 0.04203605651855469, 0.044342041015625, 0.04664802551269531, 0.048954010009765625, 0.05125999450683594, 0.05356597900390625, 0.05587196350097656, 0.058177947998046875, 0.06048393249511719, 0.0627899169921875, 0.06509590148925781, 0.06740188598632812, 0.06970787048339844, 0.07201385498046875, 0.07431983947753906, 0.07662582397460938, 0.07893180847167969, 0.08123779296875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 10.0, 10.0, 21.0, 46.0, 80.0, 117.0, 148.0, 149.0, 141.0, 110.0, 77.0, 45.0, 20.0, 13.0, 11.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0901665687561035, -1.0443147420883179, -0.9984630346298218, -0.9526112079620361, -0.9067594408988953, -0.8609076738357544, -0.8150558471679688, -0.7692040801048279, -0.723352313041687, -0.6775005459785461, -0.6316487789154053, -0.5857969522476196, -0.5399451851844788, -0.4940934181213379, -0.44824162125587463, -0.4023898243904114, -0.3565380573272705, -0.31068629026412964, -0.2648344933986664, -0.21898271143436432, -0.17313092947006226, -0.1272791475057602, -0.08142736554145813, -0.03557556867599487, 0.010276198387145996, 0.05612798035144806, 0.10197976231575012, 0.14783154428005219, 0.19368332624435425, 0.2395351082086563, 0.2853868901729584, 0.33123868703842163, 0.3770904541015625, 0.42294222116470337, 0.4687940180301666, 0.5146458148956299, 0.5604975819587708, 0.6063493490219116, 0.6522011756896973, 0.6980529427528381, 0.743904709815979, 0.7897564768791199, 0.8356082439422607, 0.8814600706100464, 0.9273118376731873, 0.9731636047363281, 1.0190154314041138, 1.0648672580718994, 1.1107189655303955, 1.1565707921981812, 1.2024224996566772, 1.248274326324463, 1.294126033782959, 1.3399778604507446, 1.3858296871185303, 1.4316813945770264, 1.477533221244812, 1.5233850479125977, 1.5692367553710938, 1.6150885820388794, 1.660940408706665, 1.7067921161651611, 1.7526439428329468, 1.7984957695007324, 1.8443474769592285]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 7.0, 8.0, 11.0, 9.0, 11.0, 14.0, 15.0, 30.0, 28.0, 28.0, 32.0, 54.0, 48.0, 52.0, 47.0, 61.0, 56.0, 66.0, 67.0, 49.0, 45.0, 37.0, 36.0, 30.0, 32.0, 26.0, 14.0, 18.0, 21.0, 15.0, 7.0, 17.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.1282103061676025, -1.0989480018615723, -1.0696858167648315, -1.0404235124588013, -1.0111613273620605, -0.9818990230560303, -0.9526367783546448, -0.9233745336532593, -0.894112229347229, -0.8648499846458435, -0.835587739944458, -0.8063254356384277, -0.7770631909370422, -0.7478009462356567, -0.7185387015342712, -0.6892764568328857, -0.6600141525268555, -0.63075190782547, -0.6014896631240845, -0.5722273588180542, -0.5429651141166687, -0.5137028694152832, -0.4844406247138977, -0.4551783502101898, -0.4259161353111267, -0.3966538906097412, -0.3673916161060333, -0.3381293714046478, -0.30886709690093994, -0.27960485219955444, -0.25034260749816895, -0.22108033299446106, -0.19181805849075317, -0.16255579888820648, -0.1332935392856598, -0.1040312871336937, -0.074769027531147, -0.04550677537918091, -0.016244515776634216, 0.013017743825912476, 0.04228000342845917, 0.07154226303100586, 0.10080452263355255, 0.13006678223609924, 0.15932902693748474, 0.18859128654003143, 0.21785354614257812, 0.24711580574512482, 0.2763780653476715, 0.305640310049057, 0.3349025845527649, 0.3641648292541504, 0.3934271037578583, 0.4226893484592438, 0.45195162296295166, 0.48121386766433716, 0.5104761123657227, 0.5397383570671082, 0.5690006017684937, 0.5982629060745239, 0.6275251507759094, 0.6567873954772949, 0.6860496401786804, 0.7153118848800659, 0.7445741891860962]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 12.0, 8.0, 9.0, 10.0, 23.0, 30.0, 46.0, 47.0, 76.0, 118.0, 167.0, 254.0, 401.0, 786.0, 1629.0, 4176.0, 18943.0, 4070729.0, 83403.0, 8365.0, 2461.0, 1055.0, 548.0, 346.0, 206.0, 128.0, 86.0, 66.0, 44.0, 31.0, 20.0, 17.0, 12.0, 9.0, 4.0, 5.0, 6.0, 2.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.315185546875, -0.30556488037109375, -0.2959442138671875, -0.28632354736328125, -0.276702880859375, -0.26708221435546875, -0.2574615478515625, -0.24784088134765625, -0.23822021484375, -0.22859954833984375, -0.2189788818359375, -0.20935821533203125, -0.199737548828125, -0.19011688232421875, -0.1804962158203125, -0.17087554931640625, -0.1612548828125, -0.15163421630859375, -0.1420135498046875, -0.13239288330078125, -0.122772216796875, -0.11315155029296875, -0.1035308837890625, -0.09391021728515625, -0.08428955078125, -0.07466888427734375, -0.0650482177734375, -0.05542755126953125, -0.045806884765625, -0.03618621826171875, -0.0265655517578125, -0.01694488525390625, -0.00732421875, 0.00229644775390625, 0.0119171142578125, 0.02153778076171875, 0.031158447265625, 0.04077911376953125, 0.0503997802734375, 0.06002044677734375, 0.06964111328125, 0.07926177978515625, 0.0888824462890625, 0.09850311279296875, 0.108123779296875, 0.11774444580078125, 0.1273651123046875, 0.13698577880859375, 0.1466064453125, 0.15622711181640625, 0.1658477783203125, 0.17546844482421875, 0.185089111328125, 0.19470977783203125, 0.2043304443359375, 0.21395111083984375, 0.22357177734375, 0.23319244384765625, 0.2428131103515625, 0.25243377685546875, 0.262054443359375, 0.27167510986328125, 0.2812957763671875, 0.29091644287109375, 0.300537109375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 6.0, 4.0, 5.0, 3.0, 8.0, 9.0, 13.0, 11.0, 25.0, 16.0, 26.0, 30.0, 43.0, 27.0, 41.0, 50.0, 53.0, 54.0, 46.0, 65.0, 57.0, 50.0, 43.0, 45.0, 43.0, 29.0, 41.0, 38.0, 20.0, 20.0, 18.0, 15.0, 13.0, 11.0, 10.0, 4.0, 5.0, 5.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.038726806640625, -0.037693023681640625, -0.03665924072265625, -0.035625457763671875, -0.0345916748046875, -0.033557891845703125, -0.03252410888671875, -0.031490325927734375, -0.03045654296875, -0.029422760009765625, -0.02838897705078125, -0.027355194091796875, -0.0263214111328125, -0.025287628173828125, -0.02425384521484375, -0.023220062255859375, -0.022186279296875, -0.021152496337890625, -0.02011871337890625, -0.019084930419921875, -0.0180511474609375, -0.017017364501953125, -0.01598358154296875, -0.014949798583984375, -0.013916015625, -0.012882232666015625, -0.01184844970703125, -0.010814666748046875, -0.0097808837890625, -0.008747100830078125, -0.00771331787109375, -0.006679534912109375, -0.005645751953125, -0.004611968994140625, -0.00357818603515625, -0.002544403076171875, -0.0015106201171875, -0.000476837158203125, 0.00055694580078125, 0.001590728759765625, 0.00262451171875, 0.003658294677734375, 0.00469207763671875, 0.005725860595703125, 0.0067596435546875, 0.007793426513671875, 0.00882720947265625, 0.009860992431640625, 0.010894775390625, 0.011928558349609375, 0.01296234130859375, 0.013996124267578125, 0.0150299072265625, 0.016063690185546875, 0.01709747314453125, 0.018131256103515625, 0.0191650390625, 0.020198822021484375, 0.02123260498046875, 0.022266387939453125, 0.0233001708984375, 0.024333953857421875, 0.02536773681640625, 0.026401519775390625, 0.027435302734375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 8.0, 9.0, 8.0, 10.0, 17.0, 20.0, 28.0, 42.0, 70.0, 98.0, 106.0, 133.0, 197.0, 328.0, 529.0, 832.0, 1451.0, 3059.0, 8172.0, 36818.0, 4028192.0, 93184.0, 12246.0, 4097.0, 1800.0, 963.0, 597.0, 372.0, 260.0, 185.0, 120.0, 83.0, 90.0, 60.0, 20.0, 21.0, 18.0, 17.0, 3.0, 8.0, 5.0, 5.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.270751953125, -0.261627197265625, -0.25250244140625, -0.243377685546875, -0.2342529296875, -0.225128173828125, -0.21600341796875, -0.206878662109375, -0.19775390625, -0.188629150390625, -0.17950439453125, -0.170379638671875, -0.1612548828125, -0.152130126953125, -0.14300537109375, -0.133880615234375, -0.124755859375, -0.115631103515625, -0.10650634765625, -0.097381591796875, -0.0882568359375, -0.079132080078125, -0.07000732421875, -0.060882568359375, -0.0517578125, -0.042633056640625, -0.03350830078125, -0.024383544921875, -0.0152587890625, -0.006134033203125, 0.00299072265625, 0.012115478515625, 0.021240234375, 0.030364990234375, 0.03948974609375, 0.048614501953125, 0.0577392578125, 0.066864013671875, 0.07598876953125, 0.085113525390625, 0.09423828125, 0.103363037109375, 0.11248779296875, 0.121612548828125, 0.1307373046875, 0.139862060546875, 0.14898681640625, 0.158111572265625, 0.167236328125, 0.176361083984375, 0.18548583984375, 0.194610595703125, 0.2037353515625, 0.212860107421875, 0.22198486328125, 0.231109619140625, 0.240234375, 0.249359130859375, 0.25848388671875, 0.267608642578125, 0.2767333984375, 0.285858154296875, 0.29498291015625, 0.304107666015625, 0.313232421875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 9.0, 2.0, 8.0, 13.0, 39.0, 95.0, 3152.0, 589.0, 77.0, 34.0, 15.0, 14.0, 11.0, 3.0, 3.0, 5.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0899658203125, -0.08759450912475586, -0.08522319793701172, -0.08285188674926758, -0.08048057556152344, -0.0781092643737793, -0.07573795318603516, -0.07336664199829102, -0.07099533081054688, -0.06862401962280273, -0.0662527084350586, -0.06388139724731445, -0.06151008605957031, -0.05913877487182617, -0.05676746368408203, -0.05439615249633789, -0.05202484130859375, -0.04965353012084961, -0.04728221893310547, -0.04491090774536133, -0.04253959655761719, -0.04016828536987305, -0.037796974182128906, -0.035425662994384766, -0.033054351806640625, -0.030683040618896484, -0.028311729431152344, -0.025940418243408203, -0.023569107055664062, -0.021197795867919922, -0.01882648468017578, -0.01645517349243164, -0.0140838623046875, -0.01171255111694336, -0.009341239929199219, -0.006969928741455078, -0.0045986175537109375, -0.002227306365966797, 0.00014400482177734375, 0.0025153160095214844, 0.004886627197265625, 0.007257938385009766, 0.009629249572753906, 0.012000560760498047, 0.014371871948242188, 0.016743183135986328, 0.01911449432373047, 0.02148580551147461, 0.02385711669921875, 0.02622842788696289, 0.02859973907470703, 0.030971050262451172, 0.03334236145019531, 0.03571367263793945, 0.038084983825683594, 0.040456295013427734, 0.042827606201171875, 0.045198917388916016, 0.047570228576660156, 0.0499415397644043, 0.05231285095214844, 0.05468416213989258, 0.05705547332763672, 0.05942678451538086, 0.061798095703125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 7.0, 10.0, 14.0, 18.0, 30.0, 43.0, 74.0, 103.0, 116.0, 143.0, 133.0, 84.0, 79.0, 49.0, 29.0, 29.0, 11.0, 7.0, 8.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18322843313217163, -0.17545722424983978, -0.16768601536750793, -0.15991482138633728, -0.15214361250400543, -0.14437240362167358, -0.13660119473934174, -0.1288299858570099, -0.12105877697467804, -0.11328756809234619, -0.10551636666059494, -0.09774515777826309, -0.08997394889593124, -0.08220274746417999, -0.07443153858184814, -0.0666603296995163, -0.058889128267765045, -0.051117923110723495, -0.04334671422839165, -0.0355755090713501, -0.0278043020516634, -0.0200330950319767, -0.01226188987493515, -0.004490680992603302, 0.0032805241644382477, 0.011051731184124947, 0.018822938203811646, 0.026594143360853195, 0.034365348517894745, 0.04213655740022659, 0.04990776255726814, 0.05767897143959999, 0.06545017659664154, 0.07322138547897339, 0.08099258691072464, 0.08876379579305649, 0.09653500467538834, 0.10430620610713959, 0.11207741498947144, 0.11984862387180328, 0.12761983275413513, 0.13539104163646698, 0.14316225051879883, 0.15093344449996948, 0.15870465338230133, 0.16647586226463318, 0.17424707114696503, 0.18201828002929688, 0.18978947401046753, 0.19756068289279938, 0.20533189177513123, 0.21310308575630188, 0.22087429463863373, 0.22864550352096558, 0.23641671240329742, 0.24418792128562927, 0.2519591450691223, 0.25973033905029297, 0.267501562833786, 0.27527275681495667, 0.2830439805984497, 0.29081517457962036, 0.298586368560791, 0.30635759234428406, 0.3141287863254547]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 11.0, 7.0, 12.0, 8.0, 13.0, 19.0, 18.0, 17.0, 19.0, 27.0, 28.0, 29.0, 33.0, 28.0, 34.0, 31.0, 41.0, 37.0, 36.0, 51.0, 40.0, 29.0, 33.0, 31.0, 31.0, 36.0, 35.0, 34.0, 29.0, 23.0, 23.0, 25.0, 21.0, 20.0, 14.0, 12.0, 16.0, 11.0, 6.0, 6.0, 6.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09320485591888428, -0.08998407423496246, -0.08676329255104065, -0.08354251086711884, -0.08032172918319702, -0.07710094749927521, -0.0738801583647728, -0.07065937668085098, -0.06743859499692917, -0.06421781331300735, -0.06099703162908554, -0.05777624621987343, -0.054555464535951614, -0.0513346828520298, -0.04811389744281769, -0.044893115758895874, -0.04167233407497406, -0.038451552391052246, -0.03523077070713043, -0.03200998529791832, -0.028789203613996506, -0.025568421930074692, -0.02234763838350773, -0.019126854836940765, -0.01590607315301895, -0.012685290537774563, -0.009464507922530174, -0.006243725307285786, -0.003022942692041397, 0.00019783899188041687, 0.00341862253844738, 0.006639406085014343, 0.009860187768936157, 0.013080970384180546, 0.016301752999424934, 0.019522536545991898, 0.02274331822991371, 0.025964099913835526, 0.02918488346040249, 0.03240566700696945, 0.035626448690891266, 0.03884723037481308, 0.042068012058734894, 0.045288797467947006, 0.04850957915186882, 0.051730360835790634, 0.05495114624500275, 0.05817192792892456, 0.061392709612846375, 0.06461349129676819, 0.06783427298069, 0.07105505466461182, 0.07427583634853363, 0.07749661803245544, 0.08071740716695786, 0.08393818885087967, 0.08715897053480148, 0.0903797522187233, 0.09360053390264511, 0.09682131558656693, 0.10004210472106934, 0.10326288640499115, 0.10648366808891296, 0.10970444977283478, 0.11292523145675659]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 4.0, 6.0, 3.0, 9.0, 14.0, 17.0, 31.0, 53.0, 69.0, 111.0, 220.0, 274.0, 510.0, 860.0, 1686.0, 3472.0, 6996.0, 15422.0, 34762.0, 81852.0, 181734.0, 294416.0, 229716.0, 110074.0, 47607.0, 20221.0, 9254.0, 4292.0, 2162.0, 1162.0, 582.0, 369.0, 207.0, 140.0, 89.0, 56.0, 37.0, 29.0, 5.0, 17.0, 10.0, 4.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0704345703125, -0.0683431625366211, -0.06625175476074219, -0.06416034698486328, -0.062068939208984375, -0.05997753143310547, -0.05788612365722656, -0.055794715881347656, -0.05370330810546875, -0.051611900329589844, -0.04952049255371094, -0.04742908477783203, -0.045337677001953125, -0.04324626922607422, -0.04115486145019531, -0.039063453674316406, -0.0369720458984375, -0.034880638122558594, -0.03278923034667969, -0.03069782257080078, -0.028606414794921875, -0.02651500701904297, -0.024423599243164062, -0.022332191467285156, -0.02024078369140625, -0.018149375915527344, -0.016057968139648438, -0.013966560363769531, -0.011875152587890625, -0.009783744812011719, -0.0076923370361328125, -0.005600929260253906, -0.003509521484375, -0.0014181137084960938, 0.0006732940673828125, 0.0027647018432617188, 0.004856109619140625, 0.006947517395019531, 0.009038925170898438, 0.011130332946777344, 0.01322174072265625, 0.015313148498535156, 0.017404556274414062, 0.01949596405029297, 0.021587371826171875, 0.02367877960205078, 0.025770187377929688, 0.027861595153808594, 0.0299530029296875, 0.032044410705566406, 0.03413581848144531, 0.03622722625732422, 0.038318634033203125, 0.04041004180908203, 0.04250144958496094, 0.044592857360839844, 0.04668426513671875, 0.048775672912597656, 0.05086708068847656, 0.05295848846435547, 0.055049896240234375, 0.05714130401611328, 0.05923271179199219, 0.061324119567871094, 0.06341552734375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 5.0, 11.0, 6.0, 16.0, 11.0, 15.0, 18.0, 14.0, 14.0, 18.0, 32.0, 32.0, 41.0, 28.0, 40.0, 48.0, 41.0, 59.0, 44.0, 38.0, 33.0, 39.0, 50.0, 42.0, 40.0, 43.0, 30.0, 27.0, 26.0, 31.0, 16.0, 13.0, 13.0, 18.0, 10.0, 10.0, 4.0, 2.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0290374755859375, -0.028041601181030273, -0.027045726776123047, -0.02604985237121582, -0.025053977966308594, -0.024058103561401367, -0.02306222915649414, -0.022066354751586914, -0.021070480346679688, -0.02007460594177246, -0.019078731536865234, -0.018082857131958008, -0.01708698272705078, -0.016091108322143555, -0.015095233917236328, -0.014099359512329102, -0.013103485107421875, -0.012107610702514648, -0.011111736297607422, -0.010115861892700195, -0.009119987487792969, -0.008124113082885742, -0.007128238677978516, -0.006132364273071289, -0.0051364898681640625, -0.004140615463256836, -0.0031447410583496094, -0.002148866653442383, -0.0011529922485351562, -0.0001571178436279297, 0.0008387565612792969, 0.0018346309661865234, 0.00283050537109375, 0.0038263797760009766, 0.004822254180908203, 0.00581812858581543, 0.006814002990722656, 0.007809877395629883, 0.00880575180053711, 0.009801626205444336, 0.010797500610351562, 0.011793375015258789, 0.012789249420166016, 0.013785123825073242, 0.014780998229980469, 0.015776872634887695, 0.016772747039794922, 0.01776862144470215, 0.018764495849609375, 0.0197603702545166, 0.020756244659423828, 0.021752119064331055, 0.02274799346923828, 0.023743867874145508, 0.024739742279052734, 0.02573561668395996, 0.026731491088867188, 0.027727365493774414, 0.02872323989868164, 0.029719114303588867, 0.030714988708496094, 0.03171086311340332, 0.03270673751831055, 0.03370261192321777, 0.034698486328125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 2.0, 2.0, 5.0, 6.0, 3.0, 7.0, 13.0, 15.0, 28.0, 30.0, 73.0, 79.0, 133.0, 191.0, 297.0, 473.0, 921.0, 1932.0, 5059.0, 17124.0, 83425.0, 495341.0, 364175.0, 58743.0, 12624.0, 4112.0, 1655.0, 800.0, 442.0, 272.0, 188.0, 101.0, 89.0, 49.0, 33.0, 28.0, 25.0, 12.0, 20.0, 7.0, 5.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.141357421875, -0.1374197006225586, -0.1334819793701172, -0.12954425811767578, -0.12560653686523438, -0.12166881561279297, -0.11773109436035156, -0.11379337310791016, -0.10985565185546875, -0.10591793060302734, -0.10198020935058594, -0.09804248809814453, -0.09410476684570312, -0.09016704559326172, -0.08622932434082031, -0.0822916030883789, -0.0783538818359375, -0.0744161605834961, -0.07047843933105469, -0.06654071807861328, -0.06260299682617188, -0.05866527557373047, -0.05472755432128906, -0.050789833068847656, -0.04685211181640625, -0.042914390563964844, -0.03897666931152344, -0.03503894805908203, -0.031101226806640625, -0.02716350555419922, -0.023225784301757812, -0.019288063049316406, -0.015350341796875, -0.011412620544433594, -0.0074748992919921875, -0.0035371780395507812, 0.000400543212890625, 0.004338264465332031, 0.008275985717773438, 0.012213706970214844, 0.01615142822265625, 0.020089149475097656, 0.024026870727539062, 0.02796459197998047, 0.031902313232421875, 0.03584003448486328, 0.03977775573730469, 0.043715476989746094, 0.0476531982421875, 0.051590919494628906, 0.05552864074707031, 0.05946636199951172, 0.06340408325195312, 0.06734180450439453, 0.07127952575683594, 0.07521724700927734, 0.07915496826171875, 0.08309268951416016, 0.08703041076660156, 0.09096813201904297, 0.09490585327148438, 0.09884357452392578, 0.10278129577636719, 0.1067190170288086, 0.11065673828125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 2.0, 6.0, 3.0, 8.0, 3.0, 12.0, 10.0, 13.0, 14.0, 13.0, 22.0, 33.0, 28.0, 32.0, 21.0, 34.0, 47.0, 31.0, 48.0, 60.0, 60.0, 50.0, 45.0, 58.0, 36.0, 35.0, 23.0, 33.0, 31.0, 32.0, 25.0, 29.0, 18.0, 15.0, 17.0, 12.0, 13.0, 9.0, 4.0, 5.0, 4.0, 5.0, 2.0, 1.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1376953125, -0.13295745849609375, -0.1282196044921875, -0.12348175048828125, -0.118743896484375, -0.11400604248046875, -0.1092681884765625, -0.10453033447265625, -0.09979248046875, -0.09505462646484375, -0.0903167724609375, -0.08557891845703125, -0.080841064453125, -0.07610321044921875, -0.0713653564453125, -0.06662750244140625, -0.0618896484375, -0.05715179443359375, -0.0524139404296875, -0.04767608642578125, -0.042938232421875, -0.03820037841796875, -0.0334625244140625, -0.02872467041015625, -0.02398681640625, -0.01924896240234375, -0.0145111083984375, -0.00977325439453125, -0.005035400390625, -0.00029754638671875, 0.0044403076171875, 0.00917816162109375, 0.013916015625, 0.01865386962890625, 0.0233917236328125, 0.02812957763671875, 0.032867431640625, 0.03760528564453125, 0.0423431396484375, 0.04708099365234375, 0.05181884765625, 0.05655670166015625, 0.0612945556640625, 0.06603240966796875, 0.070770263671875, 0.07550811767578125, 0.0802459716796875, 0.08498382568359375, 0.0897216796875, 0.09445953369140625, 0.0991973876953125, 0.10393524169921875, 0.108673095703125, 0.11341094970703125, 0.1181488037109375, 0.12288665771484375, 0.12762451171875, 0.13236236572265625, 0.1371002197265625, 0.14183807373046875, 0.146575927734375, 0.15131378173828125, 0.1560516357421875, 0.16078948974609375, 0.16552734375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 6.0, 3.0, 5.0, 9.0, 9.0, 15.0, 20.0, 28.0, 48.0, 74.0, 149.0, 301.0, 781.0, 3271.0, 27469.0, 858417.0, 148013.0, 7556.0, 1449.0, 439.0, 213.0, 112.0, 53.0, 29.0, 21.0, 13.0, 13.0, 8.0, 5.0, 4.0, 9.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1849365234375, -0.1801614761352539, -0.1753864288330078, -0.17061138153076172, -0.16583633422851562, -0.16106128692626953, -0.15628623962402344, -0.15151119232177734, -0.14673614501953125, -0.14196109771728516, -0.13718605041503906, -0.13241100311279297, -0.12763595581054688, -0.12286090850830078, -0.11808586120605469, -0.1133108139038086, -0.1085357666015625, -0.1037607192993164, -0.09898567199707031, -0.09421062469482422, -0.08943557739257812, -0.08466053009033203, -0.07988548278808594, -0.07511043548583984, -0.07033538818359375, -0.06556034088134766, -0.06078529357910156, -0.05601024627685547, -0.051235198974609375, -0.04646015167236328, -0.04168510437011719, -0.036910057067871094, -0.032135009765625, -0.027359962463378906, -0.022584915161132812, -0.01780986785888672, -0.013034820556640625, -0.008259773254394531, -0.0034847259521484375, 0.0012903213500976562, 0.00606536865234375, 0.010840415954589844, 0.015615463256835938, 0.02039051055908203, 0.025165557861328125, 0.02994060516357422, 0.03471565246582031, 0.039490699768066406, 0.0442657470703125, 0.049040794372558594, 0.05381584167480469, 0.05859088897705078, 0.06336593627929688, 0.06814098358154297, 0.07291603088378906, 0.07769107818603516, 0.08246612548828125, 0.08724117279052734, 0.09201622009277344, 0.09679126739501953, 0.10156631469726562, 0.10634136199951172, 0.11111640930175781, 0.1158914566040039, 0.12066650390625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 7.0, 16.0, 13.0, 24.0, 29.0, 26.0, 50.0, 51.0, 77.0, 73.0, 93.0, 76.0, 78.0, 67.0, 69.0, 39.0, 34.0, 37.0, 22.0, 24.0, 13.0, 25.0, 11.0, 13.0, 9.0, 3.0, 5.0, 5.0, 2.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.300739288330078e-05, -2.2184103727340698e-05, -2.1360814571380615e-05, -2.0537525415420532e-05, -1.971423625946045e-05, -1.8890947103500366e-05, -1.8067657947540283e-05, -1.72443687915802e-05, -1.6421079635620117e-05, -1.5597790479660034e-05, -1.4774501323699951e-05, -1.3951212167739868e-05, -1.3127923011779785e-05, -1.2304633855819702e-05, -1.1481344699859619e-05, -1.0658055543899536e-05, -9.834766387939453e-06, -9.01147723197937e-06, -8.188188076019287e-06, -7.364898920059204e-06, -6.541609764099121e-06, -5.718320608139038e-06, -4.895031452178955e-06, -4.071742296218872e-06, -3.248453140258789e-06, -2.425163984298706e-06, -1.601874828338623e-06, -7.7858567237854e-07, 4.470348358154297e-08, 8.67992639541626e-07, 1.691281795501709e-06, 2.514570951461792e-06, 3.337860107421875e-06, 4.161149263381958e-06, 4.984438419342041e-06, 5.807727575302124e-06, 6.631016731262207e-06, 7.45430588722229e-06, 8.277595043182373e-06, 9.100884199142456e-06, 9.924173355102539e-06, 1.0747462511062622e-05, 1.1570751667022705e-05, 1.2394040822982788e-05, 1.3217329978942871e-05, 1.4040619134902954e-05, 1.4863908290863037e-05, 1.568719744682312e-05, 1.6510486602783203e-05, 1.7333775758743286e-05, 1.815706491470337e-05, 1.8980354070663452e-05, 1.9803643226623535e-05, 2.0626932382583618e-05, 2.14502215385437e-05, 2.2273510694503784e-05, 2.3096799850463867e-05, 2.392008900642395e-05, 2.4743378162384033e-05, 2.5566667318344116e-05, 2.63899564743042e-05, 2.7213245630264282e-05, 2.8036534786224365e-05, 2.8859823942184448e-05, 2.968311309814453e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 7.0, 6.0, 7.0, 8.0, 19.0, 28.0, 30.0, 38.0, 76.0, 135.0, 202.0, 345.0, 725.0, 1524.0, 3858.0, 12858.0, 83399.0, 687958.0, 223287.0, 23869.0, 5943.0, 2121.0, 974.0, 470.0, 234.0, 126.0, 90.0, 78.0, 33.0, 31.0, 16.0, 8.0, 17.0, 8.0, 7.0, 5.0, 4.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.08917236328125, -0.08635902404785156, -0.08354568481445312, -0.08073234558105469, -0.07791900634765625, -0.07510566711425781, -0.07229232788085938, -0.06947898864746094, -0.0666656494140625, -0.06385231018066406, -0.061038970947265625, -0.05822563171386719, -0.05541229248046875, -0.05259895324707031, -0.049785614013671875, -0.04697227478027344, -0.044158935546875, -0.04134559631347656, -0.038532257080078125, -0.03571891784667969, -0.03290557861328125, -0.030092239379882812, -0.027278900146484375, -0.024465560913085938, -0.0216522216796875, -0.018838882446289062, -0.016025543212890625, -0.013212203979492188, -0.01039886474609375, -0.0075855255126953125, -0.004772186279296875, -0.0019588470458984375, 0.0008544921875, 0.0036678314208984375, 0.006481170654296875, 0.009294509887695312, 0.01210784912109375, 0.014921188354492188, 0.017734527587890625, 0.020547866821289062, 0.0233612060546875, 0.026174545288085938, 0.028987884521484375, 0.03180122375488281, 0.03461456298828125, 0.03742790222167969, 0.040241241455078125, 0.04305458068847656, 0.045867919921875, 0.04868125915527344, 0.051494598388671875, 0.05430793762207031, 0.05712127685546875, 0.05993461608886719, 0.06274795532226562, 0.06556129455566406, 0.0683746337890625, 0.07118797302246094, 0.07400131225585938, 0.07681465148925781, 0.07962799072265625, 0.08244132995605469, 0.08525466918945312, 0.08806800842285156, 0.09088134765625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 1.0, 3.0, 5.0, 6.0, 7.0, 9.0, 23.0, 36.0, 67.0, 116.0, 134.0, 150.0, 162.0, 104.0, 69.0, 45.0, 27.0, 13.0, 12.0, 7.0, 3.0, 5.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1597900390625, -0.15594959259033203, -0.15210914611816406, -0.1482686996459961, -0.14442825317382812, -0.14058780670166016, -0.1367473602294922, -0.13290691375732422, -0.12906646728515625, -0.12522602081298828, -0.12138557434082031, -0.11754512786865234, -0.11370468139648438, -0.1098642349243164, -0.10602378845214844, -0.10218334197998047, -0.0983428955078125, -0.09450244903564453, -0.09066200256347656, -0.0868215560913086, -0.08298110961914062, -0.07914066314697266, -0.07530021667480469, -0.07145977020263672, -0.06761932373046875, -0.06377887725830078, -0.05993843078613281, -0.056097984313964844, -0.052257537841796875, -0.048417091369628906, -0.04457664489746094, -0.04073619842529297, -0.036895751953125, -0.03305530548095703, -0.029214859008789062, -0.025374412536621094, -0.021533966064453125, -0.017693519592285156, -0.013853073120117188, -0.010012626647949219, -0.00617218017578125, -0.0023317337036132812, 0.0015087127685546875, 0.005349159240722656, 0.009189605712890625, 0.013030052185058594, 0.016870498657226562, 0.02071094512939453, 0.0245513916015625, 0.02839183807373047, 0.03223228454589844, 0.036072731018066406, 0.039913177490234375, 0.043753623962402344, 0.04759407043457031, 0.05143451690673828, 0.05527496337890625, 0.05911540985107422, 0.06295585632324219, 0.06679630279541016, 0.07063674926757812, 0.0744771957397461, 0.07831764221191406, 0.08215808868408203, 0.08599853515625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 7.0, 25.0, 60.0, 186.0, 271.0, 257.0, 143.0, 31.0, 15.0, 6.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0014524459838867, -0.9235528111457825, -0.8456531763076782, -0.7677536010742188, -0.6898539662361145, -0.6119543313980103, -0.5340547561645508, -0.45615512132644653, -0.3782554864883423, -0.30035585165023804, -0.22245624661445618, -0.14455662667751312, -0.06665700674057007, 0.01124262809753418, 0.08914223313331604, 0.1670418381690979, 0.24494147300720215, 0.3228411078453064, 0.40074071288108826, 0.4786403179168701, 0.5565399527549744, 0.6344395875930786, 0.7123391628265381, 0.7902387976646423, 0.8681384325027466, 0.9460380673408508, 1.023937702178955, 1.1018372774124146, 1.179736852645874, 1.257636547088623, 1.3355361223220825, 1.413435697555542, 1.491335153579712, 1.5692347288131714, 1.6471344232559204, 1.7250339984893799, 1.802933692932129, 1.8808332681655884, 1.9587328433990479, 2.036632537841797, 2.114531993865967, 2.192431688308716, 2.2703311443328857, 2.3482308387756348, 2.426130533218384, 2.504030227661133, 2.5819296836853027, 2.6598293781280518, 2.737729072570801, 2.81562876701355, 2.8935282230377197, 2.9714279174804688, 3.0493276119232178, 3.127227306365967, 3.2051267623901367, 3.2830264568328857, 3.3609261512756348, 3.438825845718384, 3.5167253017425537, 3.5946249961853027, 3.6725246906280518, 3.750424385070801, 3.8283238410949707, 3.9062235355377197, 3.9841229915618896]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 7.0, 11.0, 8.0, 13.0, 13.0, 14.0, 15.0, 22.0, 32.0, 34.0, 32.0, 34.0, 42.0, 42.0, 47.0, 55.0, 59.0, 49.0, 44.0, 48.0, 55.0, 38.0, 38.0, 41.0, 34.0, 33.0, 33.0, 13.0, 18.0, 11.0, 19.0, 9.0, 9.0, 8.0, 7.0, 6.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8185887336730957, -0.794086217880249, -0.7695837616920471, -0.7450812458992004, -0.7205787897109985, -0.6960762739181519, -0.6715737581253052, -0.6470712423324585, -0.6225687861442566, -0.5980662703514099, -0.573563814163208, -0.5490612983703613, -0.5245587825775146, -0.5000563263893127, -0.47555381059646606, -0.4510513246059418, -0.4265488386154175, -0.4020463526248932, -0.3775438666343689, -0.3530413508415222, -0.3285388648509979, -0.30403637886047363, -0.27953386306762695, -0.25503137707710266, -0.23052889108657837, -0.20602640509605408, -0.1815239042043686, -0.1570214033126831, -0.1325189173221588, -0.10801642388105392, -0.08351393043994904, -0.05901142954826355, -0.03450888395309448, -0.010006390511989594, 0.014496102929115295, 0.038998596370220184, 0.06350108981132507, 0.08800358325242996, 0.11250607669353485, 0.13700857758522034, 0.16151106357574463, 0.18601354956626892, 0.2105160504579544, 0.2350185513496399, 0.2595210373401642, 0.2840235233306885, 0.30852603912353516, 0.33302852511405945, 0.35753101110458374, 0.38203349709510803, 0.4065359830856323, 0.431038498878479, 0.4555409848690033, 0.4800434708595276, 0.5045459866523743, 0.5290484428405762, 0.5535509586334229, 0.5780534744262695, 0.6025559306144714, 0.6270584464073181, 0.65156090259552, 0.6760634183883667, 0.7005659341812134, 0.7250684499740601, 0.749570906162262]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 2.0, 6.0, 5.0, 5.0, 8.0, 23.0, 29.0, 50.0, 49.0, 104.0, 150.0, 274.0, 354.0, 684.0, 1150.0, 2496.0, 6454.0, 44672.0, 4113567.0, 15875.0, 4160.0, 1798.0, 940.0, 526.0, 332.0, 174.0, 120.0, 105.0, 61.0, 42.0, 24.0, 12.0, 11.0, 10.0, 7.0, 7.0, 5.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.185546875, -0.17722702026367188, -0.16890716552734375, -0.16058731079101562, -0.1522674560546875, -0.14394760131835938, -0.13562774658203125, -0.12730789184570312, -0.118988037109375, -0.11066818237304688, -0.10234832763671875, -0.09402847290039062, -0.0857086181640625, -0.07738876342773438, -0.06906890869140625, -0.060749053955078125, -0.05242919921875, -0.044109344482421875, -0.03578948974609375, -0.027469635009765625, -0.0191497802734375, -0.010829925537109375, -0.00251007080078125, 0.005809783935546875, 0.014129638671875, 0.022449493408203125, 0.03076934814453125, 0.039089202880859375, 0.0474090576171875, 0.055728912353515625, 0.06404876708984375, 0.07236862182617188, 0.0806884765625, 0.08900833129882812, 0.09732818603515625, 0.10564804077148438, 0.1139678955078125, 0.12228775024414062, 0.13060760498046875, 0.13892745971679688, 0.147247314453125, 0.15556716918945312, 0.16388702392578125, 0.17220687866210938, 0.1805267333984375, 0.18884658813476562, 0.19716644287109375, 0.20548629760742188, 0.21380615234375, 0.22212600708007812, 0.23044586181640625, 0.23876571655273438, 0.2470855712890625, 0.2554054260253906, 0.26372528076171875, 0.2720451354980469, 0.280364990234375, 0.2886848449707031, 0.29700469970703125, 0.3053245544433594, 0.3136444091796875, 0.3219642639160156, 0.33028411865234375, 0.3386039733886719, 0.346923828125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 7.0, 10.0, 15.0, 15.0, 21.0, 23.0, 27.0, 35.0, 31.0, 33.0, 39.0, 42.0, 54.0, 48.0, 45.0, 44.0, 49.0, 40.0, 49.0, 49.0, 46.0, 36.0, 34.0, 34.0, 30.0, 26.0, 22.0, 10.0, 12.0, 9.0, 18.0, 7.0, 6.0, 6.0, 9.0, 0.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.038330078125, -0.03719615936279297, -0.03606224060058594, -0.034928321838378906, -0.033794403076171875, -0.032660484313964844, -0.03152656555175781, -0.03039264678955078, -0.02925872802734375, -0.02812480926513672, -0.026990890502929688, -0.025856971740722656, -0.024723052978515625, -0.023589134216308594, -0.022455215454101562, -0.02132129669189453, -0.0201873779296875, -0.01905345916748047, -0.017919540405273438, -0.016785621643066406, -0.015651702880859375, -0.014517784118652344, -0.013383865356445312, -0.012249946594238281, -0.01111602783203125, -0.009982109069824219, -0.008848190307617188, -0.007714271545410156, -0.006580352783203125, -0.005446434020996094, -0.0043125152587890625, -0.0031785964965820312, -0.002044677734375, -0.0009107589721679688, 0.0002231597900390625, 0.0013570785522460938, 0.002490997314453125, 0.0036249160766601562, 0.0047588348388671875, 0.005892753601074219, 0.00702667236328125, 0.008160591125488281, 0.009294509887695312, 0.010428428649902344, 0.011562347412109375, 0.012696266174316406, 0.013830184936523438, 0.014964103698730469, 0.0160980224609375, 0.01723194122314453, 0.018365859985351562, 0.019499778747558594, 0.020633697509765625, 0.021767616271972656, 0.022901535034179688, 0.02403545379638672, 0.02516937255859375, 0.02630329132080078, 0.027437210083007812, 0.028571128845214844, 0.029705047607421875, 0.030838966369628906, 0.03197288513183594, 0.03310680389404297, 0.03424072265625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 5.0, 8.0, 7.0, 6.0, 9.0, 12.0, 27.0, 20.0, 22.0, 42.0, 61.0, 80.0, 110.0, 143.0, 180.0, 308.0, 546.0, 998.0, 3132.0, 100561.0, 4081016.0, 4114.0, 1182.0, 603.0, 315.0, 223.0, 148.0, 101.0, 76.0, 60.0, 36.0, 42.0, 23.0, 14.0, 8.0, 9.0, 10.0, 9.0, 2.0, 2.0, 2.0, 1.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.79296875, -0.7697067260742188, -0.7464447021484375, -0.7231826782226562, -0.699920654296875, -0.6766586303710938, -0.6533966064453125, -0.6301345825195312, -0.60687255859375, -0.5836105346679688, -0.5603485107421875, -0.5370864868164062, -0.513824462890625, -0.49056243896484375, -0.4673004150390625, -0.44403839111328125, -0.4207763671875, -0.39751434326171875, -0.3742523193359375, -0.35099029541015625, -0.327728271484375, -0.30446624755859375, -0.2812042236328125, -0.25794219970703125, -0.23468017578125, -0.21141815185546875, -0.1881561279296875, -0.16489410400390625, -0.141632080078125, -0.11837005615234375, -0.0951080322265625, -0.07184600830078125, -0.048583984375, -0.02532196044921875, -0.0020599365234375, 0.02120208740234375, 0.044464111328125, 0.06772613525390625, 0.0909881591796875, 0.11425018310546875, 0.13751220703125, 0.16077423095703125, 0.1840362548828125, 0.20729827880859375, 0.230560302734375, 0.25382232666015625, 0.2770843505859375, 0.30034637451171875, 0.3236083984375, 0.34687042236328125, 0.3701324462890625, 0.39339447021484375, 0.416656494140625, 0.43991851806640625, 0.4631805419921875, 0.48644256591796875, 0.50970458984375, 0.5329666137695312, 0.5562286376953125, 0.5794906616210938, 0.602752685546875, 0.6260147094726562, 0.6492767333984375, 0.6725387573242188, 0.69580078125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 8.0, 15.0, 102.0, 3884.0, 52.0, 11.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.169921875, -0.16414642333984375, -0.1583709716796875, -0.15259552001953125, -0.146820068359375, -0.14104461669921875, -0.1352691650390625, -0.12949371337890625, -0.12371826171875, -0.11794281005859375, -0.1121673583984375, -0.10639190673828125, -0.100616455078125, -0.09484100341796875, -0.0890655517578125, -0.08329010009765625, -0.0775146484375, -0.07173919677734375, -0.0659637451171875, -0.06018829345703125, -0.054412841796875, -0.04863739013671875, -0.0428619384765625, -0.03708648681640625, -0.03131103515625, -0.02553558349609375, -0.0197601318359375, -0.01398468017578125, -0.008209228515625, -0.00243377685546875, 0.0033416748046875, 0.00911712646484375, 0.014892578125, 0.02066802978515625, 0.0264434814453125, 0.03221893310546875, 0.037994384765625, 0.04376983642578125, 0.0495452880859375, 0.05532073974609375, 0.06109619140625, 0.06687164306640625, 0.0726470947265625, 0.07842254638671875, 0.084197998046875, 0.08997344970703125, 0.0957489013671875, 0.10152435302734375, 0.1072998046875, 0.11307525634765625, 0.1188507080078125, 0.12462615966796875, 0.130401611328125, 0.13617706298828125, 0.1419525146484375, 0.14772796630859375, 0.15350341796875, 0.15927886962890625, 0.1650543212890625, 0.17082977294921875, 0.176605224609375, 0.18238067626953125, 0.1881561279296875, 0.19393157958984375, 0.19970703125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 6.0, 8.0, 13.0, 20.0, 19.0, 19.0, 36.0, 53.0, 76.0, 81.0, 108.0, 108.0, 102.0, 96.0, 75.0, 47.0, 31.0, 29.0, 22.0, 14.0, 6.0, 10.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2450229972600937, -0.23755328357219696, -0.23008356988430023, -0.2226138710975647, -0.21514415740966797, -0.20767444372177124, -0.2002047300338745, -0.19273501634597778, -0.18526530265808105, -0.17779558897018433, -0.1703258752822876, -0.16285616159439087, -0.15538646280765533, -0.1479167491197586, -0.14044703543186188, -0.13297732174396515, -0.12550762295722961, -0.11803790926933289, -0.11056820303201675, -0.10309848934412003, -0.0956287831068039, -0.08815906941890717, -0.08068935573101044, -0.07321964204311371, -0.06574993580579758, -0.05828022584319115, -0.05081051588058472, -0.04334080219268799, -0.03587109223008156, -0.028401382267475128, -0.0209316685795784, -0.01346195861697197, -0.005992233753204346, 0.001477477140724659, 0.008947188034653664, 0.016416899859905243, 0.023886609822511673, 0.0313563197851181, 0.03882603347301483, 0.04629574343562126, 0.05376545339822769, 0.06123516336083412, 0.06870487332344055, 0.07617458701133728, 0.08364430069923401, 0.09111400693655014, 0.09858372062444687, 0.106053426861763, 0.11352314054965973, 0.12099285423755646, 0.12846256792545319, 0.13593226671218872, 0.14340198040008545, 0.15087169408798218, 0.1583414077758789, 0.16581112146377563, 0.17328083515167236, 0.1807505488395691, 0.18822026252746582, 0.19568997621536255, 0.20315967500209808, 0.2106293886899948, 0.21809910237789154, 0.22556881606578827, 0.2330385148525238]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 4.0, 2.0, 3.0, 4.0, 9.0, 7.0, 9.0, 10.0, 13.0, 18.0, 17.0, 20.0, 22.0, 28.0, 27.0, 28.0, 34.0, 33.0, 39.0, 41.0, 30.0, 34.0, 50.0, 36.0, 37.0, 44.0, 25.0, 33.0, 28.0, 43.0, 34.0, 27.0, 45.0, 17.0, 14.0, 15.0, 23.0, 19.0, 16.0, 15.0, 11.0, 6.0, 7.0, 5.0, 4.0, 5.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.1370716094970703, -0.1327364295721054, -0.1284012496471405, -0.1240660548210144, -0.1197308748960495, -0.1153956949710846, -0.11106050759553909, -0.10672532021999359, -0.10239014029502869, -0.09805496037006378, -0.09371977299451828, -0.08938458561897278, -0.08504940569400787, -0.08071422576904297, -0.07637903839349747, -0.07204385101795197, -0.06770867109298706, -0.06337349116802216, -0.059038303792476654, -0.05470312014222145, -0.05036793649196625, -0.046032752841711044, -0.04169756919145584, -0.03736238554120064, -0.033027201890945435, -0.02869201824069023, -0.024356834590435028, -0.020021650940179825, -0.01568646728992462, -0.011351283639669418, -0.007016099989414215, -0.002680916339159012, 0.0016542673110961914, 0.005989450961351395, 0.010324634611606598, 0.014659818261861801, 0.018995001912117004, 0.023330185562372208, 0.02766536921262741, 0.032000552862882614, 0.03633573651313782, 0.04067092016339302, 0.045006103813648224, 0.04934128746390343, 0.05367647111415863, 0.058011654764413834, 0.06234683841466904, 0.06668202579021454, 0.07101720571517944, 0.07535238564014435, 0.07968757301568985, 0.08402276039123535, 0.08835794031620026, 0.09269312024116516, 0.09702830761671066, 0.10136349499225616, 0.10569867491722107, 0.11003385484218597, 0.11436904221773148, 0.11870422959327698, 0.12303940951824188, 0.1273745894432068, 0.13170978426933289, 0.1360449641942978, 0.1403801441192627]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 9.0, 7.0, 4.0, 12.0, 10.0, 16.0, 30.0, 27.0, 41.0, 68.0, 100.0, 111.0, 227.0, 307.0, 444.0, 737.0, 1164.0, 2096.0, 3855.0, 7274.0, 15459.0, 35350.0, 88218.0, 227783.0, 354865.0, 183161.0, 70951.0, 29045.0, 12859.0, 6291.0, 3163.0, 1853.0, 1048.0, 693.0, 416.0, 284.0, 167.0, 109.0, 77.0, 56.0, 50.0, 30.0, 33.0, 16.0, 7.0, 8.0, 7.0, 2.0, 3.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 3.0], "bins": [-0.07763671875, -0.07516288757324219, -0.07268905639648438, -0.07021522521972656, -0.06774139404296875, -0.06526756286621094, -0.06279373168945312, -0.06031990051269531, -0.0578460693359375, -0.05537223815917969, -0.052898406982421875, -0.05042457580566406, -0.04795074462890625, -0.04547691345214844, -0.043003082275390625, -0.04052925109863281, -0.038055419921875, -0.03558158874511719, -0.033107757568359375, -0.030633926391601562, -0.02816009521484375, -0.025686264038085938, -0.023212432861328125, -0.020738601684570312, -0.0182647705078125, -0.015790939331054688, -0.013317108154296875, -0.010843276977539062, -0.00836944580078125, -0.0058956146240234375, -0.003421783447265625, -0.0009479522705078125, 0.00152587890625, 0.0039997100830078125, 0.006473541259765625, 0.008947372436523438, 0.01142120361328125, 0.013895034790039062, 0.016368865966796875, 0.018842697143554688, 0.0213165283203125, 0.023790359497070312, 0.026264190673828125, 0.028738021850585938, 0.03121185302734375, 0.03368568420410156, 0.036159515380859375, 0.03863334655761719, 0.041107177734375, 0.04358100891113281, 0.046054840087890625, 0.04852867126464844, 0.05100250244140625, 0.05347633361816406, 0.055950164794921875, 0.05842399597167969, 0.0608978271484375, 0.06337165832519531, 0.06584548950195312, 0.06831932067871094, 0.07079315185546875, 0.07326698303222656, 0.07574081420898438, 0.07821464538574219, 0.0806884765625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 7.0, 0.0, 6.0, 6.0, 5.0, 6.0, 9.0, 15.0, 15.0, 12.0, 16.0, 16.0, 20.0, 12.0, 28.0, 36.0, 41.0, 33.0, 32.0, 39.0, 29.0, 49.0, 47.0, 31.0, 53.0, 46.0, 49.0, 43.0, 46.0, 35.0, 28.0, 23.0, 27.0, 19.0, 16.0, 19.0, 12.0, 12.0, 14.0, 12.0, 10.0, 9.0, 4.0, 8.0, 4.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.040313720703125, -0.03911113739013672, -0.03790855407714844, -0.036705970764160156, -0.035503387451171875, -0.034300804138183594, -0.03309822082519531, -0.03189563751220703, -0.03069305419921875, -0.02949047088623047, -0.028287887573242188, -0.027085304260253906, -0.025882720947265625, -0.024680137634277344, -0.023477554321289062, -0.02227497100830078, -0.0210723876953125, -0.01986980438232422, -0.018667221069335938, -0.017464637756347656, -0.016262054443359375, -0.015059471130371094, -0.013856887817382812, -0.012654304504394531, -0.01145172119140625, -0.010249137878417969, -0.009046554565429688, -0.007843971252441406, -0.006641387939453125, -0.005438804626464844, -0.0042362213134765625, -0.0030336380004882812, -0.0018310546875, -0.0006284713745117188, 0.0005741119384765625, 0.0017766952514648438, 0.002979278564453125, 0.004181861877441406, 0.0053844451904296875, 0.006587028503417969, 0.00778961181640625, 0.008992195129394531, 0.010194778442382812, 0.011397361755371094, 0.012599945068359375, 0.013802528381347656, 0.015005111694335938, 0.01620769500732422, 0.0174102783203125, 0.01861286163330078, 0.019815444946289062, 0.021018028259277344, 0.022220611572265625, 0.023423194885253906, 0.024625778198242188, 0.02582836151123047, 0.02703094482421875, 0.02823352813720703, 0.029436111450195312, 0.030638694763183594, 0.031841278076171875, 0.033043861389160156, 0.03424644470214844, 0.03544902801513672, 0.036651611328125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 2.0, 3.0, 3.0, 11.0, 8.0, 14.0, 14.0, 27.0, 32.0, 39.0, 69.0, 89.0, 118.0, 198.0, 242.0, 443.0, 796.0, 1635.0, 4440.0, 16215.0, 95027.0, 684233.0, 206016.0, 27455.0, 6563.0, 2296.0, 1015.0, 526.0, 327.0, 215.0, 157.0, 98.0, 68.0, 49.0, 36.0, 27.0, 14.0, 11.0, 9.0, 7.0, 4.0, 1.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1624755859375, -0.1577892303466797, -0.15310287475585938, -0.14841651916503906, -0.14373016357421875, -0.13904380798339844, -0.13435745239257812, -0.1296710968017578, -0.1249847412109375, -0.12029838562011719, -0.11561203002929688, -0.11092567443847656, -0.10623931884765625, -0.10155296325683594, -0.09686660766601562, -0.09218025207519531, -0.087493896484375, -0.08280754089355469, -0.07812118530273438, -0.07343482971191406, -0.06874847412109375, -0.06406211853027344, -0.059375762939453125, -0.05468940734863281, -0.0500030517578125, -0.04531669616699219, -0.040630340576171875, -0.03594398498535156, -0.03125762939453125, -0.026571273803710938, -0.021884918212890625, -0.017198562622070312, -0.01251220703125, -0.007825851440429688, -0.003139495849609375, 0.0015468597412109375, 0.00623321533203125, 0.010919570922851562, 0.015605926513671875, 0.020292282104492188, 0.0249786376953125, 0.029664993286132812, 0.034351348876953125, 0.03903770446777344, 0.04372406005859375, 0.04841041564941406, 0.053096771240234375, 0.05778312683105469, 0.062469482421875, 0.06715583801269531, 0.07184219360351562, 0.07652854919433594, 0.08121490478515625, 0.08590126037597656, 0.09058761596679688, 0.09527397155761719, 0.0999603271484375, 0.10464668273925781, 0.10933303833007812, 0.11401939392089844, 0.11870574951171875, 0.12339210510253906, 0.12807846069335938, 0.1327648162841797, 0.137451171875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 8.0, 5.0, 14.0, 9.0, 8.0, 25.0, 17.0, 39.0, 18.0, 39.0, 33.0, 50.0, 31.0, 43.0, 48.0, 55.0, 55.0, 60.0, 42.0, 46.0, 59.0, 35.0, 43.0, 40.0, 39.0, 21.0, 34.0, 24.0, 9.0, 10.0, 7.0, 11.0, 7.0, 7.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2349853515625, -0.22806930541992188, -0.22115325927734375, -0.21423721313476562, -0.2073211669921875, -0.20040512084960938, -0.19348907470703125, -0.18657302856445312, -0.179656982421875, -0.17274093627929688, -0.16582489013671875, -0.15890884399414062, -0.1519927978515625, -0.14507675170898438, -0.13816070556640625, -0.13124465942382812, -0.12432861328125, -0.11741256713867188, -0.11049652099609375, -0.10358047485351562, -0.0966644287109375, -0.08974838256835938, -0.08283233642578125, -0.07591629028320312, -0.069000244140625, -0.062084197998046875, -0.05516815185546875, -0.048252105712890625, -0.0413360595703125, -0.034420013427734375, -0.02750396728515625, -0.020587921142578125, -0.013671875, -0.006755828857421875, 0.00016021728515625, 0.007076263427734375, 0.0139923095703125, 0.020908355712890625, 0.02782440185546875, 0.034740447998046875, 0.041656494140625, 0.048572540283203125, 0.05548858642578125, 0.062404632568359375, 0.0693206787109375, 0.07623672485351562, 0.08315277099609375, 0.09006881713867188, 0.09698486328125, 0.10390090942382812, 0.11081695556640625, 0.11773300170898438, 0.1246490478515625, 0.13156509399414062, 0.13848114013671875, 0.14539718627929688, 0.152313232421875, 0.15922927856445312, 0.16614532470703125, 0.17306137084960938, 0.1799774169921875, 0.18689346313476562, 0.19380950927734375, 0.20072555541992188, 0.2076416015625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 2.0, 5.0, 8.0, 3.0, 12.0, 22.0, 32.0, 56.0, 91.0, 196.0, 445.0, 1383.0, 11594.0, 842199.0, 186035.0, 4843.0, 908.0, 334.0, 144.0, 64.0, 62.0, 41.0, 24.0, 19.0, 8.0, 7.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.2646484375, -0.25832176208496094, -0.2519950866699219, -0.2456684112548828, -0.23934173583984375, -0.2330150604248047, -0.22668838500976562, -0.22036170959472656, -0.2140350341796875, -0.20770835876464844, -0.20138168334960938, -0.1950550079345703, -0.18872833251953125, -0.1824016571044922, -0.17607498168945312, -0.16974830627441406, -0.163421630859375, -0.15709495544433594, -0.15076828002929688, -0.1444416046142578, -0.13811492919921875, -0.1317882537841797, -0.12546157836914062, -0.11913490295410156, -0.1128082275390625, -0.10648155212402344, -0.10015487670898438, -0.09382820129394531, -0.08750152587890625, -0.08117485046386719, -0.07484817504882812, -0.06852149963378906, -0.06219482421875, -0.05586814880371094, -0.049541473388671875, -0.04321479797363281, -0.03688812255859375, -0.030561447143554688, -0.024234771728515625, -0.017908096313476562, -0.0115814208984375, -0.0052547454833984375, 0.001071929931640625, 0.0073986053466796875, 0.01372528076171875, 0.020051956176757812, 0.026378631591796875, 0.03270530700683594, 0.039031982421875, 0.04535865783691406, 0.051685333251953125, 0.05801200866699219, 0.06433868408203125, 0.07066535949707031, 0.07699203491210938, 0.08331871032714844, 0.0896453857421875, 0.09597206115722656, 0.10229873657226562, 0.10862541198730469, 0.11495208740234375, 0.12127876281738281, 0.12760543823242188, 0.13393211364746094, 0.1402587890625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 5.0, 8.0, 7.0, 10.0, 10.0, 15.0, 11.0, 18.0, 18.0, 37.0, 42.0, 48.0, 46.0, 86.0, 71.0, 78.0, 80.0, 65.0, 71.0, 49.0, 49.0, 45.0, 25.0, 20.0, 23.0, 10.0, 11.0, 10.0, 8.0, 10.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1278858184814453e-05, -2.0585954189300537e-05, -1.989305019378662e-05, -1.9200146198272705e-05, -1.850724220275879e-05, -1.7814338207244873e-05, -1.7121434211730957e-05, -1.642853021621704e-05, -1.5735626220703125e-05, -1.5042722225189209e-05, -1.4349818229675293e-05, -1.3656914234161377e-05, -1.2964010238647461e-05, -1.2271106243133545e-05, -1.1578202247619629e-05, -1.0885298252105713e-05, -1.0192394256591797e-05, -9.499490261077881e-06, -8.806586265563965e-06, -8.113682270050049e-06, -7.420778274536133e-06, -6.727874279022217e-06, -6.034970283508301e-06, -5.342066287994385e-06, -4.649162292480469e-06, -3.956258296966553e-06, -3.2633543014526367e-06, -2.5704503059387207e-06, -1.8775463104248047e-06, -1.1846423149108887e-06, -4.917383193969727e-07, 2.0116567611694336e-07, 8.940696716308594e-07, 1.5869736671447754e-06, 2.2798776626586914e-06, 2.9727816581726074e-06, 3.6656856536865234e-06, 4.3585896492004395e-06, 5.0514936447143555e-06, 5.7443976402282715e-06, 6.4373016357421875e-06, 7.1302056312561035e-06, 7.82310962677002e-06, 8.516013622283936e-06, 9.208917617797852e-06, 9.901821613311768e-06, 1.0594725608825684e-05, 1.12876296043396e-05, 1.1980533599853516e-05, 1.2673437595367432e-05, 1.3366341590881348e-05, 1.4059245586395264e-05, 1.475214958190918e-05, 1.5445053577423096e-05, 1.6137957572937012e-05, 1.6830861568450928e-05, 1.7523765563964844e-05, 1.821666955947876e-05, 1.8909573554992676e-05, 1.9602477550506592e-05, 2.0295381546020508e-05, 2.0988285541534424e-05, 2.168118953704834e-05, 2.2374093532562256e-05, 2.3066997528076172e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 12.0, 15.0, 31.0, 56.0, 82.0, 159.0, 280.0, 585.0, 1422.0, 5051.0, 39584.0, 832005.0, 155469.0, 9882.0, 2254.0, 790.0, 395.0, 202.0, 106.0, 67.0, 28.0, 22.0, 15.0, 9.0, 6.0, 5.0, 8.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.174072265625, -0.16945552825927734, -0.1648387908935547, -0.16022205352783203, -0.15560531616210938, -0.15098857879638672, -0.14637184143066406, -0.1417551040649414, -0.13713836669921875, -0.1325216293334961, -0.12790489196777344, -0.12328815460205078, -0.11867141723632812, -0.11405467987060547, -0.10943794250488281, -0.10482120513916016, -0.1002044677734375, -0.09558773040771484, -0.09097099304199219, -0.08635425567626953, -0.08173751831054688, -0.07712078094482422, -0.07250404357910156, -0.0678873062133789, -0.06327056884765625, -0.058653831481933594, -0.05403709411621094, -0.04942035675048828, -0.044803619384765625, -0.04018688201904297, -0.03557014465332031, -0.030953407287597656, -0.026336669921875, -0.021719932556152344, -0.017103195190429688, -0.012486457824707031, -0.007869720458984375, -0.0032529830932617188, 0.0013637542724609375, 0.005980491638183594, 0.01059722900390625, 0.015213966369628906, 0.019830703735351562, 0.02444744110107422, 0.029064178466796875, 0.03368091583251953, 0.03829765319824219, 0.042914390563964844, 0.0475311279296875, 0.052147865295410156, 0.05676460266113281, 0.06138134002685547, 0.06599807739257812, 0.07061481475830078, 0.07523155212402344, 0.0798482894897461, 0.08446502685546875, 0.0890817642211914, 0.09369850158691406, 0.09831523895263672, 0.10293197631835938, 0.10754871368408203, 0.11216545104980469, 0.11678218841552734, 0.12139892578125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 8.0, 9.0, 12.0, 27.0, 49.0, 83.0, 122.0, 164.0, 161.0, 139.0, 85.0, 55.0, 36.0, 24.0, 7.0, 9.0, 7.0, 7.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1910400390625, -0.1868114471435547, -0.18258285522460938, -0.17835426330566406, -0.17412567138671875, -0.16989707946777344, -0.16566848754882812, -0.1614398956298828, -0.1572113037109375, -0.1529827117919922, -0.14875411987304688, -0.14452552795410156, -0.14029693603515625, -0.13606834411621094, -0.13183975219726562, -0.1276111602783203, -0.123382568359375, -0.11915397644042969, -0.11492538452148438, -0.11069679260253906, -0.10646820068359375, -0.10223960876464844, -0.09801101684570312, -0.09378242492675781, -0.0895538330078125, -0.08532524108886719, -0.08109664916992188, -0.07686805725097656, -0.07263946533203125, -0.06841087341308594, -0.06418228149414062, -0.05995368957519531, -0.05572509765625, -0.05149650573730469, -0.047267913818359375, -0.04303932189941406, -0.03881072998046875, -0.03458213806152344, -0.030353546142578125, -0.026124954223632812, -0.0218963623046875, -0.017667770385742188, -0.013439178466796875, -0.009210586547851562, -0.00498199462890625, -0.0007534027099609375, 0.003475189208984375, 0.0077037811279296875, 0.011932373046875, 0.016160964965820312, 0.020389556884765625, 0.024618148803710938, 0.02884674072265625, 0.03307533264160156, 0.037303924560546875, 0.04153251647949219, 0.0457611083984375, 0.04998970031738281, 0.054218292236328125, 0.05844688415527344, 0.06267547607421875, 0.06690406799316406, 0.07113265991210938, 0.07536125183105469, 0.07958984375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 9.0, 4.0, 33.0, 85.0, 234.0, 276.0, 200.0, 102.0, 32.0, 16.0, 9.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9702353477478027, -2.891038179397583, -2.8118410110473633, -2.7326440811157227, -2.653446912765503, -2.574249744415283, -2.4950528144836426, -2.415855646133423, -2.336658477783203, -2.2574613094329834, -2.1782641410827637, -2.099067211151123, -2.0198700428009033, -1.9406728744506836, -1.8614758253097534, -1.7822787761688232, -1.7030816078186035, -1.6238844394683838, -1.5446873903274536, -1.4654903411865234, -1.3862931728363037, -1.307096004486084, -1.2278989553451538, -1.1487019062042236, -1.069504737854004, -0.990307629108429, -0.911110520362854, -0.831913411617279, -0.7527163028717041, -0.6735191941261292, -0.5943220853805542, -0.5151249766349792, -0.4359278678894043, -0.35673075914382935, -0.2775336503982544, -0.19833654165267944, -0.11913943290710449, -0.03994232416152954, 0.03925478458404541, 0.11845189332962036, 0.1976490020751953, 0.27684611082077026, 0.3560432195663452, 0.43524032831192017, 0.5144374370574951, 0.5936345458030701, 0.672831654548645, 0.75202876329422, 0.8312258720397949, 0.9104229807853699, 0.9896200895309448, 1.068817138671875, 1.1480143070220947, 1.2272114753723145, 1.3064085245132446, 1.3856055736541748, 1.4648027420043945, 1.5439999103546143, 1.6231969594955444, 1.7023940086364746, 1.7815911769866943, 1.860788345336914, 1.9399853944778442, 2.0191824436187744, 2.098379611968994]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 4.0, 10.0, 16.0, 16.0, 23.0, 21.0, 18.0, 34.0, 42.0, 46.0, 53.0, 59.0, 69.0, 87.0, 74.0, 76.0, 66.0, 61.0, 36.0, 50.0, 29.0, 24.0, 23.0, 19.0, 14.0, 8.0, 9.0, 2.0, 6.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0803883075714111, -1.0384495258331299, -0.9965108036994934, -0.9545720815658569, -0.9126332998275757, -0.8706945180892944, -0.828755795955658, -0.7868170738220215, -0.7448782920837402, -0.702939510345459, -0.6610007882118225, -0.619062066078186, -0.5771232843399048, -0.5351845026016235, -0.49324578046798706, -0.4513070285320282, -0.40936827659606934, -0.3674295246601105, -0.3254907727241516, -0.28355202078819275, -0.2416132688522339, -0.19967451691627502, -0.15773576498031616, -0.1157970130443573, -0.07385826110839844, -0.031919509172439575, 0.010019242763519287, 0.05195799469947815, 0.09389674663543701, 0.13583549857139587, 0.17777425050735474, 0.2197130024433136, 0.26165175437927246, 0.3035905063152313, 0.3455292582511902, 0.38746801018714905, 0.4294067621231079, 0.4713455140590668, 0.5132842659950256, 0.5552229881286621, 0.5971617698669434, 0.6391005516052246, 0.6810392737388611, 0.7229779958724976, 0.7649167776107788, 0.8068555593490601, 0.8487942814826965, 0.890733003616333, 0.9326717853546143, 0.9746105670928955, 1.0165493488311768, 1.0584880113601685, 1.1004267930984497, 1.142365574836731, 1.1843042373657227, 1.226243019104004, 1.2681818008422852, 1.3101205825805664, 1.3520593643188477, 1.3939980268478394, 1.4359368085861206, 1.4778755903244019, 1.5198142528533936, 1.5617530345916748, 1.603691816329956]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 5.0, 10.0, 11.0, 13.0, 19.0, 21.0, 25.0, 51.0, 55.0, 86.0, 123.0, 173.0, 233.0, 335.0, 527.0, 991.0, 2199.0, 6888.0, 31969.0, 4041324.0, 90522.0, 11805.0, 3402.0, 1392.0, 698.0, 406.0, 281.0, 189.0, 144.0, 96.0, 66.0, 68.0, 48.0, 30.0, 20.0, 21.0, 10.0, 11.0, 2.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.22705078125, -0.2201080322265625, -0.213165283203125, -0.2062225341796875, -0.19927978515625, -0.1923370361328125, -0.185394287109375, -0.1784515380859375, -0.1715087890625, -0.1645660400390625, -0.157623291015625, -0.1506805419921875, -0.14373779296875, -0.1367950439453125, -0.129852294921875, -0.1229095458984375, -0.115966796875, -0.1090240478515625, -0.102081298828125, -0.0951385498046875, -0.08819580078125, -0.0812530517578125, -0.074310302734375, -0.0673675537109375, -0.0604248046875, -0.0534820556640625, -0.046539306640625, -0.0395965576171875, -0.03265380859375, -0.0257110595703125, -0.018768310546875, -0.0118255615234375, -0.0048828125, 0.0020599365234375, 0.009002685546875, 0.0159454345703125, 0.02288818359375, 0.0298309326171875, 0.036773681640625, 0.0437164306640625, 0.0506591796875, 0.0576019287109375, 0.064544677734375, 0.0714874267578125, 0.07843017578125, 0.0853729248046875, 0.092315673828125, 0.0992584228515625, 0.106201171875, 0.1131439208984375, 0.120086669921875, 0.1270294189453125, 0.13397216796875, 0.1409149169921875, 0.147857666015625, 0.1548004150390625, 0.1617431640625, 0.1686859130859375, 0.175628662109375, 0.1825714111328125, 0.18951416015625, 0.1964569091796875, 0.203399658203125, 0.2103424072265625, 0.21728515625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 7.0, 10.0, 12.0, 19.0, 26.0, 28.0, 50.0, 65.0, 77.0, 98.0, 99.0, 105.0, 118.0, 75.0, 57.0, 47.0, 41.0, 36.0, 17.0, 9.0, 3.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.087890625, -0.08505630493164062, -0.08222198486328125, -0.07938766479492188, -0.0765533447265625, -0.07371902465820312, -0.07088470458984375, -0.06805038452148438, -0.065216064453125, -0.062381744384765625, -0.05954742431640625, -0.056713104248046875, -0.0538787841796875, -0.051044464111328125, -0.04821014404296875, -0.045375823974609375, -0.04254150390625, -0.039707183837890625, -0.03687286376953125, -0.034038543701171875, -0.0312042236328125, -0.028369903564453125, -0.02553558349609375, -0.022701263427734375, -0.019866943359375, -0.017032623291015625, -0.01419830322265625, -0.011363983154296875, -0.0085296630859375, -0.005695343017578125, -0.00286102294921875, -2.6702880859375e-05, 0.0028076171875, 0.005641937255859375, 0.00847625732421875, 0.011310577392578125, 0.0141448974609375, 0.016979217529296875, 0.01981353759765625, 0.022647857666015625, 0.025482177734375, 0.028316497802734375, 0.03115081787109375, 0.033985137939453125, 0.0368194580078125, 0.039653778076171875, 0.04248809814453125, 0.045322418212890625, 0.04815673828125, 0.050991058349609375, 0.05382537841796875, 0.056659698486328125, 0.0594940185546875, 0.062328338623046875, 0.06516265869140625, 0.06799697875976562, 0.070831298828125, 0.07366561889648438, 0.07649993896484375, 0.07933425903320312, 0.0821685791015625, 0.08500289916992188, 0.08783721923828125, 0.09067153930664062, 0.093505859375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 2.0, 2.0, 4.0, 6.0, 11.0, 12.0, 17.0, 23.0, 23.0, 46.0, 47.0, 66.0, 102.0, 140.0, 211.0, 290.0, 456.0, 640.0, 1057.0, 1825.0, 3581.0, 8641.0, 31241.0, 3330202.0, 770759.0, 28403.0, 8147.0, 3509.0, 1794.0, 1019.0, 638.0, 414.0, 269.0, 189.0, 151.0, 99.0, 70.0, 53.0, 29.0, 23.0, 23.0, 15.0, 10.0, 9.0, 4.0, 1.0, 3.0, 5.0, 6.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.2103271484375, -0.20413589477539062, -0.19794464111328125, -0.19175338745117188, -0.1855621337890625, -0.17937088012695312, -0.17317962646484375, -0.16698837280273438, -0.160797119140625, -0.15460586547851562, -0.14841461181640625, -0.14222335815429688, -0.1360321044921875, -0.12984085083007812, -0.12364959716796875, -0.11745834350585938, -0.11126708984375, -0.10507583618164062, -0.09888458251953125, -0.09269332885742188, -0.0865020751953125, -0.08031082153320312, -0.07411956787109375, -0.06792831420898438, -0.061737060546875, -0.055545806884765625, -0.04935455322265625, -0.043163299560546875, -0.0369720458984375, -0.030780792236328125, -0.02458953857421875, -0.018398284912109375, -0.01220703125, -0.006015777587890625, 0.00017547607421875, 0.006366729736328125, 0.0125579833984375, 0.018749237060546875, 0.02494049072265625, 0.031131744384765625, 0.037322998046875, 0.043514251708984375, 0.04970550537109375, 0.055896759033203125, 0.0620880126953125, 0.06827926635742188, 0.07447052001953125, 0.08066177368164062, 0.08685302734375, 0.09304428100585938, 0.09923553466796875, 0.10542678833007812, 0.1116180419921875, 0.11780929565429688, 0.12400054931640625, 0.13019180297851562, 0.136383056640625, 0.14257431030273438, 0.14876556396484375, 0.15495681762695312, 0.1611480712890625, 0.16733932495117188, 0.17353057861328125, 0.17972183227539062, 0.1859130859375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 5.0, 6.0, 8.0, 11.0, 14.0, 28.0, 36.0, 109.0, 728.0, 2829.0, 161.0, 48.0, 37.0, 13.0, 5.0, 8.0, 10.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09521484375, -0.09224796295166016, -0.08928108215332031, -0.08631420135498047, -0.08334732055664062, -0.08038043975830078, -0.07741355895996094, -0.0744466781616211, -0.07147979736328125, -0.0685129165649414, -0.06554603576660156, -0.06257915496826172, -0.059612274169921875, -0.05664539337158203, -0.05367851257324219, -0.050711631774902344, -0.0477447509765625, -0.044777870178222656, -0.04181098937988281, -0.03884410858154297, -0.035877227783203125, -0.03291034698486328, -0.029943466186523438, -0.026976585388183594, -0.02400970458984375, -0.021042823791503906, -0.018075942993164062, -0.015109062194824219, -0.012142181396484375, -0.009175300598144531, -0.0062084197998046875, -0.0032415390014648438, -0.000274658203125, 0.0026922225952148438, 0.0056591033935546875, 0.008625984191894531, 0.011592864990234375, 0.014559745788574219, 0.017526626586914062, 0.020493507385253906, 0.02346038818359375, 0.026427268981933594, 0.029394149780273438, 0.03236103057861328, 0.035327911376953125, 0.03829479217529297, 0.04126167297363281, 0.044228553771972656, 0.0471954345703125, 0.050162315368652344, 0.05312919616699219, 0.05609607696533203, 0.059062957763671875, 0.06202983856201172, 0.06499671936035156, 0.0679636001586914, 0.07093048095703125, 0.0738973617553711, 0.07686424255371094, 0.07983112335205078, 0.08279800415039062, 0.08576488494873047, 0.08873176574707031, 0.09169864654541016, 0.09466552734375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 2.0, 2.0, 8.0, 16.0, 14.0, 10.0, 15.0, 29.0, 35.0, 42.0, 61.0, 92.0, 98.0, 100.0, 102.0, 82.0, 84.0, 62.0, 38.0, 39.0, 25.0, 11.0, 10.0, 6.0, 8.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3083820044994354, -0.29975780844688416, -0.2911336123943329, -0.2825094163417816, -0.27388522028923035, -0.2652610242366791, -0.2566368281841278, -0.24801264703273773, -0.23938845098018646, -0.2307642549276352, -0.22214005887508392, -0.21351586282253265, -0.20489168167114258, -0.1962674856185913, -0.18764328956604004, -0.17901909351348877, -0.1703948974609375, -0.16177070140838623, -0.15314650535583496, -0.1445223093032837, -0.13589811325073242, -0.12727391719818115, -0.11864973604679108, -0.11002553999423981, -0.10140134394168854, -0.09277714788913727, -0.084152951836586, -0.07552876323461533, -0.06690456718206406, -0.05828037112951279, -0.049656178802251816, -0.041031986474990845, -0.03240780532360077, -0.02378361113369465, -0.015159416943788528, -0.006535222753882408, 0.002088971436023712, 0.010713167488574982, 0.019337359815835953, 0.027961552143096924, 0.03658574819564819, 0.04520994424819946, 0.053834136575460434, 0.062458328902721405, 0.07108252495527267, 0.07970672100782394, 0.08833090960979462, 0.09695510566234589, 0.10557930171489716, 0.11420349776744843, 0.1228276938199997, 0.13145188987255096, 0.14007607102394104, 0.1487002670764923, 0.15732446312904358, 0.16594865918159485, 0.17457285523414612, 0.1831970512866974, 0.19182124733924866, 0.20044544339179993, 0.2090696394443512, 0.21769383549690247, 0.22631801664829254, 0.2349422127008438, 0.24356640875339508]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 10.0, 3.0, 6.0, 18.0, 14.0, 14.0, 20.0, 18.0, 28.0, 30.0, 37.0, 28.0, 33.0, 51.0, 43.0, 50.0, 36.0, 49.0, 34.0, 52.0, 41.0, 53.0, 46.0, 31.0, 47.0, 36.0, 22.0, 26.0, 25.0, 21.0, 10.0, 19.0, 12.0, 12.0, 3.0, 6.0, 6.0, 2.0, 4.0, 0.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.18508309125900269, -0.17879697680473328, -0.17251084744930267, -0.16622473299503326, -0.15993860363960266, -0.15365248918533325, -0.14736637473106384, -0.14108026027679443, -0.13479413092136383, -0.12850801646709442, -0.12222188711166382, -0.11593577265739441, -0.1096496507525444, -0.1033635288476944, -0.09707741439342499, -0.09079129248857498, -0.08450517058372498, -0.07821904867887497, -0.07193292677402496, -0.06564681231975555, -0.05936069041490555, -0.05307456851005554, -0.046788450330495834, -0.04050233215093613, -0.03421621024608612, -0.027930090203881264, -0.021643970161676407, -0.01535785011947155, -0.009071730077266693, -0.002785608172416687, 0.0035005100071430206, 0.009786628186702728, 0.016072750091552734, 0.02235887013375759, 0.028644990175962448, 0.034931108355522156, 0.04121723026037216, 0.04750335216522217, 0.053789470344781876, 0.06007558852434158, 0.06636171042919159, 0.0726478323340416, 0.0789339542388916, 0.08522006869316101, 0.09150619059801102, 0.09779231250286102, 0.10407842695713043, 0.11036454886198044, 0.11665067076683044, 0.12293679267168045, 0.12922291457653046, 0.13550902903079987, 0.14179515838623047, 0.14808127284049988, 0.1543673872947693, 0.1606535017490387, 0.1669396311044693, 0.1732257455587387, 0.1795118749141693, 0.18579798936843872, 0.19208410382270813, 0.19837023317813873, 0.20465634763240814, 0.21094247698783875, 0.21722859144210815]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 8.0, 10.0, 29.0, 39.0, 41.0, 89.0, 154.0, 230.0, 458.0, 851.0, 1650.0, 3693.0, 10066.0, 32596.0, 131757.0, 509375.0, 269181.0, 60745.0, 16936.0, 5818.0, 2379.0, 1099.0, 585.0, 309.0, 182.0, 101.0, 64.0, 42.0, 24.0, 10.0, 14.0, 7.0, 3.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1624755859375, -0.1570110321044922, -0.15154647827148438, -0.14608192443847656, -0.14061737060546875, -0.13515281677246094, -0.12968826293945312, -0.12422370910644531, -0.1187591552734375, -0.11329460144042969, -0.10783004760742188, -0.10236549377441406, -0.09690093994140625, -0.09143638610839844, -0.08597183227539062, -0.08050727844238281, -0.075042724609375, -0.06957817077636719, -0.06411361694335938, -0.05864906311035156, -0.05318450927734375, -0.04771995544433594, -0.042255401611328125, -0.03679084777832031, -0.0313262939453125, -0.025861740112304688, -0.020397186279296875, -0.014932632446289062, -0.00946807861328125, -0.0040035247802734375, 0.001461029052734375, 0.0069255828857421875, 0.01239013671875, 0.017854690551757812, 0.023319244384765625, 0.028783798217773438, 0.03424835205078125, 0.03971290588378906, 0.045177459716796875, 0.05064201354980469, 0.0561065673828125, 0.06157112121582031, 0.06703567504882812, 0.07250022888183594, 0.07796478271484375, 0.08342933654785156, 0.08889389038085938, 0.09435844421386719, 0.099822998046875, 0.10528755187988281, 0.11075210571289062, 0.11621665954589844, 0.12168121337890625, 0.12714576721191406, 0.13261032104492188, 0.1380748748779297, 0.1435394287109375, 0.1490039825439453, 0.15446853637695312, 0.15993309020996094, 0.16539764404296875, 0.17086219787597656, 0.17632675170898438, 0.1817913055419922, 0.187255859375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 8.0, 10.0, 21.0, 23.0, 29.0, 49.0, 56.0, 81.0, 85.0, 103.0, 85.0, 107.0, 94.0, 80.0, 50.0, 42.0, 25.0, 18.0, 18.0, 11.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10992431640625, -0.1069021224975586, -0.10387992858886719, -0.10085773468017578, -0.09783554077148438, -0.09481334686279297, -0.09179115295410156, -0.08876895904541016, -0.08574676513671875, -0.08272457122802734, -0.07970237731933594, -0.07668018341064453, -0.07365798950195312, -0.07063579559326172, -0.06761360168457031, -0.0645914077758789, -0.0615692138671875, -0.058547019958496094, -0.05552482604980469, -0.05250263214111328, -0.049480438232421875, -0.04645824432373047, -0.04343605041503906, -0.040413856506347656, -0.03739166259765625, -0.034369468688964844, -0.03134727478027344, -0.02832508087158203, -0.025302886962890625, -0.02228069305419922, -0.019258499145507812, -0.016236305236816406, -0.013214111328125, -0.010191917419433594, -0.0071697235107421875, -0.004147529602050781, -0.001125335693359375, 0.0018968582153320312, 0.0049190521240234375, 0.007941246032714844, 0.01096343994140625, 0.013985633850097656, 0.017007827758789062, 0.02003002166748047, 0.023052215576171875, 0.02607440948486328, 0.029096603393554688, 0.032118797302246094, 0.0351409912109375, 0.038163185119628906, 0.04118537902832031, 0.04420757293701172, 0.047229766845703125, 0.05025196075439453, 0.05327415466308594, 0.056296348571777344, 0.05931854248046875, 0.062340736389160156, 0.06536293029785156, 0.06838512420654297, 0.07140731811523438, 0.07442951202392578, 0.07745170593261719, 0.0804738998413086, 0.08349609375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 7.0, 4.0, 6.0, 10.0, 8.0, 13.0, 12.0, 23.0, 45.0, 49.0, 60.0, 78.0, 99.0, 168.0, 234.0, 323.0, 492.0, 843.0, 1583.0, 3161.0, 7710.0, 24385.0, 120487.0, 620478.0, 211181.0, 37533.0, 10607.0, 4096.0, 1963.0, 1004.0, 614.0, 363.0, 288.0, 164.0, 117.0, 90.0, 73.0, 53.0, 33.0, 27.0, 25.0, 11.0, 11.0, 10.0, 4.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.16943359375, -0.164398193359375, -0.15936279296875, -0.154327392578125, -0.1492919921875, -0.144256591796875, -0.13922119140625, -0.134185791015625, -0.129150390625, -0.124114990234375, -0.11907958984375, -0.114044189453125, -0.1090087890625, -0.103973388671875, -0.09893798828125, -0.093902587890625, -0.0888671875, -0.083831787109375, -0.07879638671875, -0.073760986328125, -0.0687255859375, -0.063690185546875, -0.05865478515625, -0.053619384765625, -0.048583984375, -0.043548583984375, -0.03851318359375, -0.033477783203125, -0.0284423828125, -0.023406982421875, -0.01837158203125, -0.013336181640625, -0.00830078125, -0.003265380859375, 0.00177001953125, 0.006805419921875, 0.0118408203125, 0.016876220703125, 0.02191162109375, 0.026947021484375, 0.031982421875, 0.037017822265625, 0.04205322265625, 0.047088623046875, 0.0521240234375, 0.057159423828125, 0.06219482421875, 0.067230224609375, 0.072265625, 0.077301025390625, 0.08233642578125, 0.087371826171875, 0.0924072265625, 0.097442626953125, 0.10247802734375, 0.107513427734375, 0.112548828125, 0.117584228515625, 0.12261962890625, 0.127655029296875, 0.1326904296875, 0.137725830078125, 0.14276123046875, 0.147796630859375, 0.15283203125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 7.0, 3.0, 7.0, 5.0, 5.0, 16.0, 13.0, 13.0, 16.0, 26.0, 32.0, 21.0, 29.0, 44.0, 36.0, 31.0, 40.0, 34.0, 33.0, 44.0, 39.0, 40.0, 29.0, 38.0, 38.0, 37.0, 31.0, 32.0, 35.0, 34.0, 19.0, 24.0, 22.0, 21.0, 13.0, 15.0, 16.0, 17.0, 7.0, 5.0, 7.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.1904296875, -0.1849346160888672, -0.17943954467773438, -0.17394447326660156, -0.16844940185546875, -0.16295433044433594, -0.15745925903320312, -0.1519641876220703, -0.1464691162109375, -0.1409740447998047, -0.13547897338867188, -0.12998390197753906, -0.12448883056640625, -0.11899375915527344, -0.11349868774414062, -0.10800361633300781, -0.102508544921875, -0.09701347351074219, -0.09151840209960938, -0.08602333068847656, -0.08052825927734375, -0.07503318786621094, -0.06953811645507812, -0.06404304504394531, -0.0585479736328125, -0.05305290222167969, -0.047557830810546875, -0.04206275939941406, -0.03656768798828125, -0.031072616577148438, -0.025577545166015625, -0.020082473754882812, -0.01458740234375, -0.009092330932617188, -0.003597259521484375, 0.0018978118896484375, 0.00739288330078125, 0.012887954711914062, 0.018383026123046875, 0.023878097534179688, 0.0293731689453125, 0.03486824035644531, 0.040363311767578125, 0.04585838317871094, 0.05135345458984375, 0.05684852600097656, 0.062343597412109375, 0.06783866882324219, 0.073333740234375, 0.07882881164550781, 0.08432388305664062, 0.08981895446777344, 0.09531402587890625, 0.10080909729003906, 0.10630416870117188, 0.11179924011230469, 0.1172943115234375, 0.12278938293457031, 0.12828445434570312, 0.13377952575683594, 0.13927459716796875, 0.14476966857910156, 0.15026473999023438, 0.1557598114013672, 0.1612548828125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 4.0, 6.0, 6.0, 5.0, 4.0, 6.0, 5.0, 11.0, 12.0, 27.0, 31.0, 34.0, 64.0, 115.0, 154.0, 230.0, 349.0, 626.0, 1251.0, 2620.0, 6578.0, 22242.0, 148853.0, 698580.0, 134285.0, 20900.0, 6173.0, 2480.0, 1218.0, 634.0, 377.0, 241.0, 130.0, 99.0, 57.0, 48.0, 26.0, 19.0, 18.0, 9.0, 7.0, 5.0, 7.0, 3.0, 2.0, 4.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06658935546875, -0.06440448760986328, -0.06221961975097656, -0.060034751892089844, -0.057849884033203125, -0.055665016174316406, -0.05348014831542969, -0.05129528045654297, -0.04911041259765625, -0.04692554473876953, -0.04474067687988281, -0.042555809020996094, -0.040370941162109375, -0.038186073303222656, -0.03600120544433594, -0.03381633758544922, -0.0316314697265625, -0.02944660186767578, -0.027261734008789062, -0.025076866149902344, -0.022891998291015625, -0.020707130432128906, -0.018522262573242188, -0.01633739471435547, -0.01415252685546875, -0.011967658996582031, -0.009782791137695312, -0.007597923278808594, -0.005413055419921875, -0.0032281875610351562, -0.0010433197021484375, 0.0011415481567382812, 0.003326416015625, 0.005511283874511719, 0.0076961517333984375, 0.009881019592285156, 0.012065887451171875, 0.014250755310058594, 0.016435623168945312, 0.01862049102783203, 0.02080535888671875, 0.02299022674560547, 0.025175094604492188, 0.027359962463378906, 0.029544830322265625, 0.031729698181152344, 0.03391456604003906, 0.03609943389892578, 0.0382843017578125, 0.04046916961669922, 0.04265403747558594, 0.044838905334472656, 0.047023773193359375, 0.049208641052246094, 0.05139350891113281, 0.05357837677001953, 0.05576324462890625, 0.05794811248779297, 0.06013298034667969, 0.062317848205566406, 0.06450271606445312, 0.06668758392333984, 0.06887245178222656, 0.07105731964111328, 0.0732421875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 7.0, 10.0, 10.0, 15.0, 19.0, 45.0, 42.0, 57.0, 66.0, 100.0, 162.0, 122.0, 95.0, 73.0, 61.0, 24.0, 31.0, 15.0, 12.0, 12.0, 10.0, 5.0, 5.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.500150680541992e-05, -4.3623149394989014e-05, -4.2244791984558105e-05, -4.08664345741272e-05, -3.948807716369629e-05, -3.810971975326538e-05, -3.673136234283447e-05, -3.5353004932403564e-05, -3.3974647521972656e-05, -3.259629011154175e-05, -3.121793270111084e-05, -2.983957529067993e-05, -2.8461217880249023e-05, -2.7082860469818115e-05, -2.5704503059387207e-05, -2.43261456489563e-05, -2.294778823852539e-05, -2.1569430828094482e-05, -2.0191073417663574e-05, -1.8812716007232666e-05, -1.7434358596801758e-05, -1.605600118637085e-05, -1.4677643775939941e-05, -1.3299286365509033e-05, -1.1920928955078125e-05, -1.0542571544647217e-05, -9.164214134216309e-06, -7.7858567237854e-06, -6.407499313354492e-06, -5.029141902923584e-06, -3.6507844924926758e-06, -2.2724270820617676e-06, -8.940696716308594e-07, 4.842877388000488e-07, 1.862645149230957e-06, 3.2410025596618652e-06, 4.6193599700927734e-06, 5.997717380523682e-06, 7.37607479095459e-06, 8.754432201385498e-06, 1.0132789611816406e-05, 1.1511147022247314e-05, 1.2889504432678223e-05, 1.4267861843109131e-05, 1.564621925354004e-05, 1.7024576663970947e-05, 1.8402934074401855e-05, 1.9781291484832764e-05, 2.1159648895263672e-05, 2.253800630569458e-05, 2.3916363716125488e-05, 2.5294721126556396e-05, 2.6673078536987305e-05, 2.8051435947418213e-05, 2.942979335784912e-05, 3.080815076828003e-05, 3.218650817871094e-05, 3.3564865589141846e-05, 3.4943222999572754e-05, 3.632158041000366e-05, 3.769993782043457e-05, 3.907829523086548e-05, 4.045665264129639e-05, 4.1835010051727295e-05, 4.32133674621582e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 6.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 4.0, 10.0, 13.0, 19.0, 46.0, 62.0, 128.0, 225.0, 495.0, 1216.0, 4059.0, 21049.0, 417327.0, 571089.0, 25811.0, 4508.0, 1387.0, 516.0, 247.0, 132.0, 69.0, 57.0, 26.0, 13.0, 12.0, 7.0, 10.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08404541015625, -0.0805501937866211, -0.07705497741699219, -0.07355976104736328, -0.07006454467773438, -0.06656932830810547, -0.06307411193847656, -0.059578895568847656, -0.05608367919921875, -0.052588462829589844, -0.04909324645996094, -0.04559803009033203, -0.042102813720703125, -0.03860759735107422, -0.03511238098144531, -0.031617164611816406, -0.0281219482421875, -0.024626731872558594, -0.021131515502929688, -0.01763629913330078, -0.014141082763671875, -0.010645866394042969, -0.0071506500244140625, -0.0036554336547851562, -0.00016021728515625, 0.0033349990844726562, 0.0068302154541015625, 0.010325431823730469, 0.013820648193359375, 0.01731586456298828, 0.020811080932617188, 0.024306297302246094, 0.027801513671875, 0.031296730041503906, 0.03479194641113281, 0.03828716278076172, 0.041782379150390625, 0.04527759552001953, 0.04877281188964844, 0.052268028259277344, 0.05576324462890625, 0.059258460998535156, 0.06275367736816406, 0.06624889373779297, 0.06974411010742188, 0.07323932647705078, 0.07673454284667969, 0.0802297592163086, 0.0837249755859375, 0.0872201919555664, 0.09071540832519531, 0.09421062469482422, 0.09770584106445312, 0.10120105743408203, 0.10469627380371094, 0.10819149017333984, 0.11168670654296875, 0.11518192291259766, 0.11867713928222656, 0.12217235565185547, 0.12566757202148438, 0.12916278839111328, 0.1326580047607422, 0.1361532211303711, 0.1396484375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 3.0, 6.0, 14.0, 15.0, 22.0, 34.0, 50.0, 70.0, 95.0, 123.0, 125.0, 110.0, 78.0, 76.0, 43.0, 38.0, 23.0, 17.0, 16.0, 8.0, 4.0, 5.0, 5.0, 9.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08782958984375, -0.0852804183959961, -0.08273124694824219, -0.08018207550048828, -0.07763290405273438, -0.07508373260498047, -0.07253456115722656, -0.06998538970947266, -0.06743621826171875, -0.06488704681396484, -0.06233787536621094, -0.05978870391845703, -0.057239532470703125, -0.05469036102294922, -0.05214118957519531, -0.049592018127441406, -0.0470428466796875, -0.044493675231933594, -0.04194450378417969, -0.03939533233642578, -0.036846160888671875, -0.03429698944091797, -0.03174781799316406, -0.029198646545410156, -0.02664947509765625, -0.024100303649902344, -0.021551132202148438, -0.01900196075439453, -0.016452789306640625, -0.013903617858886719, -0.011354446411132812, -0.008805274963378906, -0.006256103515625, -0.0037069320678710938, -0.0011577606201171875, 0.0013914108276367188, 0.003940582275390625, 0.006489753723144531, 0.009038925170898438, 0.011588096618652344, 0.01413726806640625, 0.016686439514160156, 0.019235610961914062, 0.02178478240966797, 0.024333953857421875, 0.02688312530517578, 0.029432296752929688, 0.031981468200683594, 0.0345306396484375, 0.037079811096191406, 0.03962898254394531, 0.04217815399169922, 0.044727325439453125, 0.04727649688720703, 0.04982566833496094, 0.052374839782714844, 0.05492401123046875, 0.057473182678222656, 0.06002235412597656, 0.06257152557373047, 0.06512069702148438, 0.06766986846923828, 0.07021903991699219, 0.0727682113647461, 0.0753173828125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 8.0, 6.0, 31.0, 38.0, 109.0, 185.0, 242.0, 197.0, 113.0, 45.0, 20.0, 4.0, 1.0, 6.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.017937660217285, -2.946852922439575, -2.8757681846618652, -2.8046836853027344, -2.7335989475250244, -2.6625142097473145, -2.5914294719696045, -2.5203447341918945, -2.4492602348327637, -2.3781754970550537, -2.3070907592773438, -2.236006259918213, -2.164921522140503, -2.093836784362793, -2.022752046585083, -1.9516674280166626, -1.8805826902389526, -1.8094979524612427, -1.7384133338928223, -1.6673285961151123, -1.596243977546692, -1.525159239768982, -1.4540746212005615, -1.3829898834228516, -1.3119051456451416, -1.2408204078674316, -1.1697357892990112, -1.0986510515213013, -1.0275664329528809, -0.9564816951751709, -0.8853970170021057, -0.8143123388290405, -0.7432276010513306, -0.6721429228782654, -0.6010582447052002, -0.5299735069274902, -0.45888885855674744, -0.38780418038368225, -0.3167194724082947, -0.2456347942352295, -0.1745501160621643, -0.10346543043851852, -0.03238074481487274, 0.03870394825935364, 0.10978862643241882, 0.180873304605484, 0.2519580125808716, 0.32304269075393677, 0.39412736892700195, 0.46521204710006714, 0.5362967252731323, 0.6073814630508423, 0.6784660816192627, 0.7495508193969727, 0.8206354975700378, 0.891720175743103, 0.9628048539161682, 1.0338895320892334, 1.1049742698669434, 1.1760588884353638, 1.2471436262130737, 1.3182282447814941, 1.389312982559204, 1.460397720336914, 1.5314823389053345]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 3.0, 3.0, 1.0, 6.0, 3.0, 9.0, 5.0, 11.0, 6.0, 14.0, 13.0, 15.0, 21.0, 34.0, 34.0, 27.0, 23.0, 39.0, 50.0, 39.0, 53.0, 48.0, 60.0, 67.0, 37.0, 58.0, 48.0, 41.0, 28.0, 34.0, 27.0, 33.0, 17.0, 13.0, 25.0, 11.0, 16.0, 5.0, 5.0, 7.0, 7.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9634849429130554, -0.9339351654052734, -0.9043853282928467, -0.8748355507850647, -0.8452857732772827, -0.815735936164856, -0.786186158657074, -0.756636381149292, -0.72708660364151, -0.697536826133728, -0.6679869890213013, -0.6384372115135193, -0.6088874340057373, -0.5793375968933105, -0.5497878193855286, -0.5202380418777466, -0.4906882345676422, -0.46113842725753784, -0.43158864974975586, -0.4020388424396515, -0.3724890649318695, -0.34293925762176514, -0.31338948011398315, -0.2838396728038788, -0.2542898654937744, -0.22474007308483124, -0.19519028067588806, -0.1656404733657837, -0.1360906958580017, -0.10654088854789734, -0.07699109613895416, -0.047441303730010986, -0.017891526222229004, 0.011658268049359322, 0.04120806232094765, 0.07075785845518112, 0.1003076508641243, 0.12985745072364807, 0.15940724313259125, 0.18895703554153442, 0.2185068279504776, 0.24805662035942078, 0.27760642766952515, 0.30715620517730713, 0.3367060124874115, 0.36625581979751587, 0.39580559730529785, 0.42535537481307983, 0.4549051821231842, 0.4844549894332886, 0.5140047669410706, 0.5435545444488525, 0.5731043815612793, 0.6026541590690613, 0.6322039365768433, 0.66175377368927, 0.691303551197052, 0.720853328704834, 0.7504031658172607, 0.7799529433250427, 0.8095027208328247, 0.8390525579452515, 0.8686023354530334, 0.8981521129608154, 0.9277018904685974]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 6.0, 2.0, 5.0, 9.0, 11.0, 13.0, 26.0, 25.0, 36.0, 49.0, 67.0, 92.0, 113.0, 150.0, 273.0, 346.0, 499.0, 781.0, 1244.0, 2184.0, 3952.0, 7744.0, 16949.0, 46525.0, 209098.0, 2639896.0, 1088449.0, 116696.0, 31916.0, 12832.0, 6083.0, 3243.0, 1764.0, 1113.0, 665.0, 446.0, 275.0, 187.0, 149.0, 84.0, 86.0, 46.0, 42.0, 22.0, 27.0, 18.0, 15.0, 12.0, 4.0, 7.0, 4.0, 2.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08306884765625, -0.08018779754638672, -0.07730674743652344, -0.07442569732666016, -0.07154464721679688, -0.0686635971069336, -0.06578254699707031, -0.06290149688720703, -0.06002044677734375, -0.05713939666748047, -0.05425834655761719, -0.051377296447753906, -0.048496246337890625, -0.045615196228027344, -0.04273414611816406, -0.03985309600830078, -0.0369720458984375, -0.03409099578857422, -0.031209945678710938, -0.028328895568847656, -0.025447845458984375, -0.022566795349121094, -0.019685745239257812, -0.01680469512939453, -0.01392364501953125, -0.011042594909667969, -0.008161544799804688, -0.005280494689941406, -0.002399444580078125, 0.00048160552978515625, 0.0033626556396484375, 0.006243705749511719, 0.009124755859375, 0.012005805969238281, 0.014886856079101562, 0.017767906188964844, 0.020648956298828125, 0.023530006408691406, 0.026411056518554688, 0.02929210662841797, 0.03217315673828125, 0.03505420684814453, 0.03793525695800781, 0.040816307067871094, 0.043697357177734375, 0.046578407287597656, 0.04945945739746094, 0.05234050750732422, 0.0552215576171875, 0.05810260772705078, 0.06098365783691406, 0.06386470794677734, 0.06674575805664062, 0.0696268081665039, 0.07250785827636719, 0.07538890838623047, 0.07826995849609375, 0.08115100860595703, 0.08403205871582031, 0.0869131088256836, 0.08979415893554688, 0.09267520904541016, 0.09555625915527344, 0.09843730926513672, 0.101318359375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 1.0, 4.0, 3.0, 3.0, 6.0, 8.0, 7.0, 12.0, 8.0, 12.0, 9.0, 14.0, 19.0, 25.0, 17.0, 26.0, 22.0, 22.0, 25.0, 32.0, 31.0, 28.0, 38.0, 39.0, 36.0, 35.0, 51.0, 20.0, 44.0, 43.0, 33.0, 42.0, 40.0, 22.0, 28.0, 20.0, 30.0, 23.0, 18.0, 15.0, 17.0, 15.0, 11.0, 12.0, 9.0, 10.0, 4.0, 3.0, 4.0, 4.0, 5.0, 2.0, 1.0, 3.0], "bins": [-0.03936767578125, -0.03827214241027832, -0.03717660903930664, -0.03608107566833496, -0.03498554229736328, -0.0338900089263916, -0.03279447555541992, -0.03169894218444824, -0.030603408813476562, -0.029507875442504883, -0.028412342071533203, -0.027316808700561523, -0.026221275329589844, -0.025125741958618164, -0.024030208587646484, -0.022934675216674805, -0.021839141845703125, -0.020743608474731445, -0.019648075103759766, -0.018552541732788086, -0.017457008361816406, -0.016361474990844727, -0.015265941619873047, -0.014170408248901367, -0.013074874877929688, -0.011979341506958008, -0.010883808135986328, -0.009788274765014648, -0.008692741394042969, -0.007597208023071289, -0.006501674652099609, -0.00540614128112793, -0.00431060791015625, -0.0032150745391845703, -0.0021195411682128906, -0.001024007797241211, 7.152557373046875e-05, 0.0011670589447021484, 0.002262592315673828, 0.003358125686645508, 0.0044536590576171875, 0.005549192428588867, 0.006644725799560547, 0.0077402591705322266, 0.008835792541503906, 0.009931325912475586, 0.011026859283447266, 0.012122392654418945, 0.013217926025390625, 0.014313459396362305, 0.015408992767333984, 0.016504526138305664, 0.017600059509277344, 0.018695592880249023, 0.019791126251220703, 0.020886659622192383, 0.021982192993164062, 0.023077726364135742, 0.024173259735107422, 0.0252687931060791, 0.02636432647705078, 0.02745985984802246, 0.02855539321899414, 0.02965092658996582, 0.0307464599609375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 16.0, 19.0, 20.0, 35.0, 59.0, 94.0, 128.0, 223.0, 410.0, 770.0, 1651.0, 3865.0, 11646.0, 47609.0, 518028.0, 3424480.0, 147959.0, 24850.0, 7170.0, 2714.0, 1160.0, 556.0, 330.0, 169.0, 117.0, 73.0, 36.0, 20.0, 18.0, 14.0, 15.0, 2.0, 10.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.156494140625, -0.15132713317871094, -0.14616012573242188, -0.1409931182861328, -0.13582611083984375, -0.1306591033935547, -0.12549209594726562, -0.12032508850097656, -0.1151580810546875, -0.10999107360839844, -0.10482406616210938, -0.09965705871582031, -0.09449005126953125, -0.08932304382324219, -0.08415603637695312, -0.07898902893066406, -0.073822021484375, -0.06865501403808594, -0.06348800659179688, -0.05832099914550781, -0.05315399169921875, -0.04798698425292969, -0.042819976806640625, -0.03765296936035156, -0.0324859619140625, -0.027318954467773438, -0.022151947021484375, -0.016984939575195312, -0.01181793212890625, -0.0066509246826171875, -0.001483917236328125, 0.0036830902099609375, 0.00885009765625, 0.014017105102539062, 0.019184112548828125, 0.024351119995117188, 0.02951812744140625, 0.03468513488769531, 0.039852142333984375, 0.04501914978027344, 0.0501861572265625, 0.05535316467285156, 0.060520172119140625, 0.06568717956542969, 0.07085418701171875, 0.07602119445800781, 0.08118820190429688, 0.08635520935058594, 0.091522216796875, 0.09668922424316406, 0.10185623168945312, 0.10702323913574219, 0.11219024658203125, 0.11735725402832031, 0.12252426147460938, 0.12769126892089844, 0.1328582763671875, 0.13802528381347656, 0.14319229125976562, 0.1483592987060547, 0.15352630615234375, 0.1586933135986328, 0.16386032104492188, 0.16902732849121094, 0.1741943359375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 13.0, 12.0, 17.0, 10.0, 18.0, 40.0, 65.0, 113.0, 186.0, 323.0, 756.0, 1196.0, 599.0, 287.0, 144.0, 82.0, 54.0, 41.0, 25.0, 20.0, 13.0, 14.0, 11.0, 3.0, 6.0, 2.0, 2.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1390380859375, -0.1339569091796875, -0.128875732421875, -0.1237945556640625, -0.11871337890625, -0.1136322021484375, -0.108551025390625, -0.1034698486328125, -0.098388671875, -0.0933074951171875, -0.088226318359375, -0.0831451416015625, -0.07806396484375, -0.0729827880859375, -0.067901611328125, -0.0628204345703125, -0.0577392578125, -0.0526580810546875, -0.047576904296875, -0.0424957275390625, -0.03741455078125, -0.0323333740234375, -0.027252197265625, -0.0221710205078125, -0.01708984375, -0.0120086669921875, -0.006927490234375, -0.0018463134765625, 0.00323486328125, 0.0083160400390625, 0.013397216796875, 0.0184783935546875, 0.0235595703125, 0.0286407470703125, 0.033721923828125, 0.0388031005859375, 0.04388427734375, 0.0489654541015625, 0.054046630859375, 0.0591278076171875, 0.064208984375, 0.0692901611328125, 0.074371337890625, 0.0794525146484375, 0.08453369140625, 0.0896148681640625, 0.094696044921875, 0.0997772216796875, 0.1048583984375, 0.1099395751953125, 0.115020751953125, 0.1201019287109375, 0.12518310546875, 0.1302642822265625, 0.135345458984375, 0.1404266357421875, 0.1455078125, 0.1505889892578125, 0.155670166015625, 0.1607513427734375, 0.16583251953125, 0.1709136962890625, 0.175994873046875, 0.1810760498046875, 0.1861572265625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 12.0, 24.0, 84.0, 291.0, 355.0, 151.0, 49.0, 17.0, 12.0, 7.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9909154772758484, -0.9020388126373291, -0.8131622076034546, -0.7242856025695801, -0.6354089379310608, -0.5465322732925415, -0.457655668258667, -0.3687790036201477, -0.2799023985862732, -0.1910257637500763, -0.1021491289138794, -0.013272494077682495, 0.0756041407585144, 0.1644807755947113, 0.2533574104309082, 0.3422340750694275, 0.431110680103302, 0.5199873447418213, 0.6088639497756958, 0.6977405548095703, 0.7866172194480896, 0.8754938840866089, 0.9643704891204834, 1.0532472133636475, 1.1421236991882324, 1.231000304222107, 1.3198769092559814, 1.4087536334991455, 1.49763023853302, 1.5865068435668945, 1.6753835678100586, 1.764260172843933, 1.8531370162963867, 1.9420136213302612, 2.0308902263641357, 2.1197669506073, 2.2086434364318848, 2.297520160675049, 2.386396884918213, 2.475273609161377, 2.564150094985962, 2.653026819229126, 2.741903305053711, 2.830780029296875, 2.919656753540039, 3.008533239364624, 3.097409963607788, 3.186286449432373, 3.275163173675537, 3.364039897918701, 3.452916383743286, 3.54179310798645, 3.630669593811035, 3.719546318054199, 3.8084230422973633, 3.8972997665405273, 3.9861762523651123, 4.075052738189697, 4.163929462432861, 4.252806186676025, 4.3416829109191895, 4.4305596351623535, 4.519435882568359, 4.608312606811523, 4.6971893310546875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 7.0, 4.0, 6.0, 5.0, 11.0, 14.0, 22.0, 26.0, 25.0, 36.0, 33.0, 45.0, 47.0, 58.0, 49.0, 50.0, 77.0, 64.0, 50.0, 51.0, 52.0, 55.0, 41.0, 39.0, 32.0, 20.0, 22.0, 20.0, 12.0, 14.0, 8.0, 4.0, 1.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6463693380355835, -0.6231992840766907, -0.6000292897224426, -0.5768592357635498, -0.553689181804657, -0.5305191278457642, -0.5073491334915161, -0.4841790795326233, -0.46100902557373047, -0.43783900141716003, -0.4146689474582672, -0.3914989233016968, -0.36832886934280396, -0.3451588451862335, -0.3219888210296631, -0.29881876707077026, -0.27564874291419983, -0.2524787187576294, -0.22930866479873657, -0.20613864064216614, -0.18296858668327332, -0.15979856252670288, -0.13662852346897125, -0.11345848441123962, -0.090288445353508, -0.06711840629577637, -0.04394837096333504, -0.020778335630893707, 0.002391703426837921, 0.02556174248456955, 0.04873177409172058, 0.07190181314945221, 0.09507185220718384, 0.11824189126491547, 0.1414119303226471, 0.16458195447921753, 0.18775200843811035, 0.2109220325946808, 0.23409207165241241, 0.25726211071014404, 0.28043216466903687, 0.3036021888256073, 0.3267722427845001, 0.34994226694107056, 0.3731123208999634, 0.3962823450565338, 0.41945236921310425, 0.44262242317199707, 0.4657924473285675, 0.48896247148513794, 0.5121325254440308, 0.5353025794029236, 0.5584725737571716, 0.5816426277160645, 0.6048126816749573, 0.6279827356338501, 0.6511527299880981, 0.674322783946991, 0.697492778301239, 0.7206628322601318, 0.7438328862190247, 0.7670029401779175, 0.7901729345321655, 0.8133429884910583, 0.8365130424499512]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 10.0, 10.0, 19.0, 24.0, 34.0, 39.0, 70.0, 90.0, 165.0, 234.0, 440.0, 783.0, 1521.0, 2917.0, 5558.0, 12210.0, 29696.0, 84013.0, 305158.0, 413463.0, 121500.0, 40010.0, 15791.0, 7275.0, 3478.0, 1731.0, 952.0, 523.0, 314.0, 180.0, 112.0, 78.0, 40.0, 31.0, 23.0, 18.0, 14.0, 10.0, 7.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.1337890625, -0.13018798828125, -0.1265869140625, -0.12298583984375, -0.119384765625, -0.11578369140625, -0.1121826171875, -0.10858154296875, -0.10498046875, -0.10137939453125, -0.0977783203125, -0.09417724609375, -0.090576171875, -0.08697509765625, -0.0833740234375, -0.07977294921875, -0.076171875, -0.07257080078125, -0.0689697265625, -0.06536865234375, -0.061767578125, -0.05816650390625, -0.0545654296875, -0.05096435546875, -0.04736328125, -0.04376220703125, -0.0401611328125, -0.03656005859375, -0.032958984375, -0.02935791015625, -0.0257568359375, -0.02215576171875, -0.0185546875, -0.01495361328125, -0.0113525390625, -0.00775146484375, -0.004150390625, -0.00054931640625, 0.0030517578125, 0.00665283203125, 0.01025390625, 0.01385498046875, 0.0174560546875, 0.02105712890625, 0.024658203125, 0.02825927734375, 0.0318603515625, 0.03546142578125, 0.0390625, 0.04266357421875, 0.0462646484375, 0.04986572265625, 0.053466796875, 0.05706787109375, 0.0606689453125, 0.06427001953125, 0.06787109375, 0.07147216796875, 0.0750732421875, 0.07867431640625, 0.082275390625, 0.08587646484375, 0.0894775390625, 0.09307861328125, 0.0966796875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 3.0, 2.0, 7.0, 14.0, 9.0, 19.0, 15.0, 25.0, 23.0, 21.0, 30.0, 27.0, 41.0, 33.0, 50.0, 52.0, 60.0, 40.0, 44.0, 59.0, 58.0, 37.0, 51.0, 39.0, 43.0, 30.0, 26.0, 21.0, 29.0, 14.0, 16.0, 15.0, 10.0, 11.0, 9.0, 6.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039093017578125, -0.03761863708496094, -0.036144256591796875, -0.03466987609863281, -0.03319549560546875, -0.03172111511230469, -0.030246734619140625, -0.028772354125976562, -0.0272979736328125, -0.025823593139648438, -0.024349212646484375, -0.022874832153320312, -0.02140045166015625, -0.019926071166992188, -0.018451690673828125, -0.016977310180664062, -0.0155029296875, -0.014028549194335938, -0.012554168701171875, -0.011079788208007812, -0.00960540771484375, -0.008131027221679688, -0.006656646728515625, -0.0051822662353515625, -0.0037078857421875, -0.0022335052490234375, -0.000759124755859375, 0.0007152557373046875, 0.00218963623046875, 0.0036640167236328125, 0.005138397216796875, 0.0066127777099609375, 0.008087158203125, 0.009561538696289062, 0.011035919189453125, 0.012510299682617188, 0.01398468017578125, 0.015459060668945312, 0.016933441162109375, 0.018407821655273438, 0.0198822021484375, 0.021356582641601562, 0.022830963134765625, 0.024305343627929688, 0.02577972412109375, 0.027254104614257812, 0.028728485107421875, 0.030202865600585938, 0.03167724609375, 0.03315162658691406, 0.034626007080078125, 0.03610038757324219, 0.03757476806640625, 0.03904914855957031, 0.040523529052734375, 0.04199790954589844, 0.0434722900390625, 0.04494667053222656, 0.046421051025390625, 0.04789543151855469, 0.04936981201171875, 0.05084419250488281, 0.052318572998046875, 0.05379295349121094, 0.055267333984375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 8.0, 8.0, 7.0, 12.0, 15.0, 31.0, 54.0, 86.0, 110.0, 192.0, 311.0, 522.0, 1045.0, 2342.0, 7103.0, 37704.0, 661829.0, 303899.0, 23954.0, 5345.0, 1886.0, 925.0, 465.0, 256.0, 162.0, 92.0, 51.0, 54.0, 28.0, 23.0, 15.0, 9.0, 9.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2493896484375, -0.24224090576171875, -0.2350921630859375, -0.22794342041015625, -0.220794677734375, -0.21364593505859375, -0.2064971923828125, -0.19934844970703125, -0.19219970703125, -0.18505096435546875, -0.1779022216796875, -0.17075347900390625, -0.163604736328125, -0.15645599365234375, -0.1493072509765625, -0.14215850830078125, -0.135009765625, -0.12786102294921875, -0.1207122802734375, -0.11356353759765625, -0.106414794921875, -0.09926605224609375, -0.0921173095703125, -0.08496856689453125, -0.07781982421875, -0.07067108154296875, -0.0635223388671875, -0.05637359619140625, -0.049224853515625, -0.04207611083984375, -0.0349273681640625, -0.02777862548828125, -0.0206298828125, -0.01348114013671875, -0.0063323974609375, 0.00081634521484375, 0.007965087890625, 0.01511383056640625, 0.0222625732421875, 0.02941131591796875, 0.03656005859375, 0.04370880126953125, 0.0508575439453125, 0.05800628662109375, 0.065155029296875, 0.07230377197265625, 0.0794525146484375, 0.08660125732421875, 0.09375, 0.10089874267578125, 0.1080474853515625, 0.11519622802734375, 0.122344970703125, 0.12949371337890625, 0.1366424560546875, 0.14379119873046875, 0.15093994140625, 0.15808868408203125, 0.1652374267578125, 0.17238616943359375, 0.179534912109375, 0.18668365478515625, 0.1938323974609375, 0.20098114013671875, 0.2081298828125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 2.0, 3.0, 6.0, 8.0, 7.0, 17.0, 16.0, 7.0, 22.0, 25.0, 20.0, 29.0, 44.0, 45.0, 62.0, 58.0, 78.0, 62.0, 67.0, 54.0, 50.0, 57.0, 37.0, 51.0, 36.0, 22.0, 38.0, 23.0, 16.0, 13.0, 10.0, 10.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2310791015625, -0.2233448028564453, -0.21561050415039062, -0.20787620544433594, -0.20014190673828125, -0.19240760803222656, -0.18467330932617188, -0.1769390106201172, -0.1692047119140625, -0.1614704132080078, -0.15373611450195312, -0.14600181579589844, -0.13826751708984375, -0.13053321838378906, -0.12279891967773438, -0.11506462097167969, -0.107330322265625, -0.09959602355957031, -0.09186172485351562, -0.08412742614746094, -0.07639312744140625, -0.06865882873535156, -0.060924530029296875, -0.05319023132324219, -0.0454559326171875, -0.03772163391113281, -0.029987335205078125, -0.022253036499023438, -0.01451873779296875, -0.0067844390869140625, 0.000949859619140625, 0.008684158325195312, 0.01641845703125, 0.024152755737304688, 0.031887054443359375, 0.03962135314941406, 0.04735565185546875, 0.05508995056152344, 0.06282424926757812, 0.07055854797363281, 0.0782928466796875, 0.08602714538574219, 0.09376144409179688, 0.10149574279785156, 0.10923004150390625, 0.11696434020996094, 0.12469863891601562, 0.1324329376220703, 0.140167236328125, 0.1479015350341797, 0.15563583374023438, 0.16337013244628906, 0.17110443115234375, 0.17883872985839844, 0.18657302856445312, 0.1943073272705078, 0.2020416259765625, 0.2097759246826172, 0.21751022338867188, 0.22524452209472656, 0.23297882080078125, 0.24071311950683594, 0.24844741821289062, 0.2561817169189453, 0.263916015625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 3.0, 5.0, 9.0, 17.0, 22.0, 47.0, 64.0, 96.0, 174.0, 340.0, 650.0, 1448.0, 3890.0, 13165.0, 81819.0, 820644.0, 103727.0, 15203.0, 4216.0, 1558.0, 648.0, 312.0, 176.0, 135.0, 60.0, 40.0, 28.0, 14.0, 12.0, 9.0, 3.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.11456298828125, -0.11114788055419922, -0.10773277282714844, -0.10431766510009766, -0.10090255737304688, -0.0974874496459961, -0.09407234191894531, -0.09065723419189453, -0.08724212646484375, -0.08382701873779297, -0.08041191101074219, -0.0769968032836914, -0.07358169555664062, -0.07016658782958984, -0.06675148010253906, -0.06333637237548828, -0.0599212646484375, -0.05650615692138672, -0.05309104919433594, -0.049675941467285156, -0.046260833740234375, -0.042845726013183594, -0.03943061828613281, -0.03601551055908203, -0.03260040283203125, -0.02918529510498047, -0.025770187377929688, -0.022355079650878906, -0.018939971923828125, -0.015524864196777344, -0.012109756469726562, -0.008694648742675781, -0.005279541015625, -0.0018644332885742188, 0.0015506744384765625, 0.004965782165527344, 0.008380889892578125, 0.011795997619628906, 0.015211105346679688, 0.01862621307373047, 0.02204132080078125, 0.02545642852783203, 0.028871536254882812, 0.032286643981933594, 0.035701751708984375, 0.039116859436035156, 0.04253196716308594, 0.04594707489013672, 0.0493621826171875, 0.05277729034423828, 0.05619239807128906, 0.059607505798339844, 0.06302261352539062, 0.0664377212524414, 0.06985282897949219, 0.07326793670654297, 0.07668304443359375, 0.08009815216064453, 0.08351325988769531, 0.0869283676147461, 0.09034347534179688, 0.09375858306884766, 0.09717369079589844, 0.10058879852294922, 0.10400390625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 5.0, 2.0, 5.0, 2.0, 7.0, 7.0, 14.0, 9.0, 18.0, 33.0, 34.0, 45.0, 80.0, 134.0, 145.0, 140.0, 100.0, 61.0, 35.0, 37.0, 20.0, 19.0, 10.0, 8.0, 10.0, 6.0, 7.0, 3.0, 9.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.334615707397461e-05, -5.212612450122833e-05, -5.0906091928482056e-05, -4.968605935573578e-05, -4.84660267829895e-05, -4.7245994210243225e-05, -4.602596163749695e-05, -4.480592906475067e-05, -4.3585896492004395e-05, -4.236586391925812e-05, -4.114583134651184e-05, -3.9925798773765564e-05, -3.870576620101929e-05, -3.748573362827301e-05, -3.6265701055526733e-05, -3.5045668482780457e-05, -3.382563591003418e-05, -3.26056033372879e-05, -3.1385570764541626e-05, -3.016553819179535e-05, -2.8945505619049072e-05, -2.7725473046302795e-05, -2.650544047355652e-05, -2.5285407900810242e-05, -2.4065375328063965e-05, -2.2845342755317688e-05, -2.162531018257141e-05, -2.0405277609825134e-05, -1.9185245037078857e-05, -1.796521246433258e-05, -1.6745179891586304e-05, -1.5525147318840027e-05, -1.430511474609375e-05, -1.3085082173347473e-05, -1.1865049600601196e-05, -1.064501702785492e-05, -9.424984455108643e-06, -8.204951882362366e-06, -6.984919309616089e-06, -5.764886736869812e-06, -4.544854164123535e-06, -3.3248215913772583e-06, -2.1047890186309814e-06, -8.847564458847046e-07, 3.3527612686157227e-07, 1.5553086996078491e-06, 2.775341272354126e-06, 3.995373845100403e-06, 5.21540641784668e-06, 6.4354389905929565e-06, 7.655471563339233e-06, 8.87550413608551e-06, 1.0095536708831787e-05, 1.1315569281578064e-05, 1.253560185432434e-05, 1.3755634427070618e-05, 1.4975666999816895e-05, 1.619569957256317e-05, 1.7415732145309448e-05, 1.8635764718055725e-05, 1.9855797290802002e-05, 2.107582986354828e-05, 2.2295862436294556e-05, 2.3515895009040833e-05, 2.473592758178711e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 4.0, 5.0, 2.0, 5.0, 4.0, 2.0, 11.0, 12.0, 14.0, 24.0, 36.0, 43.0, 45.0, 79.0, 174.0, 244.0, 467.0, 946.0, 2280.0, 7245.0, 39671.0, 702855.0, 265547.0, 20588.0, 4805.0, 1698.0, 789.0, 373.0, 189.0, 123.0, 88.0, 53.0, 34.0, 30.0, 19.0, 13.0, 11.0, 6.0, 9.0, 4.0, 6.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.12548828125, -0.12208175659179688, -0.11867523193359375, -0.11526870727539062, -0.1118621826171875, -0.10845565795898438, -0.10504913330078125, -0.10164260864257812, -0.098236083984375, -0.09482955932617188, -0.09142303466796875, -0.08801651000976562, -0.0846099853515625, -0.08120346069335938, -0.07779693603515625, -0.07439041137695312, -0.07098388671875, -0.06757736206054688, -0.06417083740234375, -0.060764312744140625, -0.0573577880859375, -0.053951263427734375, -0.05054473876953125, -0.047138214111328125, -0.043731689453125, -0.040325164794921875, -0.03691864013671875, -0.033512115478515625, -0.0301055908203125, -0.026699066162109375, -0.02329254150390625, -0.019886016845703125, -0.0164794921875, -0.013072967529296875, -0.00966644287109375, -0.006259918212890625, -0.0028533935546875, 0.000553131103515625, 0.00395965576171875, 0.007366180419921875, 0.010772705078125, 0.014179229736328125, 0.01758575439453125, 0.020992279052734375, 0.0243988037109375, 0.027805328369140625, 0.03121185302734375, 0.034618377685546875, 0.03802490234375, 0.041431427001953125, 0.04483795166015625, 0.048244476318359375, 0.0516510009765625, 0.055057525634765625, 0.05846405029296875, 0.061870574951171875, 0.065277099609375, 0.06868362426757812, 0.07209014892578125, 0.07549667358398438, 0.0789031982421875, 0.08230972290039062, 0.08571624755859375, 0.08912277221679688, 0.092529296875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 2.0, 6.0, 7.0, 6.0, 11.0, 8.0, 10.0, 13.0, 26.0, 34.0, 36.0, 56.0, 73.0, 77.0, 91.0, 96.0, 89.0, 86.0, 71.0, 53.0, 20.0, 28.0, 22.0, 12.0, 15.0, 9.0, 5.0, 11.0, 2.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.07025146484375, -0.06768798828125, -0.06512451171875, -0.06256103515625, -0.05999755859375, -0.05743408203125, -0.05487060546875, -0.05230712890625, -0.04974365234375, -0.04718017578125, -0.04461669921875, -0.04205322265625, -0.03948974609375, -0.03692626953125, -0.03436279296875, -0.03179931640625, -0.02923583984375, -0.02667236328125, -0.02410888671875, -0.02154541015625, -0.01898193359375, -0.01641845703125, -0.01385498046875, -0.01129150390625, -0.00872802734375, -0.00616455078125, -0.00360107421875, -0.00103759765625, 0.00152587890625, 0.00408935546875, 0.00665283203125, 0.00921630859375, 0.01177978515625, 0.01434326171875, 0.01690673828125, 0.01947021484375, 0.02203369140625, 0.02459716796875, 0.02716064453125, 0.02972412109375, 0.03228759765625, 0.03485107421875, 0.03741455078125, 0.03997802734375, 0.04254150390625, 0.04510498046875, 0.04766845703125, 0.05023193359375, 0.05279541015625, 0.05535888671875, 0.05792236328125, 0.06048583984375, 0.06304931640625, 0.06561279296875, 0.06817626953125, 0.07073974609375, 0.07330322265625, 0.07586669921875, 0.07843017578125, 0.08099365234375, 0.08355712890625, 0.08612060546875, 0.08868408203125, 0.09124755859375, 0.09381103515625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 19.0, 76.0, 279.0, 420.0, 147.0, 37.0, 7.0, 6.0, 3.0, 2.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.326026201248169, -3.212735891342163, -3.0994455814361572, -2.9861555099487305, -2.8728652000427246, -2.7595748901367188, -2.646284580230713, -2.532994270324707, -2.419703960418701, -2.3064136505126953, -2.1931233406066895, -2.0798330307006836, -1.9665428400039673, -1.853252649307251, -1.7399623394012451, -1.6266720294952393, -1.513381838798523, -1.400091528892517, -1.2868013381958008, -1.173511028289795, -1.060220718383789, -0.946930468082428, -0.8336402177810669, -0.720349907875061, -0.6070596575737, -0.4937693774700165, -0.380479097366333, -0.2671888470649719, -0.15389856696128845, -0.04060828685760498, 0.0726819634437561, 0.18597227334976196, 0.29926252365112305, 0.4125528037548065, 0.52584308385849, 0.6391333341598511, 0.7524236440658569, 0.865713894367218, 0.9790041446685791, 1.092294454574585, 1.2055847644805908, 1.3188750743865967, 1.432165265083313, 1.5454555749893188, 1.6587458848953247, 1.772036075592041, 1.8853263854980469, 1.9986166954040527, 2.1119070053100586, 2.2251973152160645, 2.3384876251220703, 2.451777935028076, 2.565068006515503, 2.678358316421509, 2.7916486263275146, 2.9049389362335205, 3.0182290077209473, 3.131519317626953, 3.244809627532959, 3.358099937438965, 3.4713900089263916, 3.5846803188323975, 3.6979706287384033, 3.811260938644409, 3.924551248550415]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 6.0, 6.0, 8.0, 22.0, 20.0, 25.0, 41.0, 45.0, 45.0, 58.0, 62.0, 72.0, 86.0, 92.0, 82.0, 60.0, 74.0, 51.0, 37.0, 23.0, 29.0, 19.0, 8.0, 12.0, 9.0, 4.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.7596783638000488, -1.7197473049163818, -1.6798162460327148, -1.6398853063583374, -1.5999542474746704, -1.5600231885910034, -1.520092248916626, -1.480161190032959, -1.440230131149292, -1.400299072265625, -1.360368013381958, -1.3204370737075806, -1.2805060148239136, -1.2405749559402466, -1.2006440162658691, -1.1607129573822021, -1.1207818984985352, -1.0808508396148682, -1.0409197807312012, -1.0009888410568237, -0.9610577821731567, -0.9211267232894897, -0.8811957240104675, -0.8412647247314453, -0.8013336658477783, -0.7614026069641113, -0.7214716076850891, -0.6815406084060669, -0.6416095495223999, -0.6016784906387329, -0.5617474913597107, -0.5218164920806885, -0.4818854331970215, -0.4419544041156769, -0.4020233750343323, -0.36209234595298767, -0.32216131687164307, -0.28223028779029846, -0.24229925870895386, -0.20236822962760925, -0.16243720054626465, -0.12250617146492004, -0.08257514238357544, -0.042644113302230835, -0.0027130842208862305, 0.037217944860458374, 0.07714897394180298, 0.11708000302314758, 0.1570110321044922, 0.1969420611858368, 0.2368730902671814, 0.276804119348526, 0.3167351484298706, 0.3566661775112152, 0.3965972065925598, 0.4365282356739044, 0.476459264755249, 0.516390323638916, 0.5563213229179382, 0.5962523221969604, 0.6361833810806274, 0.6761144399642944, 0.7160454392433167, 0.7559764385223389, 0.7959074974060059]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 6.0, 9.0, 5.0, 3.0, 15.0, 14.0, 21.0, 18.0, 23.0, 45.0, 70.0, 112.0, 191.0, 375.0, 747.0, 1634.0, 4933.0, 21573.0, 368006.0, 3702071.0, 78213.0, 10886.0, 3121.0, 1087.0, 480.0, 251.0, 133.0, 71.0, 50.0, 31.0, 13.0, 13.0, 15.0, 6.0, 13.0, 9.0, 6.0, 4.0, 2.0, 0.0, 4.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1695556640625, -0.1635608673095703, -0.15756607055664062, -0.15157127380371094, -0.14557647705078125, -0.13958168029785156, -0.13358688354492188, -0.1275920867919922, -0.1215972900390625, -0.11560249328613281, -0.10960769653320312, -0.10361289978027344, -0.09761810302734375, -0.09162330627441406, -0.08562850952148438, -0.07963371276855469, -0.073638916015625, -0.06764411926269531, -0.061649322509765625, -0.05565452575683594, -0.04965972900390625, -0.04366493225097656, -0.037670135498046875, -0.03167533874511719, -0.0256805419921875, -0.019685745239257812, -0.013690948486328125, -0.0076961517333984375, -0.00170135498046875, 0.0042934417724609375, 0.010288238525390625, 0.016283035278320312, 0.02227783203125, 0.028272628784179688, 0.034267425537109375, 0.04026222229003906, 0.04625701904296875, 0.05225181579589844, 0.058246612548828125, 0.06424140930175781, 0.0702362060546875, 0.07623100280761719, 0.08222579956054688, 0.08822059631347656, 0.09421539306640625, 0.10021018981933594, 0.10620498657226562, 0.11219978332519531, 0.118194580078125, 0.12418937683105469, 0.13018417358398438, 0.13617897033691406, 0.14217376708984375, 0.14816856384277344, 0.15416336059570312, 0.1601581573486328, 0.1661529541015625, 0.1721477508544922, 0.17814254760742188, 0.18413734436035156, 0.19013214111328125, 0.19612693786621094, 0.20212173461914062, 0.2081165313720703, 0.214111328125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 8.0, 14.0, 24.0, 27.0, 28.0, 49.0, 53.0, 59.0, 73.0, 67.0, 75.0, 68.0, 84.0, 80.0, 74.0, 56.0, 31.0, 31.0, 40.0, 26.0, 11.0, 10.0, 4.0, 10.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09393310546875, -0.09165096282958984, -0.08936882019042969, -0.08708667755126953, -0.08480453491210938, -0.08252239227294922, -0.08024024963378906, -0.0779581069946289, -0.07567596435546875, -0.0733938217163086, -0.07111167907714844, -0.06882953643798828, -0.06654739379882812, -0.06426525115966797, -0.06198310852050781, -0.059700965881347656, -0.0574188232421875, -0.055136680603027344, -0.05285453796386719, -0.05057239532470703, -0.048290252685546875, -0.04600811004638672, -0.04372596740722656, -0.041443824768066406, -0.03916168212890625, -0.036879539489746094, -0.03459739685058594, -0.03231525421142578, -0.030033111572265625, -0.02775096893310547, -0.025468826293945312, -0.023186683654785156, -0.020904541015625, -0.018622398376464844, -0.016340255737304688, -0.014058113098144531, -0.011775970458984375, -0.009493827819824219, -0.0072116851806640625, -0.004929542541503906, -0.00264739990234375, -0.00036525726318359375, 0.0019168853759765625, 0.004199028015136719, 0.006481170654296875, 0.008763313293457031, 0.011045455932617188, 0.013327598571777344, 0.0156097412109375, 0.017891883850097656, 0.020174026489257812, 0.02245616912841797, 0.024738311767578125, 0.02702045440673828, 0.029302597045898438, 0.031584739685058594, 0.03386688232421875, 0.036149024963378906, 0.03843116760253906, 0.04071331024169922, 0.042995452880859375, 0.04527759552001953, 0.04755973815917969, 0.049841880798339844, 0.0521240234375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 7.0, 10.0, 21.0, 23.0, 33.0, 56.0, 96.0, 159.0, 293.0, 604.0, 1361.0, 3579.0, 11957.0, 50433.0, 444832.0, 3413794.0, 216734.0, 35075.0, 9344.0, 3152.0, 1268.0, 615.0, 318.0, 185.0, 124.0, 64.0, 48.0, 30.0, 29.0, 15.0, 7.0, 7.0, 2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.173095703125, -0.1683368682861328, -0.16357803344726562, -0.15881919860839844, -0.15406036376953125, -0.14930152893066406, -0.14454269409179688, -0.1397838592529297, -0.1350250244140625, -0.1302661895751953, -0.12550735473632812, -0.12074851989746094, -0.11598968505859375, -0.11123085021972656, -0.10647201538085938, -0.10171318054199219, -0.096954345703125, -0.09219551086425781, -0.08743667602539062, -0.08267784118652344, -0.07791900634765625, -0.07316017150878906, -0.06840133666992188, -0.06364250183105469, -0.0588836669921875, -0.05412483215332031, -0.049365997314453125, -0.04460716247558594, -0.03984832763671875, -0.03508949279785156, -0.030330657958984375, -0.025571823120117188, -0.02081298828125, -0.016054153442382812, -0.011295318603515625, -0.0065364837646484375, -0.00177764892578125, 0.0029811859130859375, 0.007740020751953125, 0.012498855590820312, 0.0172576904296875, 0.022016525268554688, 0.026775360107421875, 0.03153419494628906, 0.03629302978515625, 0.04105186462402344, 0.045810699462890625, 0.05056953430175781, 0.055328369140625, 0.06008720397949219, 0.06484603881835938, 0.06960487365722656, 0.07436370849609375, 0.07912254333496094, 0.08388137817382812, 0.08864021301269531, 0.0933990478515625, 0.09815788269042969, 0.10291671752929688, 0.10767555236816406, 0.11243438720703125, 0.11719322204589844, 0.12195205688476562, 0.1267108917236328, 0.1314697265625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 6.0, 2.0, 1.0, 4.0, 6.0, 4.0, 8.0, 10.0, 13.0, 12.0, 22.0, 32.0, 43.0, 68.0, 93.0, 163.0, 319.0, 581.0, 996.0, 726.0, 375.0, 204.0, 111.0, 76.0, 51.0, 28.0, 30.0, 22.0, 21.0, 11.0, 7.0, 15.0, 6.0, 5.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08795166015625, -0.08370304107666016, -0.07945442199707031, -0.07520580291748047, -0.07095718383789062, -0.06670856475830078, -0.06245994567871094, -0.058211326599121094, -0.05396270751953125, -0.049714088439941406, -0.04546546936035156, -0.04121685028076172, -0.036968231201171875, -0.03271961212158203, -0.028470993041992188, -0.024222373962402344, -0.0199737548828125, -0.015725135803222656, -0.011476516723632812, -0.007227897644042969, -0.002979278564453125, 0.0012693405151367188, 0.0055179595947265625, 0.009766578674316406, 0.01401519775390625, 0.018263816833496094, 0.022512435913085938, 0.02676105499267578, 0.031009674072265625, 0.03525829315185547, 0.03950691223144531, 0.043755531311035156, 0.048004150390625, 0.052252769470214844, 0.05650138854980469, 0.06075000762939453, 0.06499862670898438, 0.06924724578857422, 0.07349586486816406, 0.0777444839477539, 0.08199310302734375, 0.0862417221069336, 0.09049034118652344, 0.09473896026611328, 0.09898757934570312, 0.10323619842529297, 0.10748481750488281, 0.11173343658447266, 0.1159820556640625, 0.12023067474365234, 0.12447929382324219, 0.12872791290283203, 0.13297653198242188, 0.13722515106201172, 0.14147377014160156, 0.1457223892211914, 0.14997100830078125, 0.1542196273803711, 0.15846824645996094, 0.16271686553955078, 0.16696548461914062, 0.17121410369873047, 0.1754627227783203, 0.17971134185791016, 0.1839599609375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 5.0, 19.0, 32.0, 67.0, 177.0, 249.0, 218.0, 111.0, 48.0, 32.0, 17.0, 5.0, 9.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.702487051486969, -0.6507090926170349, -0.598931074142456, -0.547153115272522, -0.4953750967979431, -0.44359713792800903, -0.39181914925575256, -0.3400411605834961, -0.2882631719112396, -0.23648518323898315, -0.18470719456672668, -0.1329292207956314, -0.08115123212337494, -0.029373258352279663, 0.022404730319976807, 0.07418271899223328, 0.12596070766448975, 0.17773869633674622, 0.22951668500900269, 0.28129464387893677, 0.3330726623535156, 0.3848506212234497, 0.4366286098957062, 0.48840659856796265, 0.5401846170425415, 0.5919625759124756, 0.6437405943870544, 0.6955185532569885, 0.7472965717315674, 0.7990745306015015, 0.8508524894714355, 0.9026305079460144, 0.9544085264205933, 1.0061864852905273, 1.0579644441604614, 1.109742522239685, 1.1615204811096191, 1.2132984399795532, 1.2650763988494873, 1.316854476928711, 1.368632435798645, 1.420410394668579, 1.4721883535385132, 1.5239664316177368, 1.575744390487671, 1.627522349357605, 1.679300308227539, 1.7310783863067627, 1.7828562259674072, 1.8346341848373413, 1.8864121437072754, 1.938190221786499, 1.989968180656433, 2.041746139526367, 2.093524217605591, 2.1453020572662354, 2.197080135345459, 2.2488582134246826, 2.300636053085327, 2.352414131164551, 2.4041919708251953, 2.455970048904419, 2.5077481269836426, 2.559525966644287, 2.6113040447235107]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 2.0, 3.0, 5.0, 9.0, 9.0, 8.0, 9.0, 12.0, 17.0, 21.0, 23.0, 26.0, 29.0, 40.0, 33.0, 27.0, 47.0, 47.0, 42.0, 40.0, 50.0, 52.0, 42.0, 34.0, 38.0, 43.0, 37.0, 34.0, 31.0, 28.0, 26.0, 24.0, 16.0, 11.0, 17.0, 10.0, 10.0, 15.0, 13.0, 11.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5210294723510742, -0.5037463307380676, -0.48646318912506104, -0.46918004751205444, -0.45189690589904785, -0.43461376428604126, -0.41733065247535706, -0.40004751086235046, -0.38276436924934387, -0.3654812276363373, -0.3481980860233307, -0.3309149444103241, -0.3136318325996399, -0.2963486909866333, -0.2790655493736267, -0.2617824077606201, -0.24449926614761353, -0.22721612453460693, -0.20993298292160034, -0.19264985620975494, -0.17536671459674835, -0.15808357298374176, -0.14080044627189636, -0.12351730465888977, -0.10623416304588318, -0.08895102143287659, -0.07166788727045059, -0.0543847493827343, -0.037101611495018005, -0.019818469882011414, -0.0025353357195854187, 0.014747798442840576, 0.03203094005584717, 0.04931407794356346, 0.06659721583127975, 0.08388034999370575, 0.10116349160671234, 0.11844663321971893, 0.13572975993156433, 0.15301290154457092, 0.17029604315757751, 0.1875791847705841, 0.2048623263835907, 0.2221454530954361, 0.2394285947084427, 0.2567117214202881, 0.2739948630332947, 0.29127800464630127, 0.30856114625930786, 0.32584428787231445, 0.34312742948532104, 0.36041057109832764, 0.37769371271133423, 0.3949768543243408, 0.412259966135025, 0.4295431077480316, 0.4468262493610382, 0.4641093909740448, 0.4813925325870514, 0.498675674200058, 0.5159587860107422, 0.5332419276237488, 0.5505250692367554, 0.567808210849762, 0.5850913524627686]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 8.0, 6.0, 9.0, 13.0, 19.0, 34.0, 39.0, 57.0, 83.0, 130.0, 194.0, 288.0, 474.0, 758.0, 1418.0, 2457.0, 4791.0, 9855.0, 22748.0, 62084.0, 225608.0, 474771.0, 159532.0, 47371.0, 18277.0, 8219.0, 4033.0, 2201.0, 1233.0, 679.0, 391.0, 268.0, 142.0, 104.0, 75.0, 47.0, 50.0, 28.0, 19.0, 13.0, 9.0, 5.0, 4.0, 3.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.11395263671875, -0.11053848266601562, -0.10712432861328125, -0.10371017456054688, -0.1002960205078125, -0.09688186645507812, -0.09346771240234375, -0.09005355834960938, -0.086639404296875, -0.08322525024414062, -0.07981109619140625, -0.07639694213867188, -0.0729827880859375, -0.06956863403320312, -0.06615447998046875, -0.06274032592773438, -0.059326171875, -0.055912017822265625, -0.05249786376953125, -0.049083709716796875, -0.0456695556640625, -0.042255401611328125, -0.03884124755859375, -0.035427093505859375, -0.032012939453125, -0.028598785400390625, -0.02518463134765625, -0.021770477294921875, -0.0183563232421875, -0.014942169189453125, -0.01152801513671875, -0.008113861083984375, -0.00469970703125, -0.001285552978515625, 0.00212860107421875, 0.005542755126953125, 0.0089569091796875, 0.012371063232421875, 0.01578521728515625, 0.019199371337890625, 0.022613525390625, 0.026027679443359375, 0.02944183349609375, 0.032855987548828125, 0.0362701416015625, 0.039684295654296875, 0.04309844970703125, 0.046512603759765625, 0.0499267578125, 0.053340911865234375, 0.05675506591796875, 0.060169219970703125, 0.0635833740234375, 0.06699752807617188, 0.07041168212890625, 0.07382583618164062, 0.077239990234375, 0.08065414428710938, 0.08406829833984375, 0.08748245239257812, 0.0908966064453125, 0.09431076049804688, 0.09772491455078125, 0.10113906860351562, 0.10455322265625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 4.0, 6.0, 9.0, 8.0, 9.0, 15.0, 19.0, 15.0, 28.0, 35.0, 29.0, 39.0, 37.0, 38.0, 36.0, 45.0, 59.0, 52.0, 58.0, 48.0, 55.0, 45.0, 32.0, 42.0, 44.0, 35.0, 39.0, 37.0, 23.0, 15.0, 12.0, 4.0, 4.0, 7.0, 9.0, 3.0, 2.0, 5.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.058685302734375, -0.057065486907958984, -0.05544567108154297, -0.05382585525512695, -0.05220603942871094, -0.05058622360229492, -0.048966407775878906, -0.04734659194946289, -0.045726776123046875, -0.04410696029663086, -0.042487144470214844, -0.04086732864379883, -0.03924751281738281, -0.0376276969909668, -0.03600788116455078, -0.034388065338134766, -0.03276824951171875, -0.031148433685302734, -0.02952861785888672, -0.027908802032470703, -0.026288986206054688, -0.024669170379638672, -0.023049354553222656, -0.02142953872680664, -0.019809722900390625, -0.01818990707397461, -0.016570091247558594, -0.014950275421142578, -0.013330459594726562, -0.011710643768310547, -0.010090827941894531, -0.008471012115478516, -0.0068511962890625, -0.005231380462646484, -0.0036115646362304688, -0.001991748809814453, -0.0003719329833984375, 0.0012478828430175781, 0.0028676986694335938, 0.004487514495849609, 0.006107330322265625, 0.007727146148681641, 0.009346961975097656, 0.010966777801513672, 0.012586593627929688, 0.014206409454345703, 0.01582622528076172, 0.017446041107177734, 0.01906585693359375, 0.020685672760009766, 0.02230548858642578, 0.023925304412841797, 0.025545120239257812, 0.027164936065673828, 0.028784751892089844, 0.03040456771850586, 0.032024383544921875, 0.03364419937133789, 0.035264015197753906, 0.03688383102416992, 0.03850364685058594, 0.04012346267700195, 0.04174327850341797, 0.043363094329833984, 0.04498291015625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 1.0, 1.0, 9.0, 8.0, 13.0, 9.0, 11.0, 28.0, 36.0, 69.0, 102.0, 170.0, 310.0, 620.0, 1480.0, 4276.0, 19362.0, 174885.0, 773766.0, 59410.0, 9295.0, 2609.0, 1025.0, 451.0, 252.0, 128.0, 70.0, 48.0, 36.0, 23.0, 16.0, 15.0, 6.0, 6.0, 7.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2423095703125, -0.2348041534423828, -0.22729873657226562, -0.21979331970214844, -0.21228790283203125, -0.20478248596191406, -0.19727706909179688, -0.1897716522216797, -0.1822662353515625, -0.1747608184814453, -0.16725540161132812, -0.15974998474121094, -0.15224456787109375, -0.14473915100097656, -0.13723373413085938, -0.1297283172607422, -0.122222900390625, -0.11471748352050781, -0.10721206665039062, -0.09970664978027344, -0.09220123291015625, -0.08469581604003906, -0.07719039916992188, -0.06968498229980469, -0.0621795654296875, -0.05467414855957031, -0.047168731689453125, -0.03966331481933594, -0.03215789794921875, -0.024652481079101562, -0.017147064208984375, -0.009641647338867188, -0.00213623046875, 0.0053691864013671875, 0.012874603271484375, 0.020380020141601562, 0.02788543701171875, 0.03539085388183594, 0.042896270751953125, 0.05040168762207031, 0.0579071044921875, 0.06541252136230469, 0.07291793823242188, 0.08042335510253906, 0.08792877197265625, 0.09543418884277344, 0.10293960571289062, 0.11044502258300781, 0.117950439453125, 0.1254558563232422, 0.13296127319335938, 0.14046669006347656, 0.14797210693359375, 0.15547752380371094, 0.16298294067382812, 0.1704883575439453, 0.1779937744140625, 0.1854991912841797, 0.19300460815429688, 0.20051002502441406, 0.20801544189453125, 0.21552085876464844, 0.22302627563476562, 0.2305316925048828, 0.238037109375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 3.0, 6.0, 5.0, 4.0, 9.0, 10.0, 14.0, 14.0, 23.0, 22.0, 29.0, 34.0, 36.0, 48.0, 42.0, 40.0, 44.0, 44.0, 59.0, 54.0, 55.0, 56.0, 52.0, 48.0, 36.0, 36.0, 35.0, 18.0, 21.0, 18.0, 18.0, 13.0, 10.0, 7.0, 8.0, 7.0, 5.0, 8.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.2470703125, -0.2401905059814453, -0.23331069946289062, -0.22643089294433594, -0.21955108642578125, -0.21267127990722656, -0.20579147338867188, -0.1989116668701172, -0.1920318603515625, -0.1851520538330078, -0.17827224731445312, -0.17139244079589844, -0.16451263427734375, -0.15763282775878906, -0.15075302124023438, -0.1438732147216797, -0.136993408203125, -0.1301136016845703, -0.12323379516601562, -0.11635398864746094, -0.10947418212890625, -0.10259437561035156, -0.09571456909179688, -0.08883476257324219, -0.0819549560546875, -0.07507514953613281, -0.06819534301757812, -0.06131553649902344, -0.05443572998046875, -0.04755592346191406, -0.040676116943359375, -0.03379631042480469, -0.02691650390625, -0.020036697387695312, -0.013156890869140625, -0.0062770843505859375, 0.00060272216796875, 0.0074825286865234375, 0.014362335205078125, 0.021242141723632812, 0.0281219482421875, 0.03500175476074219, 0.041881561279296875, 0.04876136779785156, 0.05564117431640625, 0.06252098083496094, 0.06940078735351562, 0.07628059387207031, 0.083160400390625, 0.09004020690917969, 0.09692001342773438, 0.10379981994628906, 0.11067962646484375, 0.11755943298339844, 0.12443923950195312, 0.1313190460205078, 0.1381988525390625, 0.1450786590576172, 0.15195846557617188, 0.15883827209472656, 0.16571807861328125, 0.17259788513183594, 0.17947769165039062, 0.1863574981689453, 0.1932373046875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 12.0, 13.0, 18.0, 23.0, 38.0, 65.0, 88.0, 174.0, 401.0, 919.0, 2859.0, 12238.0, 95501.0, 780448.0, 135027.0, 15459.0, 3290.0, 1023.0, 470.0, 203.0, 109.0, 66.0, 35.0, 19.0, 14.0, 10.0, 8.0, 1.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1107177734375, -0.10709571838378906, -0.10347366333007812, -0.09985160827636719, -0.09622955322265625, -0.09260749816894531, -0.08898544311523438, -0.08536338806152344, -0.0817413330078125, -0.07811927795410156, -0.07449722290039062, -0.07087516784667969, -0.06725311279296875, -0.06363105773925781, -0.060009002685546875, -0.05638694763183594, -0.052764892578125, -0.04914283752441406, -0.045520782470703125, -0.04189872741699219, -0.03827667236328125, -0.03465461730957031, -0.031032562255859375, -0.027410507202148438, -0.0237884521484375, -0.020166397094726562, -0.016544342041015625, -0.012922286987304688, -0.00930023193359375, -0.0056781768798828125, -0.002056121826171875, 0.0015659332275390625, 0.00518798828125, 0.008810043334960938, 0.012432098388671875, 0.016054153442382812, 0.01967620849609375, 0.023298263549804688, 0.026920318603515625, 0.030542373657226562, 0.0341644287109375, 0.03778648376464844, 0.041408538818359375, 0.04503059387207031, 0.04865264892578125, 0.05227470397949219, 0.055896759033203125, 0.05951881408691406, 0.063140869140625, 0.06676292419433594, 0.07038497924804688, 0.07400703430175781, 0.07762908935546875, 0.08125114440917969, 0.08487319946289062, 0.08849525451660156, 0.0921173095703125, 0.09573936462402344, 0.09936141967773438, 0.10298347473144531, 0.10660552978515625, 0.11022758483886719, 0.11384963989257812, 0.11747169494628906, 0.12109375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 1.0, 0.0, 4.0, 4.0, 4.0, 4.0, 3.0, 7.0, 14.0, 13.0, 24.0, 24.0, 36.0, 48.0, 62.0, 72.0, 83.0, 98.0, 100.0, 85.0, 77.0, 66.0, 44.0, 34.0, 18.0, 18.0, 12.0, 7.0, 13.0, 3.0, 6.0, 5.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.331899642944336e-05, -3.248453140258789e-05, -3.165006637573242e-05, -3.081560134887695e-05, -2.9981136322021484e-05, -2.9146671295166016e-05, -2.8312206268310547e-05, -2.7477741241455078e-05, -2.664327621459961e-05, -2.580881118774414e-05, -2.4974346160888672e-05, -2.4139881134033203e-05, -2.3305416107177734e-05, -2.2470951080322266e-05, -2.1636486053466797e-05, -2.0802021026611328e-05, -1.996755599975586e-05, -1.913309097290039e-05, -1.8298625946044922e-05, -1.7464160919189453e-05, -1.6629695892333984e-05, -1.5795230865478516e-05, -1.4960765838623047e-05, -1.4126300811767578e-05, -1.329183578491211e-05, -1.245737075805664e-05, -1.1622905731201172e-05, -1.0788440704345703e-05, -9.953975677490234e-06, -9.119510650634766e-06, -8.285045623779297e-06, -7.450580596923828e-06, -6.616115570068359e-06, -5.781650543212891e-06, -4.947185516357422e-06, -4.112720489501953e-06, -3.2782554626464844e-06, -2.4437904357910156e-06, -1.6093254089355469e-06, -7.748603820800781e-07, 5.960464477539063e-08, 8.940696716308594e-07, 1.7285346984863281e-06, 2.562999725341797e-06, 3.3974647521972656e-06, 4.231929779052734e-06, 5.066394805908203e-06, 5.900859832763672e-06, 6.735324859619141e-06, 7.569789886474609e-06, 8.404254913330078e-06, 9.238719940185547e-06, 1.0073184967041016e-05, 1.0907649993896484e-05, 1.1742115020751953e-05, 1.2576580047607422e-05, 1.341104507446289e-05, 1.424551010131836e-05, 1.5079975128173828e-05, 1.5914440155029297e-05, 1.6748905181884766e-05, 1.7583370208740234e-05, 1.8417835235595703e-05, 1.9252300262451172e-05, 2.008676528930664e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 6.0, 10.0, 20.0, 33.0, 43.0, 84.0, 175.0, 437.0, 1224.0, 4923.0, 41140.0, 817080.0, 168954.0, 11153.0, 2070.0, 627.0, 277.0, 117.0, 54.0, 67.0, 23.0, 14.0, 11.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09228515625, -0.08783149719238281, -0.08337783813476562, -0.07892417907714844, -0.07447052001953125, -0.07001686096191406, -0.06556320190429688, -0.06110954284667969, -0.0566558837890625, -0.05220222473144531, -0.047748565673828125, -0.04329490661621094, -0.03884124755859375, -0.03438758850097656, -0.029933929443359375, -0.025480270385742188, -0.021026611328125, -0.016572952270507812, -0.012119293212890625, -0.0076656341552734375, -0.00321197509765625, 0.0012416839599609375, 0.005695343017578125, 0.010149002075195312, 0.0146026611328125, 0.019056320190429688, 0.023509979248046875, 0.027963638305664062, 0.03241729736328125, 0.03687095642089844, 0.041324615478515625, 0.04577827453613281, 0.05023193359375, 0.05468559265136719, 0.059139251708984375, 0.06359291076660156, 0.06804656982421875, 0.07250022888183594, 0.07695388793945312, 0.08140754699707031, 0.0858612060546875, 0.09031486511230469, 0.09476852416992188, 0.09922218322753906, 0.10367584228515625, 0.10812950134277344, 0.11258316040039062, 0.11703681945800781, 0.121490478515625, 0.1259441375732422, 0.13039779663085938, 0.13485145568847656, 0.13930511474609375, 0.14375877380371094, 0.14821243286132812, 0.1526660919189453, 0.1571197509765625, 0.1615734100341797, 0.16602706909179688, 0.17048072814941406, 0.17493438720703125, 0.17938804626464844, 0.18384170532226562, 0.1882953643798828, 0.1927490234375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 1.0, 3.0, 8.0, 0.0, 3.0, 4.0, 7.0, 13.0, 9.0, 14.0, 11.0, 24.0, 16.0, 22.0, 32.0, 46.0, 34.0, 63.0, 62.0, 81.0, 71.0, 70.0, 59.0, 60.0, 38.0, 44.0, 37.0, 34.0, 24.0, 22.0, 15.0, 10.0, 12.0, 7.0, 14.0, 4.0, 9.0, 1.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.07110595703125, -0.06917905807495117, -0.06725215911865234, -0.06532526016235352, -0.06339836120605469, -0.06147146224975586, -0.05954456329345703, -0.0576176643371582, -0.055690765380859375, -0.05376386642456055, -0.05183696746826172, -0.04991006851196289, -0.04798316955566406, -0.046056270599365234, -0.044129371643066406, -0.04220247268676758, -0.04027557373046875, -0.03834867477416992, -0.036421775817871094, -0.034494876861572266, -0.03256797790527344, -0.03064107894897461, -0.02871417999267578, -0.026787281036376953, -0.024860382080078125, -0.022933483123779297, -0.02100658416748047, -0.01907968521118164, -0.017152786254882812, -0.015225887298583984, -0.013298988342285156, -0.011372089385986328, -0.0094451904296875, -0.007518291473388672, -0.005591392517089844, -0.0036644935607910156, -0.0017375946044921875, 0.00018930435180664062, 0.0021162033081054688, 0.004043102264404297, 0.005970001220703125, 0.007896900177001953, 0.009823799133300781, 0.01175069808959961, 0.013677597045898438, 0.015604496002197266, 0.017531394958496094, 0.019458293914794922, 0.02138519287109375, 0.023312091827392578, 0.025238990783691406, 0.027165889739990234, 0.029092788696289062, 0.03101968765258789, 0.03294658660888672, 0.03487348556518555, 0.036800384521484375, 0.0387272834777832, 0.04065418243408203, 0.04258108139038086, 0.04450798034667969, 0.046434879302978516, 0.048361778259277344, 0.05028867721557617, 0.052215576171875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 13.0, 30.0, 76.0, 144.0, 259.0, 234.0, 119.0, 57.0, 30.0, 13.0, 7.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.2298762798309326, -2.172567367553711, -2.1152584552764893, -2.0579495429992676, -2.000640630722046, -1.9433315992355347, -1.886022686958313, -1.8287137746810913, -1.7714048624038696, -1.714095950126648, -1.6567870378494263, -1.599478006362915, -1.5421690940856934, -1.4848601818084717, -1.42755126953125, -1.3702423572540283, -1.3129334449768066, -1.255624532699585, -1.1983156204223633, -1.1410067081451416, -1.0836976766586304, -1.0263887643814087, -0.969079852104187, -0.9117709398269653, -0.8544619083404541, -0.7971529960632324, -0.739844024181366, -0.6825351119041443, -0.6252261996269226, -0.5679172277450562, -0.5106083154678345, -0.4532994031906128, -0.3959904909133911, -0.33868154883384705, -0.28137263655662537, -0.2240636944770813, -0.16675476729869843, -0.10944584012031555, -0.052136898040771484, 0.005172014236450195, 0.06248095631599426, 0.11978988349437714, 0.17709881067276, 0.23440775275230408, 0.29171669483184814, 0.3490256071090698, 0.4063345491886139, 0.46364346146583557, 0.5209524035453796, 0.5782613158226013, 0.6355702877044678, 0.6928791999816895, 0.7501881122589111, 0.8074970245361328, 0.8648059964179993, 0.922114908695221, 0.9794238805770874, 1.036732792854309, 1.0940417051315308, 1.151350736618042, 1.2086596488952637, 1.2659685611724854, 1.323277473449707, 1.3805863857269287, 1.4378952980041504]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 0.0, 7.0, 9.0, 8.0, 5.0, 12.0, 12.0, 12.0, 12.0, 17.0, 20.0, 21.0, 17.0, 35.0, 25.0, 41.0, 36.0, 44.0, 46.0, 49.0, 62.0, 51.0, 45.0, 48.0, 44.0, 46.0, 35.0, 32.0, 29.0, 34.0, 27.0, 24.0, 20.0, 15.0, 11.0, 4.0, 11.0, 11.0, 4.0, 9.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7336015105247498, -0.7075657248497009, -0.6815299391746521, -0.6554941534996033, -0.6294583082199097, -0.6034225225448608, -0.577386736869812, -0.5513509511947632, -0.5253151655197144, -0.4992793798446655, -0.4732435941696167, -0.4472077786922455, -0.42117199301719666, -0.3951362073421478, -0.3691003918647766, -0.3430646061897278, -0.31702882051467896, -0.2909930348396301, -0.2649572491645813, -0.23892143368721008, -0.21288564801216125, -0.18684986233711243, -0.1608140617609024, -0.13477826118469238, -0.10874247550964355, -0.08270668238401413, -0.056670889258384705, -0.03063509613275528, -0.0045993030071258545, 0.021436482667922974, 0.047472283244132996, 0.07350808382034302, 0.09954386949539185, 0.12557965517044067, 0.1516154557466507, 0.17765125632286072, 0.20368704199790955, 0.22972282767295837, 0.2557586431503296, 0.2817944288253784, 0.30783021450042725, 0.3338660001754761, 0.3599017858505249, 0.3859376013278961, 0.41197338700294495, 0.4380091726779938, 0.464044988155365, 0.4900807738304138, 0.5161165595054626, 0.5421523451805115, 0.5681881308555603, 0.5942239165306091, 0.6202597618103027, 0.6462955474853516, 0.6723313331604004, 0.6983671188354492, 0.724402904510498, 0.7504386901855469, 0.7764744758605957, 0.8025102615356445, 0.8285460472106934, 0.8545818328857422, 0.8806176781654358, 0.9066534638404846, 0.9326892495155334]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 10.0, 6.0, 17.0, 11.0, 19.0, 41.0, 57.0, 89.0, 154.0, 249.0, 379.0, 633.0, 1154.0, 2127.0, 4255.0, 9212.0, 23001.0, 69972.0, 314080.0, 1936222.0, 1502900.0, 236949.0, 56726.0, 19656.0, 8150.0, 3741.0, 1896.0, 1055.0, 570.0, 373.0, 219.0, 135.0, 70.0, 66.0, 30.0, 25.0, 15.0, 10.0, 2.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.073974609375, -0.07158184051513672, -0.06918907165527344, -0.06679630279541016, -0.06440353393554688, -0.062010765075683594, -0.05961799621582031, -0.05722522735595703, -0.05483245849609375, -0.05243968963623047, -0.05004692077636719, -0.047654151916503906, -0.045261383056640625, -0.042868614196777344, -0.04047584533691406, -0.03808307647705078, -0.0356903076171875, -0.03329753875732422, -0.030904769897460938, -0.028512001037597656, -0.026119232177734375, -0.023726463317871094, -0.021333694458007812, -0.01894092559814453, -0.01654815673828125, -0.014155387878417969, -0.011762619018554688, -0.009369850158691406, -0.006977081298828125, -0.004584312438964844, -0.0021915435791015625, 0.00020122528076171875, 0.002593994140625, 0.004986763000488281, 0.0073795318603515625, 0.009772300720214844, 0.012165069580078125, 0.014557838439941406, 0.016950607299804688, 0.01934337615966797, 0.02173614501953125, 0.02412891387939453, 0.026521682739257812, 0.028914451599121094, 0.031307220458984375, 0.033699989318847656, 0.03609275817871094, 0.03848552703857422, 0.0408782958984375, 0.04327106475830078, 0.04566383361816406, 0.048056602478027344, 0.050449371337890625, 0.052842140197753906, 0.05523490905761719, 0.05762767791748047, 0.06002044677734375, 0.06241321563720703, 0.06480598449707031, 0.0671987533569336, 0.06959152221679688, 0.07198429107666016, 0.07437705993652344, 0.07676982879638672, 0.07916259765625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 9.0, 8.0, 6.0, 13.0, 20.0, 24.0, 25.0, 45.0, 40.0, 65.0, 66.0, 64.0, 56.0, 66.0, 73.0, 54.0, 63.0, 49.0, 49.0, 41.0, 39.0, 35.0, 21.0, 20.0, 13.0, 14.0, 12.0, 4.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.058013916015625, -0.056078433990478516, -0.05414295196533203, -0.05220746994018555, -0.05027198791503906, -0.04833650588989258, -0.046401023864746094, -0.04446554183959961, -0.042530059814453125, -0.04059457778930664, -0.038659095764160156, -0.03672361373901367, -0.03478813171386719, -0.0328526496887207, -0.03091716766357422, -0.028981685638427734, -0.02704620361328125, -0.025110721588134766, -0.02317523956298828, -0.021239757537841797, -0.019304275512695312, -0.017368793487548828, -0.015433311462402344, -0.01349782943725586, -0.011562347412109375, -0.00962686538696289, -0.007691383361816406, -0.005755901336669922, -0.0038204193115234375, -0.0018849372863769531, 5.054473876953125e-05, 0.0019860267639160156, 0.0039215087890625, 0.005856990814208984, 0.007792472839355469, 0.009727954864501953, 0.011663436889648438, 0.013598918914794922, 0.015534400939941406, 0.01746988296508789, 0.019405364990234375, 0.02134084701538086, 0.023276329040527344, 0.025211811065673828, 0.027147293090820312, 0.029082775115966797, 0.03101825714111328, 0.032953739166259766, 0.03488922119140625, 0.036824703216552734, 0.03876018524169922, 0.0406956672668457, 0.04263114929199219, 0.04456663131713867, 0.046502113342285156, 0.04843759536743164, 0.050373077392578125, 0.05230855941772461, 0.054244041442871094, 0.05617952346801758, 0.05811500549316406, 0.06005048751831055, 0.06198596954345703, 0.06392145156860352, 0.06585693359375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 12.0, 7.0, 15.0, 33.0, 59.0, 92.0, 174.0, 357.0, 837.0, 2199.0, 7944.0, 45736.0, 735840.0, 3252189.0, 125738.0, 16393.0, 3954.0, 1387.0, 601.0, 313.0, 165.0, 82.0, 56.0, 26.0, 27.0, 23.0, 8.0, 6.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.259033203125, -0.2524280548095703, -0.24582290649414062, -0.23921775817871094, -0.23261260986328125, -0.22600746154785156, -0.21940231323242188, -0.2127971649169922, -0.2061920166015625, -0.1995868682861328, -0.19298171997070312, -0.18637657165527344, -0.17977142333984375, -0.17316627502441406, -0.16656112670898438, -0.1599559783935547, -0.153350830078125, -0.1467456817626953, -0.14014053344726562, -0.13353538513183594, -0.12693023681640625, -0.12032508850097656, -0.11371994018554688, -0.10711479187011719, -0.1005096435546875, -0.09390449523925781, -0.08729934692382812, -0.08069419860839844, -0.07408905029296875, -0.06748390197753906, -0.060878753662109375, -0.05427360534667969, -0.04766845703125, -0.04106330871582031, -0.034458160400390625, -0.027853012084960938, -0.02124786376953125, -0.014642715454101562, -0.008037567138671875, -0.0014324188232421875, 0.0051727294921875, 0.011777877807617188, 0.018383026123046875, 0.024988174438476562, 0.03159332275390625, 0.03819847106933594, 0.044803619384765625, 0.05140876770019531, 0.058013916015625, 0.06461906433105469, 0.07122421264648438, 0.07782936096191406, 0.08443450927734375, 0.09103965759277344, 0.09764480590820312, 0.10424995422363281, 0.1108551025390625, 0.11746025085449219, 0.12406539916992188, 0.13067054748535156, 0.13727569580078125, 0.14388084411621094, 0.15048599243164062, 0.1570911407470703, 0.1636962890625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 5.0, 4.0, 4.0, 9.0, 17.0, 25.0, 29.0, 49.0, 57.0, 78.0, 138.0, 257.0, 451.0, 757.0, 777.0, 536.0, 329.0, 185.0, 120.0, 68.0, 53.0, 35.0, 27.0, 21.0, 10.0, 4.0, 6.0, 5.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1484375, -0.14253616333007812, -0.13663482666015625, -0.13073348999023438, -0.1248321533203125, -0.11893081665039062, -0.11302947998046875, -0.10712814331054688, -0.101226806640625, -0.09532546997070312, -0.08942413330078125, -0.08352279663085938, -0.0776214599609375, -0.07172012329101562, -0.06581878662109375, -0.059917449951171875, -0.05401611328125, -0.048114776611328125, -0.04221343994140625, -0.036312103271484375, -0.0304107666015625, -0.024509429931640625, -0.01860809326171875, -0.012706756591796875, -0.006805419921875, -0.000904083251953125, 0.00499725341796875, 0.010898590087890625, 0.0167999267578125, 0.022701263427734375, 0.02860260009765625, 0.034503936767578125, 0.0404052734375, 0.046306610107421875, 0.05220794677734375, 0.058109283447265625, 0.0640106201171875, 0.06991195678710938, 0.07581329345703125, 0.08171463012695312, 0.087615966796875, 0.09351730346679688, 0.09941864013671875, 0.10531997680664062, 0.1112213134765625, 0.11712265014648438, 0.12302398681640625, 0.12892532348632812, 0.13482666015625, 0.14072799682617188, 0.14662933349609375, 0.15253067016601562, 0.1584320068359375, 0.16433334350585938, 0.17023468017578125, 0.17613601684570312, 0.182037353515625, 0.18793869018554688, 0.19384002685546875, 0.19974136352539062, 0.2056427001953125, 0.21154403686523438, 0.21744537353515625, 0.22334671020507812, 0.229248046875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 18.0, 73.0, 233.0, 371.0, 221.0, 46.0, 12.0, 5.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5941085815429688, -2.4825284481048584, -2.370948314666748, -2.2593679428100586, -2.1477878093719482, -2.036207675933838, -1.924627423286438, -1.813047170639038, -1.7014670372009277, -1.5898869037628174, -1.4783066511154175, -1.3667263984680176, -1.2551462650299072, -1.1435661315917969, -1.031985878944397, -0.9204056859016418, -0.8088254928588867, -0.6972452998161316, -0.5856651067733765, -0.47408491373062134, -0.3625047206878662, -0.2509245276451111, -0.13934433460235596, -0.02776414155960083, 0.0838160514831543, 0.19539624452590942, 0.30697643756866455, 0.4185566306114197, 0.5301368236541748, 0.6417170166969299, 0.7532972097396851, 0.8648774027824402, 0.9764575958251953, 1.0880377292633057, 1.1996179819107056, 1.3111982345581055, 1.4227783679962158, 1.5343585014343262, 1.645938754081726, 1.757519006729126, 1.8690991401672363, 1.9806792736053467, 2.092259407043457, 2.2038397789001465, 2.315419912338257, 2.427000045776367, 2.5385804176330566, 2.650160551071167, 2.7617406845092773, 2.8733208179473877, 2.984900951385498, 3.0964813232421875, 3.208061456680298, 3.319641590118408, 3.4312219619750977, 3.542802095413208, 3.6543822288513184, 3.7659623622894287, 3.877542495727539, 3.9891228675842285, 4.100703239440918, 4.212283134460449, 4.323863506317139, 4.43544340133667, 4.547023773193359]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 5.0, 7.0, 5.0, 6.0, 10.0, 12.0, 17.0, 14.0, 27.0, 21.0, 36.0, 24.0, 38.0, 35.0, 41.0, 39.0, 36.0, 42.0, 42.0, 38.0, 39.0, 41.0, 40.0, 61.0, 35.0, 38.0, 31.0, 35.0, 27.0, 27.0, 19.0, 20.0, 16.0, 8.0, 13.0, 10.0, 10.0, 3.0, 11.0, 6.0, 2.0, 1.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8110286593437195, -0.786143958568573, -0.7612591981887817, -0.7363744974136353, -0.711489737033844, -0.6866050362586975, -0.6617202758789062, -0.6368355751037598, -0.6119508743286133, -0.5870661735534668, -0.5621814131736755, -0.537296712398529, -0.5124119520187378, -0.4875272512435913, -0.46264252066612244, -0.43775779008865356, -0.4128730297088623, -0.38798829913139343, -0.36310356855392456, -0.3382188677787781, -0.3133341073989868, -0.28844940662384033, -0.26356467604637146, -0.2386799454689026, -0.21379521489143372, -0.18891048431396484, -0.16402575373649597, -0.1391410380601883, -0.11425630748271942, -0.08937157690525055, -0.06448686122894287, -0.039602130651474, -0.014717400074005127, 0.010167326778173447, 0.03505205363035202, 0.059936776757240295, 0.08482150733470917, 0.10970623791217804, 0.13459095358848572, 0.1594756841659546, 0.18436041474342346, 0.20924514532089233, 0.2341298758983612, 0.2590146064758301, 0.28389930725097656, 0.3087840676307678, 0.3336687684059143, 0.3585534989833832, 0.38343822956085205, 0.4083229601383209, 0.4332076907157898, 0.4580923914909363, 0.48297715187072754, 0.507861852645874, 0.5327465534210205, 0.5576313138008118, 0.582516074180603, 0.6074007749557495, 0.6322855353355408, 0.6571702361106873, 0.6820549964904785, 0.706939697265625, 0.7318243980407715, 0.7567091584205627, 0.7815938591957092]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 5.0, 4.0, 5.0, 4.0, 7.0, 6.0, 10.0, 30.0, 55.0, 49.0, 111.0, 170.0, 270.0, 450.0, 918.0, 1820.0, 4002.0, 9630.0, 25722.0, 74489.0, 237077.0, 432107.0, 172495.0, 55605.0, 19577.0, 7449.0, 3137.0, 1512.0, 789.0, 453.0, 216.0, 144.0, 99.0, 41.0, 34.0, 23.0, 18.0, 12.0, 6.0, 2.0, 1.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.092529296875, -0.08873176574707031, -0.08493423461914062, -0.08113670349121094, -0.07733917236328125, -0.07354164123535156, -0.06974411010742188, -0.06594657897949219, -0.0621490478515625, -0.05835151672363281, -0.054553985595703125, -0.05075645446777344, -0.04695892333984375, -0.04316139221191406, -0.039363861083984375, -0.03556632995605469, -0.031768798828125, -0.027971267700195312, -0.024173736572265625, -0.020376205444335938, -0.01657867431640625, -0.012781143188476562, -0.008983612060546875, -0.0051860809326171875, -0.0013885498046875, 0.0024089813232421875, 0.006206512451171875, 0.010004043579101562, 0.01380157470703125, 0.017599105834960938, 0.021396636962890625, 0.025194168090820312, 0.02899169921875, 0.03278923034667969, 0.036586761474609375, 0.04038429260253906, 0.04418182373046875, 0.04797935485839844, 0.051776885986328125, 0.05557441711425781, 0.0593719482421875, 0.06316947937011719, 0.06696701049804688, 0.07076454162597656, 0.07456207275390625, 0.07835960388183594, 0.08215713500976562, 0.08595466613769531, 0.089752197265625, 0.09354972839355469, 0.09734725952148438, 0.10114479064941406, 0.10494232177734375, 0.10873985290527344, 0.11253738403320312, 0.11633491516113281, 0.1201324462890625, 0.12392997741699219, 0.12772750854492188, 0.13152503967285156, 0.13532257080078125, 0.13912010192871094, 0.14291763305664062, 0.1467151641845703, 0.1505126953125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 6.0, 5.0, 6.0, 8.0, 14.0, 5.0, 20.0, 17.0, 21.0, 26.0, 24.0, 23.0, 32.0, 36.0, 38.0, 36.0, 47.0, 37.0, 49.0, 47.0, 48.0, 47.0, 45.0, 37.0, 43.0, 45.0, 35.0, 33.0, 28.0, 19.0, 28.0, 9.0, 19.0, 13.0, 12.0, 9.0, 8.0, 5.0, 6.0, 7.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041168212890625, -0.03974723815917969, -0.038326263427734375, -0.03690528869628906, -0.03548431396484375, -0.03406333923339844, -0.032642364501953125, -0.031221389770507812, -0.0298004150390625, -0.028379440307617188, -0.026958465576171875, -0.025537490844726562, -0.02411651611328125, -0.022695541381835938, -0.021274566650390625, -0.019853591918945312, -0.0184326171875, -0.017011642456054688, -0.015590667724609375, -0.014169692993164062, -0.01274871826171875, -0.011327743530273438, -0.009906768798828125, -0.008485794067382812, -0.0070648193359375, -0.0056438446044921875, -0.004222869873046875, -0.0028018951416015625, -0.00138092041015625, 4.00543212890625e-05, 0.001461029052734375, 0.0028820037841796875, 0.004302978515625, 0.0057239532470703125, 0.007144927978515625, 0.008565902709960938, 0.00998687744140625, 0.011407852172851562, 0.012828826904296875, 0.014249801635742188, 0.0156707763671875, 0.017091751098632812, 0.018512725830078125, 0.019933700561523438, 0.02135467529296875, 0.022775650024414062, 0.024196624755859375, 0.025617599487304688, 0.02703857421875, 0.028459548950195312, 0.029880523681640625, 0.03130149841308594, 0.03272247314453125, 0.03414344787597656, 0.035564422607421875, 0.03698539733886719, 0.0384063720703125, 0.03982734680175781, 0.041248321533203125, 0.04266929626464844, 0.04409027099609375, 0.04551124572753906, 0.046932220458984375, 0.04835319519042969, 0.049774169921875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 5.0, 3.0, 11.0, 10.0, 11.0, 16.0, 20.0, 18.0, 36.0, 46.0, 99.0, 143.0, 228.0, 398.0, 696.0, 1409.0, 2944.0, 8268.0, 38915.0, 585055.0, 364620.0, 32447.0, 7445.0, 2719.0, 1333.0, 673.0, 353.0, 213.0, 147.0, 90.0, 54.0, 36.0, 29.0, 30.0, 11.0, 8.0, 6.0, 3.0, 2.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.26611328125, -0.2580375671386719, -0.24996185302734375, -0.24188613891601562, -0.2338104248046875, -0.22573471069335938, -0.21765899658203125, -0.20958328247070312, -0.201507568359375, -0.19343185424804688, -0.18535614013671875, -0.17728042602539062, -0.1692047119140625, -0.16112899780273438, -0.15305328369140625, -0.14497756958007812, -0.13690185546875, -0.12882614135742188, -0.12075042724609375, -0.11267471313476562, -0.1045989990234375, -0.09652328491210938, -0.08844757080078125, -0.08037185668945312, -0.072296142578125, -0.06422042846679688, -0.05614471435546875, -0.048069000244140625, -0.0399932861328125, -0.031917572021484375, -0.02384185791015625, -0.015766143798828125, -0.0076904296875, 0.000385284423828125, 0.00846099853515625, 0.016536712646484375, 0.0246124267578125, 0.032688140869140625, 0.04076385498046875, 0.048839569091796875, 0.056915283203125, 0.06499099731445312, 0.07306671142578125, 0.08114242553710938, 0.0892181396484375, 0.09729385375976562, 0.10536956787109375, 0.11344528198242188, 0.12152099609375, 0.12959671020507812, 0.13767242431640625, 0.14574813842773438, 0.1538238525390625, 0.16189956665039062, 0.16997528076171875, 0.17805099487304688, 0.186126708984375, 0.19420242309570312, 0.20227813720703125, 0.21035385131835938, 0.2184295654296875, 0.22650527954101562, 0.23458099365234375, 0.24265670776367188, 0.250732421875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 0.0, 5.0, 3.0, 4.0, 6.0, 3.0, 6.0, 14.0, 7.0, 9.0, 13.0, 26.0, 29.0, 18.0, 25.0, 25.0, 38.0, 44.0, 41.0, 50.0, 49.0, 49.0, 46.0, 41.0, 33.0, 39.0, 53.0, 35.0, 45.0, 39.0, 21.0, 25.0, 31.0, 24.0, 17.0, 16.0, 16.0, 12.0, 11.0, 8.0, 6.0, 3.0, 4.0, 4.0, 1.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.2408447265625, -0.23380661010742188, -0.22676849365234375, -0.21973037719726562, -0.2126922607421875, -0.20565414428710938, -0.19861602783203125, -0.19157791137695312, -0.184539794921875, -0.17750167846679688, -0.17046356201171875, -0.16342544555664062, -0.1563873291015625, -0.14934921264648438, -0.14231109619140625, -0.13527297973632812, -0.12823486328125, -0.12119674682617188, -0.11415863037109375, -0.10712051391601562, -0.1000823974609375, -0.09304428100585938, -0.08600616455078125, -0.07896804809570312, -0.071929931640625, -0.06489181518554688, -0.05785369873046875, -0.050815582275390625, -0.0437774658203125, -0.036739349365234375, -0.02970123291015625, -0.022663116455078125, -0.015625, -0.008586883544921875, -0.00154876708984375, 0.005489349365234375, 0.0125274658203125, 0.019565582275390625, 0.02660369873046875, 0.033641815185546875, 0.040679931640625, 0.047718048095703125, 0.05475616455078125, 0.061794281005859375, 0.0688323974609375, 0.07587051391601562, 0.08290863037109375, 0.08994674682617188, 0.09698486328125, 0.10402297973632812, 0.11106109619140625, 0.11809921264648438, 0.1251373291015625, 0.13217544555664062, 0.13921356201171875, 0.14625167846679688, 0.153289794921875, 0.16032791137695312, 0.16736602783203125, 0.17440414428710938, 0.1814422607421875, 0.18848037719726562, 0.19551849365234375, 0.20255661010742188, 0.2095947265625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 7.0, 8.0, 11.0, 17.0, 14.0, 24.0, 32.0, 43.0, 75.0, 113.0, 177.0, 279.0, 509.0, 901.0, 1921.0, 4802.0, 14279.0, 54922.0, 266332.0, 577379.0, 92350.0, 22243.0, 6843.0, 2650.0, 1161.0, 556.0, 332.0, 209.0, 94.0, 78.0, 58.0, 37.0, 28.0, 23.0, 12.0, 9.0, 8.0, 11.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.06561279296875, -0.0635080337524414, -0.06140327453613281, -0.05929851531982422, -0.057193756103515625, -0.05508899688720703, -0.05298423767089844, -0.050879478454589844, -0.04877471923828125, -0.046669960021972656, -0.04456520080566406, -0.04246044158935547, -0.040355682373046875, -0.03825092315673828, -0.03614616394042969, -0.034041404724121094, -0.0319366455078125, -0.029831886291503906, -0.027727127075195312, -0.02562236785888672, -0.023517608642578125, -0.02141284942626953, -0.019308090209960938, -0.017203330993652344, -0.01509857177734375, -0.012993812561035156, -0.010889053344726562, -0.008784294128417969, -0.006679534912109375, -0.004574775695800781, -0.0024700164794921875, -0.00036525726318359375, 0.001739501953125, 0.0038442611694335938, 0.0059490203857421875, 0.008053779602050781, 0.010158538818359375, 0.012263298034667969, 0.014368057250976562, 0.016472816467285156, 0.01857757568359375, 0.020682334899902344, 0.022787094116210938, 0.02489185333251953, 0.026996612548828125, 0.02910137176513672, 0.031206130981445312, 0.033310890197753906, 0.0354156494140625, 0.037520408630371094, 0.03962516784667969, 0.04172992706298828, 0.043834686279296875, 0.04593944549560547, 0.04804420471191406, 0.050148963928222656, 0.05225372314453125, 0.054358482360839844, 0.05646324157714844, 0.05856800079345703, 0.060672760009765625, 0.06277751922607422, 0.06488227844238281, 0.0669870376586914, 0.069091796875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 3.0, 5.0, 4.0, 8.0, 2.0, 12.0, 11.0, 16.0, 16.0, 20.0, 14.0, 19.0, 18.0, 25.0, 37.0, 32.0, 41.0, 69.0, 65.0, 63.0, 60.0, 68.0, 64.0, 52.0, 37.0, 32.0, 30.0, 27.0, 16.0, 14.0, 16.0, 20.0, 11.0, 11.0, 13.0, 9.0, 8.0, 8.0, 6.0, 6.0, 1.0, 4.0, 5.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-2.2530555725097656e-05, -2.1889805793762207e-05, -2.1249055862426758e-05, -2.060830593109131e-05, -1.996755599975586e-05, -1.932680606842041e-05, -1.868605613708496e-05, -1.8045306205749512e-05, -1.7404556274414062e-05, -1.6763806343078613e-05, -1.6123056411743164e-05, -1.5482306480407715e-05, -1.4841556549072266e-05, -1.4200806617736816e-05, -1.3560056686401367e-05, -1.2919306755065918e-05, -1.2278556823730469e-05, -1.163780689239502e-05, -1.099705696105957e-05, -1.0356307029724121e-05, -9.715557098388672e-06, -9.074807167053223e-06, -8.434057235717773e-06, -7.793307304382324e-06, -7.152557373046875e-06, -6.511807441711426e-06, -5.8710575103759766e-06, -5.230307579040527e-06, -4.589557647705078e-06, -3.948807716369629e-06, -3.3080577850341797e-06, -2.6673078536987305e-06, -2.0265579223632812e-06, -1.385807991027832e-06, -7.450580596923828e-07, -1.043081283569336e-07, 5.364418029785156e-07, 1.1771917343139648e-06, 1.817941665649414e-06, 2.4586915969848633e-06, 3.0994415283203125e-06, 3.7401914596557617e-06, 4.380941390991211e-06, 5.02169132232666e-06, 5.662441253662109e-06, 6.303191184997559e-06, 6.943941116333008e-06, 7.584691047668457e-06, 8.225440979003906e-06, 8.866190910339355e-06, 9.506940841674805e-06, 1.0147690773010254e-05, 1.0788440704345703e-05, 1.1429190635681152e-05, 1.2069940567016602e-05, 1.271069049835205e-05, 1.33514404296875e-05, 1.399219036102295e-05, 1.4632940292358398e-05, 1.5273690223693848e-05, 1.5914440155029297e-05, 1.6555190086364746e-05, 1.7195940017700195e-05, 1.7836689949035645e-05, 1.8477439880371094e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 6.0, 5.0, 11.0, 15.0, 29.0, 38.0, 34.0, 67.0, 109.0, 207.0, 380.0, 705.0, 1419.0, 3426.0, 10798.0, 55975.0, 595272.0, 327032.0, 39186.0, 8195.0, 2898.0, 1265.0, 646.0, 332.0, 184.0, 100.0, 82.0, 48.0, 21.0, 16.0, 12.0, 9.0, 8.0, 3.0, 5.0, 7.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.09576416015625, -0.09323787689208984, -0.09071159362792969, -0.08818531036376953, -0.08565902709960938, -0.08313274383544922, -0.08060646057128906, -0.0780801773071289, -0.07555389404296875, -0.0730276107788086, -0.07050132751464844, -0.06797504425048828, -0.06544876098632812, -0.06292247772216797, -0.06039619445800781, -0.057869911193847656, -0.0553436279296875, -0.052817344665527344, -0.05029106140136719, -0.04776477813720703, -0.045238494873046875, -0.04271221160888672, -0.04018592834472656, -0.037659645080566406, -0.03513336181640625, -0.032607078552246094, -0.030080795288085938, -0.02755451202392578, -0.025028228759765625, -0.02250194549560547, -0.019975662231445312, -0.017449378967285156, -0.014923095703125, -0.012396812438964844, -0.009870529174804688, -0.007344245910644531, -0.004817962646484375, -0.0022916793823242188, 0.0002346038818359375, 0.0027608871459960938, 0.00528717041015625, 0.007813453674316406, 0.010339736938476562, 0.012866020202636719, 0.015392303466796875, 0.01791858673095703, 0.020444869995117188, 0.022971153259277344, 0.0254974365234375, 0.028023719787597656, 0.030550003051757812, 0.03307628631591797, 0.035602569580078125, 0.03812885284423828, 0.04065513610839844, 0.043181419372558594, 0.04570770263671875, 0.048233985900878906, 0.05076026916503906, 0.05328655242919922, 0.055812835693359375, 0.05833911895751953, 0.06086540222167969, 0.06339168548583984, 0.06591796875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 8.0, 7.0, 11.0, 9.0, 15.0, 9.0, 18.0, 12.0, 16.0, 19.0, 29.0, 17.0, 40.0, 36.0, 39.0, 43.0, 54.0, 55.0, 58.0, 52.0, 45.0, 54.0, 46.0, 43.0, 32.0, 38.0, 22.0, 31.0, 17.0, 21.0, 17.0, 20.0, 14.0, 7.0, 12.0, 3.0, 5.0, 5.0, 7.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.0560302734375, -0.05443000793457031, -0.052829742431640625, -0.05122947692871094, -0.04962921142578125, -0.04802894592285156, -0.046428680419921875, -0.04482841491699219, -0.0432281494140625, -0.04162788391113281, -0.040027618408203125, -0.03842735290527344, -0.03682708740234375, -0.03522682189941406, -0.033626556396484375, -0.03202629089355469, -0.030426025390625, -0.028825759887695312, -0.027225494384765625, -0.025625228881835938, -0.02402496337890625, -0.022424697875976562, -0.020824432373046875, -0.019224166870117188, -0.0176239013671875, -0.016023635864257812, -0.014423370361328125, -0.012823104858398438, -0.01122283935546875, -0.009622573852539062, -0.008022308349609375, -0.0064220428466796875, -0.00482177734375, -0.0032215118408203125, -0.001621246337890625, -2.09808349609375e-05, 0.00157928466796875, 0.0031795501708984375, 0.004779815673828125, 0.0063800811767578125, 0.0079803466796875, 0.009580612182617188, 0.011180877685546875, 0.012781143188476562, 0.01438140869140625, 0.015981674194335938, 0.017581939697265625, 0.019182205200195312, 0.020782470703125, 0.022382736206054688, 0.023983001708984375, 0.025583267211914062, 0.02718353271484375, 0.028783798217773438, 0.030384063720703125, 0.03198432922363281, 0.0335845947265625, 0.03518486022949219, 0.036785125732421875, 0.03838539123535156, 0.03998565673828125, 0.04158592224121094, 0.043186187744140625, 0.04478645324707031, 0.04638671875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 13.0, 21.0, 23.0, 34.0, 68.0, 100.0, 162.0, 202.0, 139.0, 92.0, 57.0, 32.0, 12.0, 16.0, 10.0, 6.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.1225615739822388, -1.0796549320220947, -1.0367484092712402, -0.9938417673110962, -0.9509351253509521, -0.9080285429954529, -0.8651219606399536, -0.8222153186798096, -0.7793087363243103, -0.736402153968811, -0.693495512008667, -0.6505889296531677, -0.6076823472976685, -0.5647757053375244, -0.5218691229820251, -0.4789625108242035, -0.43605589866638184, -0.3931492865085602, -0.3502426743507385, -0.30733609199523926, -0.2644294798374176, -0.22152286767959595, -0.17861628532409668, -0.13570967316627502, -0.09280306100845337, -0.04989645630121231, -0.0069898515939712524, 0.03591674566268921, 0.07882335782051086, 0.12172996997833252, 0.1646365523338318, 0.20754316449165344, 0.25044965744018555, 0.2933562695980072, 0.33626288175582886, 0.3791694641113281, 0.4220760762691498, 0.46498268842697144, 0.5078892707824707, 0.5507959127426147, 0.593702495098114, 0.6366090774536133, 0.6795157194137573, 0.7224223017692566, 0.7653288841247559, 0.8082355260848999, 0.8511421084403992, 0.8940486907958984, 0.9369553327560425, 0.9798619151115417, 1.022768497467041, 1.065675139427185, 1.108581781387329, 1.1514883041381836, 1.1943949460983276, 1.2373015880584717, 1.2802081108093262, 1.3231147527694702, 1.3660212755203247, 1.4089279174804688, 1.4518345594406128, 1.4947412014007568, 1.5376477241516113, 1.5805543661117554, 1.6234610080718994]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 4.0, 0.0, 5.0, 1.0, 5.0, 5.0, 6.0, 8.0, 9.0, 6.0, 17.0, 13.0, 23.0, 18.0, 28.0, 27.0, 34.0, 42.0, 33.0, 42.0, 34.0, 65.0, 81.0, 57.0, 53.0, 55.0, 68.0, 36.0, 31.0, 32.0, 26.0, 15.0, 24.0, 12.0, 9.0, 14.0, 18.0, 14.0, 10.0, 3.0, 8.0, 7.0, 2.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-1.043489694595337, -1.0154638290405273, -0.9874380230903625, -0.9594122171401978, -0.931386411190033, -0.9033605456352234, -0.8753347396850586, -0.847308874130249, -0.8192830681800842, -0.7912572622299194, -0.7632313966751099, -0.7352055907249451, -0.7071797847747803, -0.6791539192199707, -0.6511281132698059, -0.6231023073196411, -0.5950764417648315, -0.5670506358146667, -0.5390247702598572, -0.5109989643096924, -0.4829731285572052, -0.454947292804718, -0.4269214868545532, -0.39889565110206604, -0.37086987495422363, -0.34284403920173645, -0.31481823325157166, -0.2867923974990845, -0.2587665617465973, -0.2307407408952713, -0.2027149200439453, -0.17468908429145813, -0.14666324853897095, -0.11863742023706436, -0.09061159193515778, -0.06258577108383179, -0.0345599427819252, -0.006534114480018616, 0.021491706371307373, 0.049517542123794556, 0.07754336297512054, 0.10556919127702713, 0.13359501957893372, 0.1616208404302597, 0.1896466612815857, 0.21767249703407288, 0.24569831788539886, 0.27372413873672485, 0.30174997448921204, 0.3297758102416992, 0.357801616191864, 0.3858274519443512, 0.4138532876968384, 0.4418790936470032, 0.46990492939949036, 0.49793076515197754, 0.5259565711021423, 0.5539823770523071, 0.5820082426071167, 0.6100340485572815, 0.6380598545074463, 0.6660857200622559, 0.6941115260124207, 0.7221373319625854, 0.750163197517395]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 8.0, 9.0, 21.0, 21.0, 44.0, 66.0, 116.0, 201.0, 413.0, 682.0, 1434.0, 2974.0, 6862.0, 16718.0, 49970.0, 197669.0, 1165404.0, 2159560.0, 452591.0, 93452.0, 27585.0, 9997.0, 4314.0, 1965.0, 1010.0, 513.0, 260.0, 163.0, 104.0, 66.0, 33.0, 13.0, 13.0, 9.0, 7.0, 9.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06207275390625, -0.05994987487792969, -0.057826995849609375, -0.05570411682128906, -0.05358123779296875, -0.05145835876464844, -0.049335479736328125, -0.04721260070800781, -0.0450897216796875, -0.04296684265136719, -0.040843963623046875, -0.03872108459472656, -0.03659820556640625, -0.03447532653808594, -0.032352447509765625, -0.030229568481445312, -0.028106689453125, -0.025983810424804688, -0.023860931396484375, -0.021738052368164062, -0.01961517333984375, -0.017492294311523438, -0.015369415283203125, -0.013246536254882812, -0.0111236572265625, -0.009000778198242188, -0.006877899169921875, -0.0047550201416015625, -0.00263214111328125, -0.0005092620849609375, 0.001613616943359375, 0.0037364959716796875, 0.005859375, 0.007982254028320312, 0.010105133056640625, 0.012228012084960938, 0.01435089111328125, 0.016473770141601562, 0.018596649169921875, 0.020719528198242188, 0.0228424072265625, 0.024965286254882812, 0.027088165283203125, 0.029211044311523438, 0.03133392333984375, 0.03345680236816406, 0.035579681396484375, 0.03770256042480469, 0.039825439453125, 0.04194831848144531, 0.044071197509765625, 0.04619407653808594, 0.04831695556640625, 0.05043983459472656, 0.052562713623046875, 0.05468559265136719, 0.0568084716796875, 0.05893135070800781, 0.061054229736328125, 0.06317710876464844, 0.06529998779296875, 0.06742286682128906, 0.06954574584960938, 0.07166862487792969, 0.07379150390625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 4.0, 9.0, 8.0, 14.0, 13.0, 16.0, 15.0, 17.0, 30.0, 27.0, 27.0, 30.0, 40.0, 52.0, 49.0, 37.0, 38.0, 62.0, 51.0, 49.0, 49.0, 40.0, 49.0, 43.0, 37.0, 45.0, 24.0, 26.0, 27.0, 18.0, 10.0, 13.0, 3.0, 8.0, 4.0, 4.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.047515869140625, -0.04597282409667969, -0.044429779052734375, -0.04288673400878906, -0.04134368896484375, -0.03980064392089844, -0.038257598876953125, -0.03671455383300781, -0.0351715087890625, -0.03362846374511719, -0.032085418701171875, -0.030542373657226562, -0.02899932861328125, -0.027456283569335938, -0.025913238525390625, -0.024370193481445312, -0.0228271484375, -0.021284103393554688, -0.019741058349609375, -0.018198013305664062, -0.01665496826171875, -0.015111923217773438, -0.013568878173828125, -0.012025833129882812, -0.0104827880859375, -0.008939743041992188, -0.007396697998046875, -0.0058536529541015625, -0.00431060791015625, -0.0027675628662109375, -0.001224517822265625, 0.0003185272216796875, 0.001861572265625, 0.0034046173095703125, 0.004947662353515625, 0.0064907073974609375, 0.00803375244140625, 0.009576797485351562, 0.011119842529296875, 0.012662887573242188, 0.0142059326171875, 0.015748977661132812, 0.017292022705078125, 0.018835067749023438, 0.02037811279296875, 0.021921157836914062, 0.023464202880859375, 0.025007247924804688, 0.02655029296875, 0.028093338012695312, 0.029636383056640625, 0.031179428100585938, 0.03272247314453125, 0.03426551818847656, 0.035808563232421875, 0.03735160827636719, 0.0388946533203125, 0.04043769836425781, 0.041980743408203125, 0.04352378845214844, 0.04506683349609375, 0.04660987854003906, 0.048152923583984375, 0.04969596862792969, 0.051239013671875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 6.0, 4.0, 4.0, 7.0, 7.0, 16.0, 18.0, 12.0, 56.0, 65.0, 79.0, 167.0, 266.0, 446.0, 929.0, 2264.0, 6368.0, 19486.0, 84292.0, 737673.0, 2976954.0, 295493.0, 48915.0, 13119.0, 4420.0, 1628.0, 662.0, 357.0, 204.0, 113.0, 87.0, 55.0, 30.0, 22.0, 16.0, 8.0, 9.0, 8.0, 5.0, 1.0, 7.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1156005859375, -0.11165809631347656, -0.10771560668945312, -0.10377311706542969, -0.09983062744140625, -0.09588813781738281, -0.09194564819335938, -0.08800315856933594, -0.0840606689453125, -0.08011817932128906, -0.07617568969726562, -0.07223320007324219, -0.06829071044921875, -0.06434822082519531, -0.060405731201171875, -0.05646324157714844, -0.052520751953125, -0.04857826232910156, -0.044635772705078125, -0.04069328308105469, -0.03675079345703125, -0.03280830383300781, -0.028865814208984375, -0.024923324584960938, -0.0209808349609375, -0.017038345336914062, -0.013095855712890625, -0.009153366088867188, -0.00521087646484375, -0.0012683868408203125, 0.002674102783203125, 0.0066165924072265625, 0.01055908203125, 0.014501571655273438, 0.018444061279296875, 0.022386550903320312, 0.02632904052734375, 0.030271530151367188, 0.034214019775390625, 0.03815650939941406, 0.0420989990234375, 0.04604148864746094, 0.049983978271484375, 0.05392646789550781, 0.05786895751953125, 0.06181144714355469, 0.06575393676757812, 0.06969642639160156, 0.073638916015625, 0.07758140563964844, 0.08152389526367188, 0.08546638488769531, 0.08940887451171875, 0.09335136413574219, 0.09729385375976562, 0.10123634338378906, 0.1051788330078125, 0.10912132263183594, 0.11306381225585938, 0.11700630187988281, 0.12094879150390625, 0.12489128112792969, 0.12883377075195312, 0.13277626037597656, 0.13671875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 3.0, 1.0, 3.0, 5.0, 8.0, 5.0, 10.0, 9.0, 8.0, 15.0, 17.0, 18.0, 38.0, 46.0, 45.0, 55.0, 69.0, 118.0, 158.0, 203.0, 276.0, 430.0, 522.0, 493.0, 372.0, 287.0, 229.0, 143.0, 123.0, 76.0, 69.0, 47.0, 28.0, 30.0, 25.0, 16.0, 11.0, 9.0, 5.0, 1.0, 14.0, 6.0, 8.0, 8.0, 4.0, 0.0, 3.0, 2.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.092529296875, -0.08933639526367188, -0.08614349365234375, -0.08295059204101562, -0.0797576904296875, -0.07656478881835938, -0.07337188720703125, -0.07017898559570312, -0.066986083984375, -0.06379318237304688, -0.06060028076171875, -0.057407379150390625, -0.0542144775390625, -0.051021575927734375, -0.04782867431640625, -0.044635772705078125, -0.04144287109375, -0.038249969482421875, -0.03505706787109375, -0.031864166259765625, -0.0286712646484375, -0.025478363037109375, -0.02228546142578125, -0.019092559814453125, -0.015899658203125, -0.012706756591796875, -0.00951385498046875, -0.006320953369140625, -0.0031280517578125, 6.4849853515625e-05, 0.00325775146484375, 0.006450653076171875, 0.0096435546875, 0.012836456298828125, 0.01602935791015625, 0.019222259521484375, 0.0224151611328125, 0.025608062744140625, 0.02880096435546875, 0.031993865966796875, 0.035186767578125, 0.038379669189453125, 0.04157257080078125, 0.044765472412109375, 0.0479583740234375, 0.051151275634765625, 0.05434417724609375, 0.057537078857421875, 0.06072998046875, 0.06392288208007812, 0.06711578369140625, 0.07030868530273438, 0.0735015869140625, 0.07669448852539062, 0.07988739013671875, 0.08308029174804688, 0.086273193359375, 0.08946609497070312, 0.09265899658203125, 0.09585189819335938, 0.0990447998046875, 0.10223770141601562, 0.10543060302734375, 0.10862350463867188, 0.11181640625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 6.0, 12.0, 25.0, 80.0, 164.0, 280.0, 219.0, 116.0, 51.0, 20.0, 9.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4146473407745361, -1.3522950410842896, -1.289942741394043, -1.2275904417037964, -1.1652381420135498, -1.1028858423233032, -1.0405335426330566, -0.9781813025474548, -0.9158290028572083, -0.8534767031669617, -0.7911244034767151, -0.7287721633911133, -0.6664198637008667, -0.6040675640106201, -0.5417152643203735, -0.47936296463012695, -0.41701066493988037, -0.3546583652496338, -0.2923060655593872, -0.229953795671463, -0.16760149598121643, -0.10524919629096985, -0.042896926403045654, 0.019455373287200928, 0.08180767297744751, 0.1441599726676941, 0.20651225745677948, 0.26886454224586487, 0.33121684193611145, 0.39356914162635803, 0.4559214115142822, 0.5182737112045288, 0.5806260108947754, 0.642978310585022, 0.7053306102752686, 0.7676829099655151, 0.8300352096557617, 0.8923875093460083, 0.9547397494316101, 1.017091989517212, 1.079444408416748, 1.1417967081069946, 1.2041490077972412, 1.2665013074874878, 1.3288536071777344, 1.391205906867981, 1.4535582065582275, 1.5159103870391846, 1.5782626867294312, 1.6406149864196777, 1.7029672861099243, 1.765319585800171, 1.8276718854904175, 1.890024185180664, 1.952376365661621, 2.0147287845611572, 2.0770809650421143, 2.1394331455230713, 2.2017855644226074, 2.2641377449035645, 2.3264901638031006, 2.3888423442840576, 2.4511947631835938, 2.513546943664551, 2.575899362564087]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 2.0, 8.0, 9.0, 12.0, 9.0, 10.0, 15.0, 19.0, 26.0, 20.0, 29.0, 25.0, 39.0, 35.0, 46.0, 47.0, 50.0, 50.0, 39.0, 57.0, 63.0, 48.0, 50.0, 37.0, 28.0, 30.0, 31.0, 33.0, 26.0, 22.0, 16.0, 14.0, 12.0, 9.0, 5.0, 9.0, 9.0, 6.0, 3.0, 1.0, 1.0, 2.0, 5.0, 1.0], "bins": [-0.7618774771690369, -0.7423037886619568, -0.7227301597595215, -0.7031564712524414, -0.6835827827453613, -0.6640090942382812, -0.6444354057312012, -0.6248617768287659, -0.6052880883216858, -0.5857143998146057, -0.5661407709121704, -0.5465670824050903, -0.5269933938980103, -0.5074197053909302, -0.4878460466861725, -0.4682723879814148, -0.4486986994743347, -0.42912501096725464, -0.40955135226249695, -0.38997769355773926, -0.3704040050506592, -0.3508303165435791, -0.3312566578388214, -0.3116829991340637, -0.29210931062698364, -0.27253562211990356, -0.2529619634151459, -0.233388289809227, -0.2138146162033081, -0.19424094259738922, -0.17466726899147034, -0.15509359538555145, -0.13551992177963257, -0.11594624817371368, -0.0963725745677948, -0.07679890096187592, -0.05722522735595703, -0.03765155375003815, -0.018077880144119263, 0.0014957934617996216, 0.021069467067718506, 0.04064314067363739, 0.060216814279556274, 0.07979048788547516, 0.09936416149139404, 0.11893783509731293, 0.1385115087032318, 0.1580851823091507, 0.17765885591506958, 0.19723252952098846, 0.21680620312690735, 0.23637987673282623, 0.2559535503387451, 0.2755272388458252, 0.2951008975505829, 0.3146745562553406, 0.33424824476242065, 0.35382193326950073, 0.3733955919742584, 0.3929692506790161, 0.4125429391860962, 0.43211662769317627, 0.45169028639793396, 0.47126394510269165, 0.49083763360977173]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 6.0, 7.0, 22.0, 15.0, 46.0, 50.0, 104.0, 193.0, 331.0, 685.0, 1342.0, 2837.0, 6480.0, 18029.0, 60192.0, 262146.0, 509846.0, 131878.0, 34696.0, 11213.0, 4406.0, 1966.0, 952.0, 502.0, 255.0, 135.0, 87.0, 52.0, 32.0, 27.0, 10.0, 5.0, 6.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1378173828125, -0.13341140747070312, -0.12900543212890625, -0.12459945678710938, -0.1201934814453125, -0.11578750610351562, -0.11138153076171875, -0.10697555541992188, -0.102569580078125, -0.09816360473632812, -0.09375762939453125, -0.08935165405273438, -0.0849456787109375, -0.08053970336914062, -0.07613372802734375, -0.07172775268554688, -0.06732177734375, -0.06291580200195312, -0.05850982666015625, -0.054103851318359375, -0.0496978759765625, -0.045291900634765625, -0.04088592529296875, -0.036479949951171875, -0.032073974609375, -0.027667999267578125, -0.02326202392578125, -0.018856048583984375, -0.0144500732421875, -0.010044097900390625, -0.00563812255859375, -0.001232147216796875, 0.003173828125, 0.007579803466796875, 0.01198577880859375, 0.016391754150390625, 0.0207977294921875, 0.025203704833984375, 0.02960968017578125, 0.034015655517578125, 0.038421630859375, 0.042827606201171875, 0.04723358154296875, 0.051639556884765625, 0.0560455322265625, 0.060451507568359375, 0.06485748291015625, 0.06926345825195312, 0.07366943359375, 0.07807540893554688, 0.08248138427734375, 0.08688735961914062, 0.0912933349609375, 0.09569931030273438, 0.10010528564453125, 0.10451126098632812, 0.108917236328125, 0.11332321166992188, 0.11772918701171875, 0.12213516235351562, 0.1265411376953125, 0.13094711303710938, 0.13535308837890625, 0.13975906372070312, 0.1441650390625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 7.0, 4.0, 7.0, 11.0, 5.0, 5.0, 11.0, 14.0, 22.0, 14.0, 22.0, 21.0, 46.0, 53.0, 38.0, 32.0, 46.0, 45.0, 55.0, 52.0, 55.0, 55.0, 38.0, 44.0, 47.0, 27.0, 43.0, 38.0, 36.0, 27.0, 17.0, 16.0, 13.0, 8.0, 10.0, 9.0, 1.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.05877685546875, -0.05713605880737305, -0.055495262145996094, -0.05385446548461914, -0.05221366882324219, -0.050572872161865234, -0.04893207550048828, -0.04729127883911133, -0.045650482177734375, -0.04400968551635742, -0.04236888885498047, -0.040728092193603516, -0.03908729553222656, -0.03744649887084961, -0.035805702209472656, -0.0341649055480957, -0.03252410888671875, -0.030883312225341797, -0.029242515563964844, -0.02760171890258789, -0.025960922241210938, -0.024320125579833984, -0.02267932891845703, -0.021038532257080078, -0.019397735595703125, -0.017756938934326172, -0.01611614227294922, -0.014475345611572266, -0.012834548950195312, -0.01119375228881836, -0.009552955627441406, -0.007912158966064453, -0.0062713623046875, -0.004630565643310547, -0.0029897689819335938, -0.0013489723205566406, 0.0002918243408203125, 0.0019326210021972656, 0.0035734176635742188, 0.005214214324951172, 0.006855010986328125, 0.008495807647705078, 0.010136604309082031, 0.011777400970458984, 0.013418197631835938, 0.01505899429321289, 0.016699790954589844, 0.018340587615966797, 0.01998138427734375, 0.021622180938720703, 0.023262977600097656, 0.02490377426147461, 0.026544570922851562, 0.028185367584228516, 0.02982616424560547, 0.03146696090698242, 0.033107757568359375, 0.03474855422973633, 0.03638935089111328, 0.038030147552490234, 0.03967094421386719, 0.04131174087524414, 0.042952537536621094, 0.04459333419799805, 0.046234130859375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 4.0, 9.0, 8.0, 12.0, 32.0, 43.0, 69.0, 118.0, 199.0, 414.0, 899.0, 2139.0, 7842.0, 60659.0, 844909.0, 114862.0, 11475.0, 2777.0, 1020.0, 455.0, 272.0, 124.0, 69.0, 45.0, 43.0, 16.0, 16.0, 11.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.249755859375, -0.24071121215820312, -0.23166656494140625, -0.22262191772460938, -0.2135772705078125, -0.20453262329101562, -0.19548797607421875, -0.18644332885742188, -0.177398681640625, -0.16835403442382812, -0.15930938720703125, -0.15026473999023438, -0.1412200927734375, -0.13217544555664062, -0.12313079833984375, -0.11408615112304688, -0.10504150390625, -0.09599685668945312, -0.08695220947265625, -0.07790756225585938, -0.0688629150390625, -0.059818267822265625, -0.05077362060546875, -0.041728973388671875, -0.032684326171875, -0.023639678955078125, -0.01459503173828125, -0.005550384521484375, 0.0034942626953125, 0.012538909912109375, 0.02158355712890625, 0.030628204345703125, 0.0396728515625, 0.048717498779296875, 0.05776214599609375, 0.06680679321289062, 0.0758514404296875, 0.08489608764648438, 0.09394073486328125, 0.10298538208007812, 0.112030029296875, 0.12107467651367188, 0.13011932373046875, 0.13916397094726562, 0.1482086181640625, 0.15725326538085938, 0.16629791259765625, 0.17534255981445312, 0.18438720703125, 0.19343185424804688, 0.20247650146484375, 0.21152114868164062, 0.2205657958984375, 0.22961044311523438, 0.23865509033203125, 0.24769973754882812, 0.256744384765625, 0.2657890319824219, 0.27483367919921875, 0.2838783264160156, 0.2929229736328125, 0.3019676208496094, 0.31101226806640625, 0.3200569152832031, 0.3291015625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 6.0, 5.0, 6.0, 7.0, 4.0, 9.0, 6.0, 10.0, 12.0, 14.0, 14.0, 18.0, 15.0, 20.0, 28.0, 27.0, 30.0, 35.0, 53.0, 28.0, 33.0, 38.0, 41.0, 35.0, 47.0, 47.0, 42.0, 42.0, 45.0, 39.0, 36.0, 26.0, 29.0, 18.0, 18.0, 14.0, 19.0, 12.0, 19.0, 9.0, 6.0, 9.0, 7.0, 3.0, 4.0, 4.0, 4.0, 3.0, 2.0, 5.0, 6.0, 2.0, 1.0, 1.0], "bins": [-0.1964111328125, -0.1906261444091797, -0.18484115600585938, -0.17905616760253906, -0.17327117919921875, -0.16748619079589844, -0.16170120239257812, -0.1559162139892578, -0.1501312255859375, -0.1443462371826172, -0.13856124877929688, -0.13277626037597656, -0.12699127197265625, -0.12120628356933594, -0.11542129516601562, -0.10963630676269531, -0.103851318359375, -0.09806632995605469, -0.09228134155273438, -0.08649635314941406, -0.08071136474609375, -0.07492637634277344, -0.06914138793945312, -0.06335639953613281, -0.0575714111328125, -0.05178642272949219, -0.046001434326171875, -0.04021644592285156, -0.03443145751953125, -0.028646469116210938, -0.022861480712890625, -0.017076492309570312, -0.01129150390625, -0.0055065155029296875, 0.000278472900390625, 0.0060634613037109375, 0.01184844970703125, 0.017633438110351562, 0.023418426513671875, 0.029203414916992188, 0.0349884033203125, 0.04077339172363281, 0.046558380126953125, 0.05234336853027344, 0.05812835693359375, 0.06391334533691406, 0.06969833374023438, 0.07548332214355469, 0.081268310546875, 0.08705329895019531, 0.09283828735351562, 0.09862327575683594, 0.10440826416015625, 0.11019325256347656, 0.11597824096679688, 0.12176322937011719, 0.1275482177734375, 0.1333332061767578, 0.13911819458007812, 0.14490318298339844, 0.15068817138671875, 0.15647315979003906, 0.16225814819335938, 0.1680431365966797, 0.173828125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 2.0, 2.0, 11.0, 8.0, 7.0, 7.0, 17.0, 29.0, 28.0, 53.0, 74.0, 89.0, 124.0, 216.0, 343.0, 560.0, 995.0, 1900.0, 4238.0, 10173.0, 30744.0, 111268.0, 556172.0, 240850.0, 59850.0, 17958.0, 6593.0, 2858.0, 1387.0, 776.0, 409.0, 267.0, 168.0, 105.0, 70.0, 63.0, 37.0, 22.0, 22.0, 12.0, 12.0, 14.0, 6.0, 5.0, 6.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.052337646484375, -0.05057954788208008, -0.048821449279785156, -0.047063350677490234, -0.04530525207519531, -0.04354715347290039, -0.04178905487060547, -0.04003095626831055, -0.038272857666015625, -0.0365147590637207, -0.03475666046142578, -0.03299856185913086, -0.031240463256835938, -0.029482364654541016, -0.027724266052246094, -0.025966167449951172, -0.02420806884765625, -0.022449970245361328, -0.020691871643066406, -0.018933773040771484, -0.017175674438476562, -0.01541757583618164, -0.013659477233886719, -0.011901378631591797, -0.010143280029296875, -0.008385181427001953, -0.006627082824707031, -0.004868984222412109, -0.0031108856201171875, -0.0013527870178222656, 0.00040531158447265625, 0.002163410186767578, 0.0039215087890625, 0.005679607391357422, 0.007437705993652344, 0.009195804595947266, 0.010953903198242188, 0.01271200180053711, 0.014470100402832031, 0.016228199005126953, 0.017986297607421875, 0.019744396209716797, 0.02150249481201172, 0.02326059341430664, 0.025018692016601562, 0.026776790618896484, 0.028534889221191406, 0.030292987823486328, 0.03205108642578125, 0.03380918502807617, 0.035567283630371094, 0.037325382232666016, 0.03908348083496094, 0.04084157943725586, 0.04259967803955078, 0.0443577766418457, 0.046115875244140625, 0.04787397384643555, 0.04963207244873047, 0.05139017105102539, 0.05314826965332031, 0.054906368255615234, 0.056664466857910156, 0.05842256546020508, 0.0601806640625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 5.0, 2.0, 2.0, 4.0, 5.0, 2.0, 8.0, 8.0, 12.0, 14.0, 21.0, 18.0, 30.0, 34.0, 32.0, 42.0, 65.0, 63.0, 52.0, 69.0, 76.0, 64.0, 71.0, 54.0, 31.0, 24.0, 31.0, 31.0, 26.0, 19.0, 15.0, 13.0, 16.0, 15.0, 5.0, 6.0, 3.0, 3.0, 3.0, 2.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.390146255493164e-05, -2.3271888494491577e-05, -2.2642314434051514e-05, -2.201274037361145e-05, -2.1383166313171387e-05, -2.0753592252731323e-05, -2.012401819229126e-05, -1.9494444131851196e-05, -1.8864870071411133e-05, -1.823529601097107e-05, -1.7605721950531006e-05, -1.6976147890090942e-05, -1.634657382965088e-05, -1.5716999769210815e-05, -1.5087425708770752e-05, -1.4457851648330688e-05, -1.3828277587890625e-05, -1.3198703527450562e-05, -1.2569129467010498e-05, -1.1939555406570435e-05, -1.1309981346130371e-05, -1.0680407285690308e-05, -1.0050833225250244e-05, -9.42125916481018e-06, -8.791685104370117e-06, -8.162111043930054e-06, -7.53253698348999e-06, -6.902962923049927e-06, -6.273388862609863e-06, -5.6438148021698e-06, -5.014240741729736e-06, -4.384666681289673e-06, -3.7550926208496094e-06, -3.125518560409546e-06, -2.4959444999694824e-06, -1.866370439529419e-06, -1.2367963790893555e-06, -6.07222318649292e-07, 2.2351741790771484e-08, 6.51925802230835e-07, 1.2814998626708984e-06, 1.911073923110962e-06, 2.5406479835510254e-06, 3.170222043991089e-06, 3.7997961044311523e-06, 4.429370164871216e-06, 5.058944225311279e-06, 5.688518285751343e-06, 6.318092346191406e-06, 6.94766640663147e-06, 7.577240467071533e-06, 8.206814527511597e-06, 8.83638858795166e-06, 9.465962648391724e-06, 1.0095536708831787e-05, 1.072511076927185e-05, 1.1354684829711914e-05, 1.1984258890151978e-05, 1.2613832950592041e-05, 1.3243407011032104e-05, 1.3872981071472168e-05, 1.4502555131912231e-05, 1.5132129192352295e-05, 1.576170325279236e-05, 1.6391277313232422e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 1.0, 2.0, 5.0, 10.0, 13.0, 11.0, 21.0, 25.0, 46.0, 56.0, 95.0, 147.0, 239.0, 435.0, 847.0, 1772.0, 4271.0, 13221.0, 59628.0, 501646.0, 388269.0, 57321.0, 12682.0, 4180.0, 1713.0, 769.0, 427.0, 279.0, 144.0, 99.0, 60.0, 34.0, 27.0, 16.0, 16.0, 10.0, 5.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0740966796875, -0.07191658020019531, -0.06973648071289062, -0.06755638122558594, -0.06537628173828125, -0.06319618225097656, -0.061016082763671875, -0.05883598327636719, -0.0566558837890625, -0.05447578430175781, -0.052295684814453125, -0.05011558532714844, -0.04793548583984375, -0.04575538635253906, -0.043575286865234375, -0.04139518737792969, -0.039215087890625, -0.03703498840332031, -0.034854888916015625, -0.03267478942871094, -0.03049468994140625, -0.028314590454101562, -0.026134490966796875, -0.023954391479492188, -0.0217742919921875, -0.019594192504882812, -0.017414093017578125, -0.015233993530273438, -0.01305389404296875, -0.010873794555664062, -0.008693695068359375, -0.0065135955810546875, -0.00433349609375, -0.0021533966064453125, 2.6702880859375e-05, 0.0022068023681640625, 0.00438690185546875, 0.0065670013427734375, 0.008747100830078125, 0.010927200317382812, 0.0131072998046875, 0.015287399291992188, 0.017467498779296875, 0.019647598266601562, 0.02182769775390625, 0.024007797241210938, 0.026187896728515625, 0.028367996215820312, 0.030548095703125, 0.03272819519042969, 0.034908294677734375, 0.03708839416503906, 0.03926849365234375, 0.04144859313964844, 0.043628692626953125, 0.04580879211425781, 0.0479888916015625, 0.05016899108886719, 0.052349090576171875, 0.05452919006347656, 0.05670928955078125, 0.05888938903808594, 0.061069488525390625, 0.06324958801269531, 0.0654296875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 5.0, 3.0, 7.0, 13.0, 7.0, 13.0, 15.0, 13.0, 15.0, 14.0, 28.0, 35.0, 37.0, 41.0, 57.0, 57.0, 82.0, 56.0, 57.0, 65.0, 57.0, 64.0, 42.0, 31.0, 33.0, 33.0, 20.0, 13.0, 22.0, 15.0, 8.0, 6.0, 10.0, 10.0, 3.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048736572265625, -0.04724407196044922, -0.04575157165527344, -0.044259071350097656, -0.042766571044921875, -0.041274070739746094, -0.03978157043457031, -0.03828907012939453, -0.03679656982421875, -0.03530406951904297, -0.03381156921386719, -0.032319068908691406, -0.030826568603515625, -0.029334068298339844, -0.027841567993164062, -0.02634906768798828, -0.0248565673828125, -0.02336406707763672, -0.021871566772460938, -0.020379066467285156, -0.018886566162109375, -0.017394065856933594, -0.015901565551757812, -0.014409065246582031, -0.01291656494140625, -0.011424064636230469, -0.009931564331054688, -0.008439064025878906, -0.006946563720703125, -0.005454063415527344, -0.0039615631103515625, -0.0024690628051757812, -0.0009765625, 0.0005159378051757812, 0.0020084381103515625, 0.0035009384155273438, 0.004993438720703125, 0.006485939025878906, 0.007978439331054688, 0.009470939636230469, 0.01096343994140625, 0.012455940246582031, 0.013948440551757812, 0.015440940856933594, 0.016933441162109375, 0.018425941467285156, 0.019918441772460938, 0.02141094207763672, 0.0229034423828125, 0.02439594268798828, 0.025888442993164062, 0.027380943298339844, 0.028873443603515625, 0.030365943908691406, 0.03185844421386719, 0.03335094451904297, 0.03484344482421875, 0.03633594512939453, 0.03782844543457031, 0.039320945739746094, 0.040813446044921875, 0.042305946350097656, 0.04379844665527344, 0.04529094696044922, 0.046783447265625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 8.0, 8.0, 20.0, 64.0, 127.0, 322.0, 252.0, 112.0, 50.0, 17.0, 9.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4606847763061523, -1.3905689716339111, -1.3204530477523804, -1.2503372430801392, -1.1802213191986084, -1.1101055145263672, -1.039989709854126, -0.96987384557724, -0.899757981300354, -0.829642117023468, -0.759526252746582, -0.6894104480743408, -0.6192945837974548, -0.5491787195205688, -0.47906288504600525, -0.40894705057144165, -0.33883118629455566, -0.2687153220176697, -0.19859948754310608, -0.1284836381673813, -0.058367788791656494, 0.011748075485229492, 0.08186390995979309, 0.1519797444343567, 0.22209560871124268, 0.29221147298812866, 0.36232730746269226, 0.43244314193725586, 0.5025590062141418, 0.5726748704910278, 0.642790675163269, 0.712906539440155, 0.7830226421356201, 0.8531385064125061, 0.9232543706893921, 0.9933701753616333, 1.063486099243164, 1.1336019039154053, 1.2037177085876465, 1.2738335132598877, 1.3439494371414185, 1.4140652418136597, 1.4841811656951904, 1.5542969703674316, 1.6244127750396729, 1.6945286989212036, 1.7646445035934448, 1.8347604274749756, 1.9048762321472168, 1.974992036819458, 2.045107841491699, 2.1152238845825195, 2.1853396892547607, 2.255455493927002, 2.325571298599243, 2.3956871032714844, 2.4658031463623047, 2.535918951034546, 2.606034755706787, 2.6761507987976074, 2.7462666034698486, 2.81638240814209, 2.886498212814331, 2.9566140174865723, 3.0267298221588135]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 6.0, 4.0, 5.0, 11.0, 5.0, 11.0, 6.0, 13.0, 16.0, 15.0, 21.0, 25.0, 29.0, 30.0, 31.0, 30.0, 43.0, 36.0, 48.0, 68.0, 61.0, 65.0, 60.0, 43.0, 53.0, 35.0, 31.0, 22.0, 23.0, 20.0, 19.0, 17.0, 16.0, 13.0, 11.0, 14.0, 7.0, 7.0, 7.0, 6.0, 1.0, 4.0, 6.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.8308830857276917, -0.8063111305236816, -0.7817391753196716, -0.7571672201156616, -0.7325952649116516, -0.7080233097076416, -0.6834513545036316, -0.6588793992996216, -0.6343074440956116, -0.6097354888916016, -0.5851635336875916, -0.5605915784835815, -0.5360196232795715, -0.5114476680755615, -0.4868757128715515, -0.4623037576675415, -0.4377318322658539, -0.41315987706184387, -0.38858792185783386, -0.36401596665382385, -0.33944401144981384, -0.31487205624580383, -0.2903001308441162, -0.2657281756401062, -0.241156205534935, -0.216584250330925, -0.19201229512691498, -0.16744035482406616, -0.14286839962005615, -0.11829643696546555, -0.09372448921203613, -0.06915253400802612, -0.04458057880401611, -0.020008625462651253, 0.004563327878713608, 0.02913527935743332, 0.05370723456144333, 0.07827918976545334, 0.10285113751888275, 0.12742309272289276, 0.15199504792690277, 0.17656700313091278, 0.2011389583349228, 0.2257108986377716, 0.2502828538417816, 0.2748548090457916, 0.29942676424980164, 0.32399871945381165, 0.34857067465782166, 0.37314262986183167, 0.3977145850658417, 0.4222865402698517, 0.4468584954738617, 0.4714304506778717, 0.4960023760795593, 0.5205743312835693, 0.5451462864875793, 0.5697182416915894, 0.5942901968955994, 0.6188621520996094, 0.6434341073036194, 0.6680060625076294, 0.6925780177116394, 0.7171499729156494, 0.7417219281196594]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 3.0, 4.0, 12.0, 12.0, 17.0, 21.0, 52.0, 78.0, 114.0, 215.0, 319.0, 633.0, 1216.0, 2441.0, 5559.0, 15243.0, 52736.0, 312309.0, 2355352.0, 1250542.0, 147460.0, 31583.0, 10148.0, 4193.0, 1863.0, 924.0, 486.0, 297.0, 148.0, 126.0, 65.0, 38.0, 28.0, 16.0, 11.0, 9.0, 8.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.09442138671875, -0.09204959869384766, -0.08967781066894531, -0.08730602264404297, -0.08493423461914062, -0.08256244659423828, -0.08019065856933594, -0.0778188705444336, -0.07544708251953125, -0.0730752944946289, -0.07070350646972656, -0.06833171844482422, -0.06595993041992188, -0.06358814239501953, -0.06121635437011719, -0.058844566345214844, -0.0564727783203125, -0.054100990295410156, -0.05172920227050781, -0.04935741424560547, -0.046985626220703125, -0.04461383819580078, -0.04224205017089844, -0.039870262145996094, -0.03749847412109375, -0.035126686096191406, -0.03275489807128906, -0.03038311004638672, -0.028011322021484375, -0.02563953399658203, -0.023267745971679688, -0.020895957946777344, -0.018524169921875, -0.016152381896972656, -0.013780593872070312, -0.011408805847167969, -0.009037017822265625, -0.006665229797363281, -0.0042934417724609375, -0.0019216537475585938, 0.00045013427734375, 0.0028219223022460938, 0.0051937103271484375, 0.007565498352050781, 0.009937286376953125, 0.012309074401855469, 0.014680862426757812, 0.017052650451660156, 0.0194244384765625, 0.021796226501464844, 0.024168014526367188, 0.02653980255126953, 0.028911590576171875, 0.03128337860107422, 0.03365516662597656, 0.036026954650878906, 0.03839874267578125, 0.040770530700683594, 0.04314231872558594, 0.04551410675048828, 0.047885894775390625, 0.05025768280029297, 0.05262947082519531, 0.055001258850097656, 0.057373046875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 2.0, 5.0, 4.0, 3.0, 8.0, 6.0, 7.0, 12.0, 12.0, 14.0, 27.0, 32.0, 26.0, 24.0, 33.0, 35.0, 34.0, 32.0, 34.0, 33.0, 51.0, 47.0, 49.0, 37.0, 44.0, 32.0, 39.0, 43.0, 34.0, 42.0, 24.0, 24.0, 27.0, 24.0, 22.0, 20.0, 14.0, 10.0, 8.0, 6.0, 7.0, 7.0, 4.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.042877197265625, -0.04151439666748047, -0.04015159606933594, -0.038788795471191406, -0.037425994873046875, -0.036063194274902344, -0.03470039367675781, -0.03333759307861328, -0.03197479248046875, -0.03061199188232422, -0.029249191284179688, -0.027886390686035156, -0.026523590087890625, -0.025160789489746094, -0.023797988891601562, -0.02243518829345703, -0.0210723876953125, -0.01970958709716797, -0.018346786499023438, -0.016983985900878906, -0.015621185302734375, -0.014258384704589844, -0.012895584106445312, -0.011532783508300781, -0.01016998291015625, -0.008807182312011719, -0.0074443817138671875, -0.006081581115722656, -0.004718780517578125, -0.0033559799194335938, -0.0019931793212890625, -0.0006303787231445312, 0.000732421875, 0.0020952224731445312, 0.0034580230712890625, 0.004820823669433594, 0.006183624267578125, 0.007546424865722656, 0.008909225463867188, 0.010272026062011719, 0.01163482666015625, 0.012997627258300781, 0.014360427856445312, 0.015723228454589844, 0.017086029052734375, 0.018448829650878906, 0.019811630249023438, 0.02117443084716797, 0.0225372314453125, 0.02390003204345703, 0.025262832641601562, 0.026625633239746094, 0.027988433837890625, 0.029351234436035156, 0.030714035034179688, 0.03207683563232422, 0.03343963623046875, 0.03480243682861328, 0.03616523742675781, 0.037528038024902344, 0.038890838623046875, 0.040253639221191406, 0.04161643981933594, 0.04297924041748047, 0.044342041015625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 7.0, 9.0, 33.0, 56.0, 58.0, 119.0, 221.0, 459.0, 1071.0, 3519.0, 15478.0, 148591.0, 3665702.0, 327376.0, 24454.0, 4782.0, 1329.0, 467.0, 239.0, 114.0, 63.0, 38.0, 33.0, 17.0, 12.0, 7.0, 10.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1949462890625, -0.18896865844726562, -0.18299102783203125, -0.17701339721679688, -0.1710357666015625, -0.16505813598632812, -0.15908050537109375, -0.15310287475585938, -0.147125244140625, -0.14114761352539062, -0.13516998291015625, -0.12919235229492188, -0.1232147216796875, -0.11723709106445312, -0.11125946044921875, -0.10528182983398438, -0.09930419921875, -0.09332656860351562, -0.08734893798828125, -0.08137130737304688, -0.0753936767578125, -0.06941604614257812, -0.06343841552734375, -0.057460784912109375, -0.051483154296875, -0.045505523681640625, -0.03952789306640625, -0.033550262451171875, -0.0275726318359375, -0.021595001220703125, -0.01561737060546875, -0.009639739990234375, -0.003662109375, 0.002315521240234375, 0.00829315185546875, 0.014270782470703125, 0.0202484130859375, 0.026226043701171875, 0.03220367431640625, 0.038181304931640625, 0.044158935546875, 0.050136566162109375, 0.05611419677734375, 0.062091827392578125, 0.0680694580078125, 0.07404708862304688, 0.08002471923828125, 0.08600234985351562, 0.09197998046875, 0.09795761108398438, 0.10393524169921875, 0.10991287231445312, 0.1158905029296875, 0.12186813354492188, 0.12784576416015625, 0.13382339477539062, 0.139801025390625, 0.14577865600585938, 0.15175628662109375, 0.15773391723632812, 0.1637115478515625, 0.16968917846679688, 0.17566680908203125, 0.18164443969726562, 0.1876220703125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 1.0, 2.0, 3.0, 4.0, 4.0, 10.0, 9.0, 15.0, 12.0, 19.0, 23.0, 35.0, 57.0, 96.0, 113.0, 194.0, 294.0, 423.0, 613.0, 699.0, 465.0, 322.0, 185.0, 137.0, 104.0, 51.0, 41.0, 30.0, 32.0, 15.0, 13.0, 9.0, 11.0, 10.0, 4.0, 2.0, 4.0, 4.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.119140625, -0.11554431915283203, -0.11194801330566406, -0.1083517074584961, -0.10475540161132812, -0.10115909576416016, -0.09756278991699219, -0.09396648406982422, -0.09037017822265625, -0.08677387237548828, -0.08317756652832031, -0.07958126068115234, -0.07598495483398438, -0.0723886489868164, -0.06879234313964844, -0.06519603729248047, -0.0615997314453125, -0.05800342559814453, -0.05440711975097656, -0.050810813903808594, -0.047214508056640625, -0.043618202209472656, -0.04002189636230469, -0.03642559051513672, -0.03282928466796875, -0.02923297882080078, -0.025636672973632812, -0.022040367126464844, -0.018444061279296875, -0.014847755432128906, -0.011251449584960938, -0.007655143737792969, -0.004058837890625, -0.00046253204345703125, 0.0031337738037109375, 0.006730079650878906, 0.010326385498046875, 0.013922691345214844, 0.017518997192382812, 0.02111530303955078, 0.02471160888671875, 0.02830791473388672, 0.03190422058105469, 0.035500526428222656, 0.039096832275390625, 0.042693138122558594, 0.04628944396972656, 0.04988574981689453, 0.0534820556640625, 0.05707836151123047, 0.06067466735839844, 0.0642709732055664, 0.06786727905273438, 0.07146358489990234, 0.07505989074707031, 0.07865619659423828, 0.08225250244140625, 0.08584880828857422, 0.08944511413574219, 0.09304141998291016, 0.09663772583007812, 0.1002340316772461, 0.10383033752441406, 0.10742664337158203, 0.11102294921875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 6.0, 7.0, 9.0, 31.0, 58.0, 177.0, 243.0, 213.0, 143.0, 63.0, 25.0, 13.0, 6.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.8412970304489136, -1.7834926843643188, -1.7256882190704346, -1.6678838729858398, -1.6100794076919556, -1.5522750616073608, -1.4944705963134766, -1.4366662502288818, -1.378861904144287, -1.3210575580596924, -1.263253092765808, -1.2054487466812134, -1.147644281387329, -1.0898399353027344, -1.0320355892181396, -0.9742311239242554, -0.9164266586303711, -0.8586222529411316, -0.8008178472518921, -0.7430135011672974, -0.6852090358734131, -0.6274046897888184, -0.5696002840995789, -0.5117958784103394, -0.45399147272109985, -0.39618706703186035, -0.33838266134262085, -0.28057828545570374, -0.22277387976646423, -0.16496947407722473, -0.10716509819030762, -0.049360692501068115, 0.008443832397460938, 0.06624823063611984, 0.12405262887477875, 0.18185701966285706, 0.23966142535209656, 0.29746583104133606, 0.3552702069282532, 0.4130746126174927, 0.4708790183067322, 0.5286834239959717, 0.5864878296852112, 0.6442922353744507, 0.7020965814590454, 0.7599010467529297, 0.8177053928375244, 0.8755097985267639, 0.9333142042160034, 0.9911186099052429, 1.0489230155944824, 1.1067273616790771, 1.1645318269729614, 1.2223361730575562, 1.2801406383514404, 1.3379449844360352, 1.3957493305206299, 1.4535536766052246, 1.5113581418991089, 1.5691624879837036, 1.626966953277588, 1.6847712993621826, 1.7425756454467773, 1.8003801107406616, 1.858184576034546]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 5.0, 9.0, 14.0, 15.0, 20.0, 25.0, 30.0, 29.0, 52.0, 54.0, 58.0, 79.0, 65.0, 68.0, 65.0, 72.0, 64.0, 45.0, 50.0, 41.0, 29.0, 21.0, 14.0, 21.0, 15.0, 10.0, 4.0, 9.0, 7.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7511221766471863, -0.7279333472251892, -0.7047445178031921, -0.6815556883811951, -0.6583667993545532, -0.6351779699325562, -0.6119891405105591, -0.588800311088562, -0.5656114816665649, -0.5424226522445679, -0.5192338228225708, -0.49604496359825134, -0.4728561341762543, -0.4496673047542572, -0.42647844552993774, -0.4032896161079407, -0.3801007866859436, -0.35691195726394653, -0.33372312784194946, -0.31053426861763, -0.28734543919563293, -0.26415660977363586, -0.2409677654504776, -0.21777892112731934, -0.19459009170532227, -0.1714012622833252, -0.14821241796016693, -0.12502357363700867, -0.1018347442150116, -0.07864590734243393, -0.05545707046985626, -0.032268226146698, -0.009079396724700928, 0.01410944014787674, 0.03729827702045441, 0.060487113893032074, 0.08367595076560974, 0.10686478763818741, 0.13005362451076508, 0.15324246883392334, 0.1764312982559204, 0.19962012767791748, 0.22280897200107574, 0.245997816324234, 0.2691866457462311, 0.29237547516822815, 0.3155643343925476, 0.3387531638145447, 0.36194199323654175, 0.3851308226585388, 0.4083196520805359, 0.43150851130485535, 0.4546973407268524, 0.4778861701488495, 0.501075029373169, 0.524263858795166, 0.5474526882171631, 0.5706415176391602, 0.5938303470611572, 0.6170191764831543, 0.6402080059051514, 0.6633968949317932, 0.6865857243537903, 0.7097745537757874, 0.7329633831977844]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 8.0, 24.0, 29.0, 33.0, 56.0, 86.0, 138.0, 230.0, 387.0, 616.0, 1052.0, 1854.0, 3494.0, 7425.0, 16826.0, 43524.0, 125211.0, 319162.0, 322948.0, 128447.0, 44311.0, 17085.0, 7415.0, 3525.0, 1920.0, 1101.0, 654.0, 374.0, 218.0, 136.0, 99.0, 56.0, 33.0, 29.0, 19.0, 6.0, 13.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06781005859375, -0.06547260284423828, -0.06313514709472656, -0.060797691345214844, -0.058460235595703125, -0.056122779846191406, -0.05378532409667969, -0.05144786834716797, -0.04911041259765625, -0.04677295684814453, -0.04443550109863281, -0.042098045349121094, -0.039760589599609375, -0.037423133850097656, -0.03508567810058594, -0.03274822235107422, -0.0304107666015625, -0.02807331085205078, -0.025735855102539062, -0.023398399353027344, -0.021060943603515625, -0.018723487854003906, -0.016386032104492188, -0.014048576354980469, -0.01171112060546875, -0.009373664855957031, -0.0070362091064453125, -0.004698753356933594, -0.002361297607421875, -2.384185791015625e-05, 0.0023136138916015625, 0.004651069641113281, 0.006988525390625, 0.009325981140136719, 0.011663436889648438, 0.014000892639160156, 0.016338348388671875, 0.018675804138183594, 0.021013259887695312, 0.02335071563720703, 0.02568817138671875, 0.02802562713623047, 0.030363082885742188, 0.032700538635253906, 0.035037994384765625, 0.037375450134277344, 0.03971290588378906, 0.04205036163330078, 0.0443878173828125, 0.04672527313232422, 0.04906272888183594, 0.051400184631347656, 0.053737640380859375, 0.056075096130371094, 0.05841255187988281, 0.06075000762939453, 0.06308746337890625, 0.06542491912841797, 0.06776237487792969, 0.0700998306274414, 0.07243728637695312, 0.07477474212646484, 0.07711219787597656, 0.07944965362548828, 0.081787109375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 8.0, 5.0, 5.0, 10.0, 7.0, 13.0, 17.0, 18.0, 18.0, 18.0, 24.0, 29.0, 39.0, 35.0, 28.0, 40.0, 47.0, 34.0, 42.0, 46.0, 44.0, 37.0, 42.0, 39.0, 35.0, 25.0, 33.0, 22.0, 37.0, 27.0, 32.0, 16.0, 22.0, 18.0, 14.0, 20.0, 7.0, 10.0, 10.0, 2.0, 3.0, 4.0, 5.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04022216796875, -0.03884601593017578, -0.03746986389160156, -0.036093711853027344, -0.034717559814453125, -0.033341407775878906, -0.03196525573730469, -0.03058910369873047, -0.02921295166015625, -0.02783679962158203, -0.026460647583007812, -0.025084495544433594, -0.023708343505859375, -0.022332191467285156, -0.020956039428710938, -0.01957988739013672, -0.0182037353515625, -0.01682758331298828, -0.015451431274414062, -0.014075279235839844, -0.012699127197265625, -0.011322975158691406, -0.009946823120117188, -0.008570671081542969, -0.00719451904296875, -0.005818367004394531, -0.0044422149658203125, -0.0030660629272460938, -0.001689910888671875, -0.00031375885009765625, 0.0010623931884765625, 0.0024385452270507812, 0.003814697265625, 0.005190849304199219, 0.0065670013427734375, 0.007943153381347656, 0.009319305419921875, 0.010695457458496094, 0.012071609497070312, 0.013447761535644531, 0.01482391357421875, 0.01620006561279297, 0.017576217651367188, 0.018952369689941406, 0.020328521728515625, 0.021704673767089844, 0.023080825805664062, 0.02445697784423828, 0.0258331298828125, 0.02720928192138672, 0.028585433959960938, 0.029961585998535156, 0.031337738037109375, 0.032713890075683594, 0.03409004211425781, 0.03546619415283203, 0.03684234619140625, 0.03821849822998047, 0.03959465026855469, 0.040970802307128906, 0.042346954345703125, 0.043723106384277344, 0.04509925842285156, 0.04647541046142578, 0.0478515625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 7.0, 6.0, 5.0, 12.0, 11.0, 12.0, 17.0, 30.0, 35.0, 53.0, 100.0, 201.0, 341.0, 704.0, 1706.0, 5120.0, 22546.0, 163258.0, 718263.0, 112431.0, 16744.0, 4139.0, 1453.0, 590.0, 314.0, 149.0, 100.0, 77.0, 40.0, 31.0, 18.0, 9.0, 9.0, 9.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.160888671875, -0.15634536743164062, -0.15180206298828125, -0.14725875854492188, -0.1427154541015625, -0.13817214965820312, -0.13362884521484375, -0.12908554077148438, -0.124542236328125, -0.11999893188476562, -0.11545562744140625, -0.11091232299804688, -0.1063690185546875, -0.10182571411132812, -0.09728240966796875, -0.09273910522460938, -0.08819580078125, -0.08365249633789062, -0.07910919189453125, -0.07456588745117188, -0.0700225830078125, -0.06547927856445312, -0.06093597412109375, -0.056392669677734375, -0.051849365234375, -0.047306060791015625, -0.04276275634765625, -0.038219451904296875, -0.0336761474609375, -0.029132843017578125, -0.02458953857421875, -0.020046234130859375, -0.0155029296875, -0.010959625244140625, -0.00641632080078125, -0.001873016357421875, 0.0026702880859375, 0.007213592529296875, 0.01175689697265625, 0.016300201416015625, 0.020843505859375, 0.025386810302734375, 0.02993011474609375, 0.034473419189453125, 0.0390167236328125, 0.043560028076171875, 0.04810333251953125, 0.052646636962890625, 0.05718994140625, 0.061733245849609375, 0.06627655029296875, 0.07081985473632812, 0.0753631591796875, 0.07990646362304688, 0.08444976806640625, 0.08899307250976562, 0.093536376953125, 0.09807968139648438, 0.10262298583984375, 0.10716629028320312, 0.1117095947265625, 0.11625289916992188, 0.12079620361328125, 0.12533950805664062, 0.1298828125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 4.0, 9.0, 9.0, 13.0, 14.0, 30.0, 19.0, 29.0, 32.0, 35.0, 33.0, 41.0, 34.0, 60.0, 48.0, 34.0, 42.0, 47.0, 55.0, 51.0, 37.0, 52.0, 40.0, 24.0, 40.0, 32.0, 22.0, 22.0, 13.0, 19.0, 7.0, 6.0, 11.0, 10.0, 5.0, 7.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.185546875, -0.17974853515625, -0.1739501953125, -0.16815185546875, -0.162353515625, -0.15655517578125, -0.1507568359375, -0.14495849609375, -0.13916015625, -0.13336181640625, -0.1275634765625, -0.12176513671875, -0.115966796875, -0.11016845703125, -0.1043701171875, -0.09857177734375, -0.0927734375, -0.08697509765625, -0.0811767578125, -0.07537841796875, -0.069580078125, -0.06378173828125, -0.0579833984375, -0.05218505859375, -0.04638671875, -0.04058837890625, -0.0347900390625, -0.02899169921875, -0.023193359375, -0.01739501953125, -0.0115966796875, -0.00579833984375, 0.0, 0.00579833984375, 0.0115966796875, 0.01739501953125, 0.023193359375, 0.02899169921875, 0.0347900390625, 0.04058837890625, 0.04638671875, 0.05218505859375, 0.0579833984375, 0.06378173828125, 0.069580078125, 0.07537841796875, 0.0811767578125, 0.08697509765625, 0.0927734375, 0.09857177734375, 0.1043701171875, 0.11016845703125, 0.115966796875, 0.12176513671875, 0.1275634765625, 0.13336181640625, 0.13916015625, 0.14495849609375, 0.1507568359375, 0.15655517578125, 0.162353515625, 0.16815185546875, 0.1739501953125, 0.17974853515625, 0.185546875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 2.0, 14.0, 20.0, 25.0, 38.0, 45.0, 68.0, 108.0, 189.0, 334.0, 722.0, 1618.0, 4775.0, 17801.0, 103342.0, 726763.0, 158586.0, 24195.0, 6098.0, 2046.0, 852.0, 381.0, 213.0, 111.0, 68.0, 54.0, 27.0, 21.0, 12.0, 6.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06341552734375, -0.06119823455810547, -0.05898094177246094, -0.056763648986816406, -0.054546356201171875, -0.052329063415527344, -0.05011177062988281, -0.04789447784423828, -0.04567718505859375, -0.04345989227294922, -0.04124259948730469, -0.039025306701660156, -0.036808013916015625, -0.034590721130371094, -0.03237342834472656, -0.03015613555908203, -0.0279388427734375, -0.02572154998779297, -0.023504257202148438, -0.021286964416503906, -0.019069671630859375, -0.016852378845214844, -0.014635086059570312, -0.012417793273925781, -0.01020050048828125, -0.007983207702636719, -0.0057659149169921875, -0.0035486221313476562, -0.001331329345703125, 0.0008859634399414062, 0.0031032562255859375, 0.005320549011230469, 0.007537841796875, 0.009755134582519531, 0.011972427368164062, 0.014189720153808594, 0.016407012939453125, 0.018624305725097656, 0.020841598510742188, 0.02305889129638672, 0.02527618408203125, 0.02749347686767578, 0.029710769653320312, 0.031928062438964844, 0.034145355224609375, 0.036362648010253906, 0.03857994079589844, 0.04079723358154297, 0.0430145263671875, 0.04523181915283203, 0.04744911193847656, 0.049666404724121094, 0.051883697509765625, 0.054100990295410156, 0.05631828308105469, 0.05853557586669922, 0.06075286865234375, 0.06297016143798828, 0.06518745422363281, 0.06740474700927734, 0.06962203979492188, 0.0718393325805664, 0.07405662536621094, 0.07627391815185547, 0.0784912109375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 3.0, 7.0, 13.0, 16.0, 16.0, 35.0, 40.0, 46.0, 64.0, 67.0, 96.0, 86.0, 107.0, 74.0, 87.0, 50.0, 43.0, 38.0, 35.0, 14.0, 16.0, 11.0, 7.0, 13.0, 4.0, 2.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3589859008789062e-05, -1.290440559387207e-05, -1.2218952178955078e-05, -1.1533498764038086e-05, -1.0848045349121094e-05, -1.0162591934204102e-05, -9.47713851928711e-06, -8.791685104370117e-06, -8.106231689453125e-06, -7.420778274536133e-06, -6.735324859619141e-06, -6.0498714447021484e-06, -5.364418029785156e-06, -4.678964614868164e-06, -3.993511199951172e-06, -3.3080577850341797e-06, -2.6226043701171875e-06, -1.9371509552001953e-06, -1.2516975402832031e-06, -5.662441253662109e-07, 1.1920928955078125e-07, 8.046627044677734e-07, 1.4901161193847656e-06, 2.175569534301758e-06, 2.86102294921875e-06, 3.546476364135742e-06, 4.231929779052734e-06, 4.9173831939697266e-06, 5.602836608886719e-06, 6.288290023803711e-06, 6.973743438720703e-06, 7.659196853637695e-06, 8.344650268554688e-06, 9.03010368347168e-06, 9.715557098388672e-06, 1.0401010513305664e-05, 1.1086463928222656e-05, 1.1771917343139648e-05, 1.245737075805664e-05, 1.3142824172973633e-05, 1.3828277587890625e-05, 1.4513731002807617e-05, 1.519918441772461e-05, 1.58846378326416e-05, 1.6570091247558594e-05, 1.7255544662475586e-05, 1.7940998077392578e-05, 1.862645149230957e-05, 1.9311904907226562e-05, 1.9997358322143555e-05, 2.0682811737060547e-05, 2.136826515197754e-05, 2.205371856689453e-05, 2.2739171981811523e-05, 2.3424625396728516e-05, 2.4110078811645508e-05, 2.47955322265625e-05, 2.5480985641479492e-05, 2.6166439056396484e-05, 2.6851892471313477e-05, 2.753734588623047e-05, 2.822279930114746e-05, 2.8908252716064453e-05, 2.9593706130981445e-05, 3.0279159545898438e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 9.0, 8.0, 6.0, 14.0, 14.0, 31.0, 47.0, 83.0, 181.0, 391.0, 946.0, 2824.0, 11516.0, 78043.0, 772579.0, 157426.0, 18114.0, 4105.0, 1251.0, 489.0, 219.0, 114.0, 53.0, 31.0, 19.0, 13.0, 7.0, 7.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06292724609375, -0.060265541076660156, -0.05760383605957031, -0.05494213104248047, -0.052280426025390625, -0.04961872100830078, -0.04695701599121094, -0.044295310974121094, -0.04163360595703125, -0.038971900939941406, -0.03631019592285156, -0.03364849090576172, -0.030986785888671875, -0.02832508087158203, -0.025663375854492188, -0.023001670837402344, -0.0203399658203125, -0.017678260803222656, -0.015016555786132812, -0.012354850769042969, -0.009693145751953125, -0.007031440734863281, -0.0043697357177734375, -0.0017080307006835938, 0.00095367431640625, 0.0036153793334960938, 0.0062770843505859375, 0.008938789367675781, 0.011600494384765625, 0.014262199401855469, 0.016923904418945312, 0.019585609436035156, 0.022247314453125, 0.024909019470214844, 0.027570724487304688, 0.03023242950439453, 0.032894134521484375, 0.03555583953857422, 0.03821754455566406, 0.040879249572753906, 0.04354095458984375, 0.046202659606933594, 0.04886436462402344, 0.05152606964111328, 0.054187774658203125, 0.05684947967529297, 0.05951118469238281, 0.062172889709472656, 0.0648345947265625, 0.06749629974365234, 0.07015800476074219, 0.07281970977783203, 0.07548141479492188, 0.07814311981201172, 0.08080482482910156, 0.0834665298461914, 0.08612823486328125, 0.0887899398803711, 0.09145164489746094, 0.09411334991455078, 0.09677505493164062, 0.09943675994873047, 0.10209846496582031, 0.10476016998291016, 0.107421875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 6.0, 2.0, 2.0, 10.0, 9.0, 21.0, 27.0, 31.0, 42.0, 56.0, 65.0, 69.0, 88.0, 104.0, 91.0, 75.0, 76.0, 55.0, 53.0, 32.0, 24.0, 19.0, 8.0, 10.0, 8.0, 6.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.07061767578125, -0.0686197280883789, -0.06662178039550781, -0.06462383270263672, -0.06262588500976562, -0.06062793731689453, -0.05862998962402344, -0.056632041931152344, -0.05463409423828125, -0.052636146545410156, -0.05063819885253906, -0.04864025115966797, -0.046642303466796875, -0.04464435577392578, -0.04264640808105469, -0.040648460388183594, -0.0386505126953125, -0.036652565002441406, -0.03465461730957031, -0.03265666961669922, -0.030658721923828125, -0.02866077423095703, -0.026662826538085938, -0.024664878845214844, -0.02266693115234375, -0.020668983459472656, -0.018671035766601562, -0.01667308807373047, -0.014675140380859375, -0.012677192687988281, -0.010679244995117188, -0.008681297302246094, -0.006683349609375, -0.004685401916503906, -0.0026874542236328125, -0.0006895065307617188, 0.001308441162109375, 0.0033063888549804688, 0.0053043365478515625, 0.007302284240722656, 0.00930023193359375, 0.011298179626464844, 0.013296127319335938, 0.015294075012207031, 0.017292022705078125, 0.01928997039794922, 0.021287918090820312, 0.023285865783691406, 0.0252838134765625, 0.027281761169433594, 0.029279708862304688, 0.03127765655517578, 0.033275604248046875, 0.03527355194091797, 0.03727149963378906, 0.039269447326660156, 0.04126739501953125, 0.043265342712402344, 0.04526329040527344, 0.04726123809814453, 0.049259185791015625, 0.05125713348388672, 0.05325508117675781, 0.055253028869628906, 0.0572509765625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 8.0, 17.0, 32.0, 121.0, 363.0, 297.0, 108.0, 36.0, 12.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.206325054168701, -2.137188673019409, -2.0680525302886963, -1.9989162683486938, -1.9297800064086914, -1.8606436252593994, -1.791507363319397, -1.7223711013793945, -1.653234839439392, -1.5840985774993896, -1.5149623155593872, -1.4458260536193848, -1.3766896724700928, -1.3075535297393799, -1.238417148590088, -1.1692808866500854, -1.100144624710083, -1.0310083627700806, -0.9618721008300781, -0.8927357792854309, -0.8235995173454285, -0.754463255405426, -0.6853269338607788, -0.6161906719207764, -0.5470544099807739, -0.4779181480407715, -0.40878185629844666, -0.3396455645561218, -0.2705093026161194, -0.20137304067611694, -0.13223674893379211, -0.06310045719146729, 0.006036043167114258, 0.0751723200082779, 0.14430859684944153, 0.21344487369060516, 0.2825811505317688, 0.35171741247177124, 0.42085370421409607, 0.4899899959564209, 0.5591262578964233, 0.6282625198364258, 0.6973987817764282, 0.7665351033210754, 0.8356713652610779, 0.9048076272010803, 0.9739439487457275, 1.04308021068573, 1.1122164726257324, 1.1813527345657349, 1.2504889965057373, 1.3196252584457397, 1.3887615203857422, 1.4578979015350342, 1.5270341634750366, 1.596170425415039, 1.6653066873550415, 1.734442949295044, 1.8035792112350464, 1.8727154731750488, 1.9418518543243408, 2.0109879970550537, 2.0801243782043457, 2.1492605209350586, 2.2183969020843506]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 0.0, 3.0, 4.0, 3.0, 6.0, 4.0, 9.0, 7.0, 5.0, 10.0, 11.0, 8.0, 13.0, 15.0, 14.0, 21.0, 22.0, 24.0, 28.0, 32.0, 37.0, 43.0, 48.0, 76.0, 61.0, 65.0, 57.0, 59.0, 43.0, 35.0, 21.0, 36.0, 31.0, 26.0, 24.0, 10.0, 19.0, 20.0, 9.0, 11.0, 9.0, 5.0, 6.0, 6.0, 9.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6456982493400574, -0.623222827911377, -0.6007474660873413, -0.5782720446586609, -0.5557966232299805, -0.5333212018013, -0.5108457803726196, -0.488370418548584, -0.46589499711990356, -0.44341957569122314, -0.4209441840648651, -0.3984687924385071, -0.37599337100982666, -0.35351794958114624, -0.3310425579547882, -0.3085671663284302, -0.28609174489974976, -0.26361632347106934, -0.2411409318447113, -0.21866552531719208, -0.19619011878967285, -0.17371471226215363, -0.1512393057346344, -0.12876389920711517, -0.10628849267959595, -0.08381308615207672, -0.061337679624557495, -0.03886227309703827, -0.016386866569519043, 0.006088539958000183, 0.02856394648551941, 0.051039353013038635, 0.07351481914520264, 0.09599022567272186, 0.11846563220024109, 0.14094103872776031, 0.16341644525527954, 0.18589185178279877, 0.208367258310318, 0.23084266483783722, 0.25331807136535645, 0.27579349279403687, 0.2982688844203949, 0.32074427604675293, 0.34321969747543335, 0.36569511890411377, 0.3881705105304718, 0.41064590215682983, 0.43312132358551025, 0.4555967450141907, 0.4780721366405487, 0.5005475282669067, 0.5230229496955872, 0.5454983711242676, 0.5679737329483032, 0.5904491543769836, 0.6129245758056641, 0.6353999972343445, 0.6578754186630249, 0.6803507804870605, 0.702826201915741, 0.7253016233444214, 0.747776985168457, 0.7702524065971375, 0.7927278280258179]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 2.0, 3.0, 8.0, 7.0, 16.0, 17.0, 22.0, 39.0, 37.0, 81.0, 127.0, 177.0, 285.0, 460.0, 737.0, 1248.0, 2275.0, 4059.0, 7655.0, 16602.0, 45034.0, 173660.0, 982675.0, 2231021.0, 559787.0, 109053.0, 32024.0, 12876.0, 6157.0, 3267.0, 1924.0, 1107.0, 647.0, 411.0, 263.0, 173.0, 115.0, 75.0, 45.0, 40.0, 31.0, 22.0, 9.0, 9.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.051666259765625, -0.049776554107666016, -0.04788684844970703, -0.04599714279174805, -0.04410743713378906, -0.04221773147583008, -0.040328025817871094, -0.03843832015991211, -0.036548614501953125, -0.03465890884399414, -0.032769203186035156, -0.030879497528076172, -0.028989791870117188, -0.027100086212158203, -0.02521038055419922, -0.023320674896240234, -0.02143096923828125, -0.019541263580322266, -0.01765155792236328, -0.015761852264404297, -0.013872146606445312, -0.011982440948486328, -0.010092735290527344, -0.00820302963256836, -0.006313323974609375, -0.004423618316650391, -0.0025339126586914062, -0.0006442070007324219, 0.0012454986572265625, 0.003135204315185547, 0.005024909973144531, 0.006914615631103516, 0.0088043212890625, 0.010694026947021484, 0.012583732604980469, 0.014473438262939453, 0.016363143920898438, 0.018252849578857422, 0.020142555236816406, 0.02203226089477539, 0.023921966552734375, 0.02581167221069336, 0.027701377868652344, 0.029591083526611328, 0.03148078918457031, 0.0333704948425293, 0.03526020050048828, 0.037149906158447266, 0.03903961181640625, 0.040929317474365234, 0.04281902313232422, 0.0447087287902832, 0.04659843444824219, 0.04848814010620117, 0.050377845764160156, 0.05226755142211914, 0.054157257080078125, 0.05604696273803711, 0.057936668395996094, 0.05982637405395508, 0.06171607971191406, 0.06360578536987305, 0.06549549102783203, 0.06738519668579102, 0.06927490234375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 7.0, 7.0, 4.0, 6.0, 6.0, 8.0, 9.0, 12.0, 23.0, 18.0, 22.0, 20.0, 36.0, 51.0, 37.0, 44.0, 42.0, 37.0, 56.0, 58.0, 54.0, 45.0, 54.0, 34.0, 45.0, 50.0, 34.0, 33.0, 36.0, 17.0, 21.0, 17.0, 23.0, 12.0, 4.0, 7.0, 9.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.055450439453125, -0.053768157958984375, -0.05208587646484375, -0.050403594970703125, -0.0487213134765625, -0.047039031982421875, -0.04535675048828125, -0.043674468994140625, -0.0419921875, -0.040309906005859375, -0.03862762451171875, -0.036945343017578125, -0.0352630615234375, -0.033580780029296875, -0.03189849853515625, -0.030216217041015625, -0.028533935546875, -0.026851654052734375, -0.02516937255859375, -0.023487091064453125, -0.0218048095703125, -0.020122528076171875, -0.01844024658203125, -0.016757965087890625, -0.01507568359375, -0.013393402099609375, -0.01171112060546875, -0.010028839111328125, -0.0083465576171875, -0.006664276123046875, -0.00498199462890625, -0.003299713134765625, -0.001617431640625, 6.4849853515625e-05, 0.00174713134765625, 0.003429412841796875, 0.0051116943359375, 0.006793975830078125, 0.00847625732421875, 0.010158538818359375, 0.0118408203125, 0.013523101806640625, 0.01520538330078125, 0.016887664794921875, 0.0185699462890625, 0.020252227783203125, 0.02193450927734375, 0.023616790771484375, 0.025299072265625, 0.026981353759765625, 0.02866363525390625, 0.030345916748046875, 0.0320281982421875, 0.033710479736328125, 0.03539276123046875, 0.037075042724609375, 0.03875732421875, 0.040439605712890625, 0.04212188720703125, 0.043804168701171875, 0.0454864501953125, 0.047168731689453125, 0.04885101318359375, 0.050533294677734375, 0.052215576171875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 3.0, 9.0, 9.0, 16.0, 30.0, 36.0, 72.0, 94.0, 181.0, 536.0, 1914.0, 9065.0, 88956.0, 3719728.0, 350134.0, 18727.0, 3254.0, 843.0, 312.0, 128.0, 64.0, 47.0, 24.0, 25.0, 17.0, 13.0, 9.0, 8.0, 5.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1859130859375, -0.1791973114013672, -0.17248153686523438, -0.16576576232910156, -0.15904998779296875, -0.15233421325683594, -0.14561843872070312, -0.1389026641845703, -0.1321868896484375, -0.1254711151123047, -0.11875534057617188, -0.11203956604003906, -0.10532379150390625, -0.09860801696777344, -0.09189224243164062, -0.08517646789550781, -0.078460693359375, -0.07174491882324219, -0.06502914428710938, -0.05831336975097656, -0.05159759521484375, -0.04488182067871094, -0.038166046142578125, -0.03145027160644531, -0.0247344970703125, -0.018018722534179688, -0.011302947998046875, -0.0045871734619140625, 0.00212860107421875, 0.008844375610351562, 0.015560150146484375, 0.022275924682617188, 0.02899169921875, 0.03570747375488281, 0.042423248291015625, 0.04913902282714844, 0.05585479736328125, 0.06257057189941406, 0.06928634643554688, 0.07600212097167969, 0.0827178955078125, 0.08943367004394531, 0.09614944458007812, 0.10286521911621094, 0.10958099365234375, 0.11629676818847656, 0.12301254272460938, 0.1297283172607422, 0.136444091796875, 0.1431598663330078, 0.14987564086914062, 0.15659141540527344, 0.16330718994140625, 0.17002296447753906, 0.17673873901367188, 0.1834545135498047, 0.1901702880859375, 0.1968860626220703, 0.20360183715820312, 0.21031761169433594, 0.21703338623046875, 0.22374916076660156, 0.23046493530273438, 0.2371807098388672, 0.243896484375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 7.0, 5.0, 7.0, 5.0, 11.0, 15.0, 15.0, 22.0, 37.0, 47.0, 53.0, 98.0, 148.0, 266.0, 376.0, 618.0, 664.0, 621.0, 369.0, 230.0, 125.0, 105.0, 59.0, 48.0, 27.0, 23.0, 14.0, 10.0, 16.0, 5.0, 6.0, 4.0, 3.0, 6.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10040283203125, -0.09674739837646484, -0.09309196472167969, -0.08943653106689453, -0.08578109741210938, -0.08212566375732422, -0.07847023010253906, -0.0748147964477539, -0.07115936279296875, -0.0675039291381836, -0.06384849548339844, -0.06019306182861328, -0.056537628173828125, -0.05288219451904297, -0.04922676086425781, -0.045571327209472656, -0.0419158935546875, -0.038260459899902344, -0.03460502624511719, -0.03094959259033203, -0.027294158935546875, -0.02363872528076172, -0.019983291625976562, -0.016327857971191406, -0.01267242431640625, -0.009016990661621094, -0.0053615570068359375, -0.0017061233520507812, 0.001949310302734375, 0.005604743957519531, 0.009260177612304688, 0.012915611267089844, 0.016571044921875, 0.020226478576660156, 0.023881912231445312, 0.02753734588623047, 0.031192779541015625, 0.03484821319580078, 0.03850364685058594, 0.042159080505371094, 0.04581451416015625, 0.049469947814941406, 0.05312538146972656, 0.05678081512451172, 0.060436248779296875, 0.06409168243408203, 0.06774711608886719, 0.07140254974365234, 0.0750579833984375, 0.07871341705322266, 0.08236885070800781, 0.08602428436279297, 0.08967971801757812, 0.09333515167236328, 0.09699058532714844, 0.1006460189819336, 0.10430145263671875, 0.1079568862915039, 0.11161231994628906, 0.11526775360107422, 0.11892318725585938, 0.12257862091064453, 0.1262340545654297, 0.12988948822021484, 0.133544921875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 9.0, 10.0, 30.0, 56.0, 112.0, 174.0, 234.0, 171.0, 92.0, 68.0, 18.0, 11.0, 7.0, 5.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0755388736724854, -1.0312937498092651, -0.9870485663414001, -0.9428034424781799, -0.8985582590103149, -0.8543131351470947, -0.8100680112838745, -0.7658228278160095, -0.7215776443481445, -0.6773325204849243, -0.6330873370170593, -0.5888422131538391, -0.5445970296859741, -0.5003519058227539, -0.4561067521572113, -0.4118615984916687, -0.3676164746284485, -0.3233713209629059, -0.2791261672973633, -0.23488102853298187, -0.19063587486743927, -0.14639072120189667, -0.10214558243751526, -0.057900428771972656, -0.013655275106430054, 0.03058987483382225, 0.07483502477407455, 0.11908017098903656, 0.16332532465457916, 0.20757047832012177, 0.2518156170845032, 0.2960607707500458, 0.3403059244155884, 0.384551078081131, 0.4287962317466736, 0.4730413556098938, 0.5172865390777588, 0.561531662940979, 0.6057767868041992, 0.6500219702720642, 0.6942671537399292, 0.7385122776031494, 0.7827574610710144, 0.8270025849342346, 0.8712477684020996, 0.9154928922653198, 0.95973801612854, 1.0039832592010498, 1.0482282638549805, 1.0924733877182007, 1.136718511581421, 1.1809637546539307, 1.2252088785171509, 1.269454002380371, 1.3136991262435913, 1.3579442501068115, 1.4021894931793213, 1.4464346170425415, 1.4906797409057617, 1.5349249839782715, 1.5791701078414917, 1.623415231704712, 1.6676603555679321, 1.7119054794311523, 1.756150722503662]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 7.0, 8.0, 9.0, 10.0, 10.0, 14.0, 13.0, 21.0, 15.0, 18.0, 29.0, 29.0, 33.0, 41.0, 52.0, 50.0, 51.0, 45.0, 47.0, 52.0, 55.0, 61.0, 38.0, 39.0, 35.0, 40.0, 28.0, 17.0, 25.0, 15.0, 11.0, 15.0, 15.0, 17.0, 17.0, 2.0, 3.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.5719928741455078, -0.5546301603317261, -0.5372673869132996, -0.519904613494873, -0.5025418996810913, -0.4851791560649872, -0.46781641244888306, -0.45045366883277893, -0.4330909252166748, -0.4157281816005707, -0.39836543798446655, -0.3810026943683624, -0.3636399507522583, -0.3462772071361542, -0.32891446352005005, -0.3115517199039459, -0.2941889762878418, -0.27682623267173767, -0.25946348905563354, -0.24210074543952942, -0.2247380018234253, -0.20737525820732117, -0.19001251459121704, -0.17264977097511292, -0.1552870273590088, -0.13792428374290466, -0.12056154012680054, -0.10319879651069641, -0.08583605289459229, -0.06847330927848816, -0.05111056566238403, -0.03374782204627991, -0.016385138034820557, 0.0009776055812835693, 0.018340349197387695, 0.03570309281349182, 0.05306583642959595, 0.07042858004570007, 0.0877913236618042, 0.10515406727790833, 0.12251681089401245, 0.13987955451011658, 0.1572422981262207, 0.17460504174232483, 0.19196778535842896, 0.20933052897453308, 0.2266932725906372, 0.24405601620674133, 0.26141875982284546, 0.2787815034389496, 0.2961442470550537, 0.31350699067115784, 0.33086973428726196, 0.3482324779033661, 0.3655952215194702, 0.38295796513557434, 0.40032070875167847, 0.4176834523677826, 0.4350461959838867, 0.45240893959999084, 0.46977168321609497, 0.4871344268321991, 0.5044971704483032, 0.521859884262085, 0.5392226576805115]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 15.0, 8.0, 17.0, 32.0, 37.0, 43.0, 66.0, 123.0, 160.0, 259.0, 441.0, 812.0, 1279.0, 2497.0, 5165.0, 11566.0, 32259.0, 108556.0, 370343.0, 358759.0, 103291.0, 31142.0, 11239.0, 4784.0, 2403.0, 1287.0, 754.0, 395.0, 272.0, 171.0, 120.0, 75.0, 54.0, 34.0, 31.0, 23.0, 12.0, 8.0, 7.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08160400390625, -0.07888221740722656, -0.07616043090820312, -0.07343864440917969, -0.07071685791015625, -0.06799507141113281, -0.06527328491210938, -0.06255149841308594, -0.0598297119140625, -0.05710792541503906, -0.054386138916015625, -0.05166435241699219, -0.04894256591796875, -0.04622077941894531, -0.043498992919921875, -0.04077720642089844, -0.038055419921875, -0.03533363342285156, -0.032611846923828125, -0.029890060424804688, -0.02716827392578125, -0.024446487426757812, -0.021724700927734375, -0.019002914428710938, -0.0162811279296875, -0.013559341430664062, -0.010837554931640625, -0.008115768432617188, -0.00539398193359375, -0.0026721954345703125, 4.9591064453125e-05, 0.0027713775634765625, 0.0054931640625, 0.008214950561523438, 0.010936737060546875, 0.013658523559570312, 0.01638031005859375, 0.019102096557617188, 0.021823883056640625, 0.024545669555664062, 0.0272674560546875, 0.029989242553710938, 0.032711029052734375, 0.03543281555175781, 0.03815460205078125, 0.04087638854980469, 0.043598175048828125, 0.04631996154785156, 0.049041748046875, 0.05176353454589844, 0.054485321044921875, 0.05720710754394531, 0.05992889404296875, 0.06265068054199219, 0.06537246704101562, 0.06809425354003906, 0.0708160400390625, 0.07353782653808594, 0.07625961303710938, 0.07898139953613281, 0.08170318603515625, 0.08442497253417969, 0.08714675903320312, 0.08986854553222656, 0.09259033203125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 3.0, 6.0, 10.0, 12.0, 11.0, 14.0, 29.0, 24.0, 36.0, 30.0, 36.0, 38.0, 50.0, 51.0, 45.0, 54.0, 51.0, 50.0, 57.0, 49.0, 61.0, 42.0, 42.0, 30.0, 30.0, 16.0, 27.0, 24.0, 19.0, 13.0, 7.0, 10.0, 6.0, 2.0, 4.0, 3.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055694580078125, -0.053822994232177734, -0.05195140838623047, -0.0500798225402832, -0.04820823669433594, -0.04633665084838867, -0.044465065002441406, -0.04259347915649414, -0.040721893310546875, -0.03885030746459961, -0.036978721618652344, -0.03510713577270508, -0.03323554992675781, -0.03136396408081055, -0.02949237823486328, -0.027620792388916016, -0.02574920654296875, -0.023877620697021484, -0.02200603485107422, -0.020134449005126953, -0.018262863159179688, -0.016391277313232422, -0.014519691467285156, -0.01264810562133789, -0.010776519775390625, -0.00890493392944336, -0.007033348083496094, -0.005161762237548828, -0.0032901763916015625, -0.0014185905456542969, 0.00045299530029296875, 0.0023245811462402344, 0.0041961669921875, 0.006067752838134766, 0.007939338684082031, 0.009810924530029297, 0.011682510375976562, 0.013554096221923828, 0.015425682067871094, 0.01729726791381836, 0.019168853759765625, 0.02104043960571289, 0.022912025451660156, 0.024783611297607422, 0.026655197143554688, 0.028526782989501953, 0.03039836883544922, 0.032269954681396484, 0.03414154052734375, 0.036013126373291016, 0.03788471221923828, 0.03975629806518555, 0.04162788391113281, 0.04349946975708008, 0.045371055603027344, 0.04724264144897461, 0.049114227294921875, 0.05098581314086914, 0.052857398986816406, 0.05472898483276367, 0.05660057067871094, 0.0584721565246582, 0.06034374237060547, 0.062215328216552734, 0.0640869140625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 4.0, 10.0, 6.0, 16.0, 11.0, 14.0, 36.0, 39.0, 74.0, 100.0, 191.0, 292.0, 624.0, 1277.0, 3379.0, 11080.0, 53497.0, 593125.0, 326432.0, 43424.0, 9398.0, 2981.0, 1236.0, 548.0, 263.0, 182.0, 103.0, 61.0, 52.0, 34.0, 23.0, 16.0, 8.0, 3.0, 4.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.1512451171875, -0.14715099334716797, -0.14305686950683594, -0.1389627456665039, -0.13486862182617188, -0.13077449798583984, -0.1266803741455078, -0.12258625030517578, -0.11849212646484375, -0.11439800262451172, -0.11030387878417969, -0.10620975494384766, -0.10211563110351562, -0.0980215072631836, -0.09392738342285156, -0.08983325958251953, -0.0857391357421875, -0.08164501190185547, -0.07755088806152344, -0.0734567642211914, -0.06936264038085938, -0.06526851654052734, -0.06117439270019531, -0.05708026885986328, -0.05298614501953125, -0.04889202117919922, -0.04479789733886719, -0.040703773498535156, -0.036609649658203125, -0.032515525817871094, -0.028421401977539062, -0.02432727813720703, -0.020233154296875, -0.01613903045654297, -0.012044906616210938, -0.007950782775878906, -0.003856658935546875, 0.00023746490478515625, 0.0043315887451171875, 0.008425712585449219, 0.01251983642578125, 0.01661396026611328, 0.020708084106445312, 0.024802207946777344, 0.028896331787109375, 0.032990455627441406, 0.03708457946777344, 0.04117870330810547, 0.0452728271484375, 0.04936695098876953, 0.05346107482910156, 0.057555198669433594, 0.061649322509765625, 0.06574344635009766, 0.06983757019042969, 0.07393169403076172, 0.07802581787109375, 0.08211994171142578, 0.08621406555175781, 0.09030818939208984, 0.09440231323242188, 0.0984964370727539, 0.10259056091308594, 0.10668468475341797, 0.11077880859375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 2.0, 5.0, 3.0, 7.0, 8.0, 4.0, 9.0, 5.0, 13.0, 26.0, 20.0, 31.0, 40.0, 32.0, 35.0, 40.0, 50.0, 51.0, 64.0, 49.0, 55.0, 54.0, 51.0, 45.0, 51.0, 42.0, 28.0, 34.0, 36.0, 28.0, 23.0, 8.0, 7.0, 10.0, 8.0, 8.0, 4.0, 6.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.238037109375, -0.231414794921875, -0.22479248046875, -0.218170166015625, -0.2115478515625, -0.204925537109375, -0.19830322265625, -0.191680908203125, -0.18505859375, -0.178436279296875, -0.17181396484375, -0.165191650390625, -0.1585693359375, -0.151947021484375, -0.14532470703125, -0.138702392578125, -0.132080078125, -0.125457763671875, -0.11883544921875, -0.112213134765625, -0.1055908203125, -0.098968505859375, -0.09234619140625, -0.085723876953125, -0.0791015625, -0.072479248046875, -0.06585693359375, -0.059234619140625, -0.0526123046875, -0.045989990234375, -0.03936767578125, -0.032745361328125, -0.026123046875, -0.019500732421875, -0.01287841796875, -0.006256103515625, 0.0003662109375, 0.006988525390625, 0.01361083984375, 0.020233154296875, 0.02685546875, 0.033477783203125, 0.04010009765625, 0.046722412109375, 0.0533447265625, 0.059967041015625, 0.06658935546875, 0.073211669921875, 0.079833984375, 0.086456298828125, 0.09307861328125, 0.099700927734375, 0.1063232421875, 0.112945556640625, 0.11956787109375, 0.126190185546875, 0.1328125, 0.139434814453125, 0.14605712890625, 0.152679443359375, 0.1593017578125, 0.165924072265625, 0.17254638671875, 0.179168701171875, 0.185791015625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 8.0, 6.0, 20.0, 15.0, 31.0, 43.0, 33.0, 87.0, 148.0, 244.0, 431.0, 825.0, 1621.0, 3315.0, 7342.0, 18753.0, 54751.0, 202517.0, 596082.0, 107312.0, 32827.0, 12195.0, 4970.0, 2318.0, 1110.0, 667.0, 342.0, 197.0, 139.0, 81.0, 39.0, 37.0, 14.0, 16.0, 11.0, 7.0, 0.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.025390625, -0.02429962158203125, -0.0232086181640625, -0.02211761474609375, -0.021026611328125, -0.01993560791015625, -0.0188446044921875, -0.01775360107421875, -0.01666259765625, -0.01557159423828125, -0.0144805908203125, -0.01338958740234375, -0.012298583984375, -0.01120758056640625, -0.0101165771484375, -0.00902557373046875, -0.0079345703125, -0.00684356689453125, -0.0057525634765625, -0.00466156005859375, -0.003570556640625, -0.00247955322265625, -0.0013885498046875, -0.00029754638671875, 0.00079345703125, 0.00188446044921875, 0.0029754638671875, 0.00406646728515625, 0.005157470703125, 0.00624847412109375, 0.0073394775390625, 0.00843048095703125, 0.009521484375, 0.01061248779296875, 0.0117034912109375, 0.01279449462890625, 0.013885498046875, 0.01497650146484375, 0.0160675048828125, 0.01715850830078125, 0.01824951171875, 0.01934051513671875, 0.0204315185546875, 0.02152252197265625, 0.022613525390625, 0.02370452880859375, 0.0247955322265625, 0.02588653564453125, 0.0269775390625, 0.02806854248046875, 0.0291595458984375, 0.03025054931640625, 0.031341552734375, 0.03243255615234375, 0.0335235595703125, 0.03461456298828125, 0.03570556640625, 0.03679656982421875, 0.0378875732421875, 0.03897857666015625, 0.040069580078125, 0.04116058349609375, 0.0422515869140625, 0.04334259033203125, 0.04443359375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 7.0, 11.0, 12.0, 13.0, 18.0, 28.0, 35.0, 52.0, 49.0, 68.0, 72.0, 115.0, 102.0, 80.0, 71.0, 70.0, 53.0, 37.0, 29.0, 19.0, 9.0, 12.0, 8.0, 7.0, 9.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1219253540039062e-05, -2.0633451640605927e-05, -2.004764974117279e-05, -1.9461847841739655e-05, -1.887604594230652e-05, -1.8290244042873383e-05, -1.7704442143440247e-05, -1.711864024400711e-05, -1.6532838344573975e-05, -1.594703644514084e-05, -1.5361234545707703e-05, -1.4775432646274567e-05, -1.418963074684143e-05, -1.3603828847408295e-05, -1.3018026947975159e-05, -1.2432225048542023e-05, -1.1846423149108887e-05, -1.126062124967575e-05, -1.0674819350242615e-05, -1.0089017450809479e-05, -9.503215551376343e-06, -8.917413651943207e-06, -8.33161175251007e-06, -7.745809853076935e-06, -7.160007953643799e-06, -6.574206054210663e-06, -5.988404154777527e-06, -5.402602255344391e-06, -4.816800355911255e-06, -4.230998456478119e-06, -3.645196557044983e-06, -3.059394657611847e-06, -2.473592758178711e-06, -1.887790858745575e-06, -1.301988959312439e-06, -7.16187059879303e-07, -1.30385160446167e-07, 4.55416738986969e-07, 1.041218638420105e-06, 1.627020537853241e-06, 2.212822437286377e-06, 2.798624336719513e-06, 3.384426236152649e-06, 3.970228135585785e-06, 4.556030035018921e-06, 5.141831934452057e-06, 5.727633833885193e-06, 6.313435733318329e-06, 6.899237632751465e-06, 7.485039532184601e-06, 8.070841431617737e-06, 8.656643331050873e-06, 9.242445230484009e-06, 9.828247129917145e-06, 1.041404902935028e-05, 1.0999850928783417e-05, 1.1585652828216553e-05, 1.2171454727649689e-05, 1.2757256627082825e-05, 1.334305852651596e-05, 1.3928860425949097e-05, 1.4514662325382233e-05, 1.5100464224815369e-05, 1.5686266124248505e-05, 1.627206802368164e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 1.0, 3.0, 4.0, 7.0, 9.0, 19.0, 14.0, 37.0, 58.0, 118.0, 195.0, 395.0, 920.0, 2418.0, 7681.0, 33530.0, 226068.0, 687888.0, 69336.0, 13540.0, 3807.0, 1302.0, 595.0, 251.0, 138.0, 87.0, 47.0, 28.0, 28.0, 14.0, 5.0, 3.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048431396484375, -0.046651363372802734, -0.04487133026123047, -0.0430912971496582, -0.04131126403808594, -0.03953123092651367, -0.037751197814941406, -0.03597116470336914, -0.034191131591796875, -0.03241109848022461, -0.030631065368652344, -0.028851032257080078, -0.027070999145507812, -0.025290966033935547, -0.02351093292236328, -0.021730899810791016, -0.01995086669921875, -0.018170833587646484, -0.01639080047607422, -0.014610767364501953, -0.012830734252929688, -0.011050701141357422, -0.009270668029785156, -0.007490634918212891, -0.005710601806640625, -0.003930568695068359, -0.0021505355834960938, -0.0003705024719238281, 0.0014095306396484375, 0.003189563751220703, 0.004969596862792969, 0.006749629974365234, 0.0085296630859375, 0.010309696197509766, 0.012089729309082031, 0.013869762420654297, 0.015649795532226562, 0.017429828643798828, 0.019209861755371094, 0.02098989486694336, 0.022769927978515625, 0.02454996109008789, 0.026329994201660156, 0.028110027313232422, 0.029890060424804688, 0.03167009353637695, 0.03345012664794922, 0.035230159759521484, 0.03701019287109375, 0.038790225982666016, 0.04057025909423828, 0.04235029220581055, 0.04413032531738281, 0.04591035842895508, 0.047690391540527344, 0.04947042465209961, 0.051250457763671875, 0.05303049087524414, 0.054810523986816406, 0.05659055709838867, 0.05837059020996094, 0.0601506233215332, 0.06193065643310547, 0.06371068954467773, 0.06549072265625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 6.0, 6.0, 17.0, 13.0, 16.0, 30.0, 28.0, 30.0, 38.0, 60.0, 73.0, 111.0, 108.0, 101.0, 84.0, 59.0, 48.0, 27.0, 32.0, 26.0, 17.0, 15.0, 14.0, 6.0, 5.0, 6.0, 4.0, 5.0, 6.0, 2.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05499267578125, -0.0534820556640625, -0.051971435546875, -0.0504608154296875, -0.0489501953125, -0.0474395751953125, -0.045928955078125, -0.0444183349609375, -0.04290771484375, -0.0413970947265625, -0.039886474609375, -0.0383758544921875, -0.036865234375, -0.0353546142578125, -0.033843994140625, -0.0323333740234375, -0.03082275390625, -0.0293121337890625, -0.027801513671875, -0.0262908935546875, -0.0247802734375, -0.0232696533203125, -0.021759033203125, -0.0202484130859375, -0.01873779296875, -0.0172271728515625, -0.015716552734375, -0.0142059326171875, -0.0126953125, -0.0111846923828125, -0.009674072265625, -0.0081634521484375, -0.00665283203125, -0.0051422119140625, -0.003631591796875, -0.0021209716796875, -0.0006103515625, 0.0009002685546875, 0.002410888671875, 0.0039215087890625, 0.00543212890625, 0.0069427490234375, 0.008453369140625, 0.0099639892578125, 0.011474609375, 0.0129852294921875, 0.014495849609375, 0.0160064697265625, 0.01751708984375, 0.0190277099609375, 0.020538330078125, 0.0220489501953125, 0.0235595703125, 0.0250701904296875, 0.026580810546875, 0.0280914306640625, 0.02960205078125, 0.0311126708984375, 0.032623291015625, 0.0341339111328125, 0.03564453125, 0.0371551513671875, 0.038665771484375, 0.0401763916015625, 0.04168701171875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 6.0, 3.0, 3.0, 8.0, 8.0, 23.0, 39.0, 90.0, 148.0, 319.0, 190.0, 82.0, 52.0, 18.0, 7.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1870087385177612, -1.1456937789916992, -1.1043787002563477, -1.0630637407302856, -1.0217487812042236, -0.9804337024688721, -0.9391187429428101, -0.8978037238121033, -0.8564887046813965, -0.8151736855506897, -0.7738586664199829, -0.7325437068939209, -0.6912286877632141, -0.6499136686325073, -0.6085987091064453, -0.5672836899757385, -0.5259686708450317, -0.48465365171432495, -0.44333866238594055, -0.40202367305755615, -0.36070865392684937, -0.3193936347961426, -0.2780786454677582, -0.23676365613937378, -0.195448637008667, -0.1541336327791214, -0.1128186285495758, -0.07150362432003021, -0.03018862009048462, 0.011126384139060974, 0.05244138836860657, 0.09375637769699097, 0.1350712776184082, 0.1763862818479538, 0.2177012860774994, 0.2590162754058838, 0.3003312945365906, 0.34164631366729736, 0.38296130299568176, 0.42427629232406616, 0.46559131145477295, 0.5069063305854797, 0.5482213497161865, 0.5895363092422485, 0.6308513283729553, 0.6721663475036621, 0.7134813070297241, 0.7547963261604309, 0.7961113452911377, 0.8374263644218445, 0.8787413835525513, 0.9200563430786133, 0.9613713622093201, 1.0026863813400269, 1.0440013408660889, 1.0853164196014404, 1.1266313791275024, 1.1679463386535645, 1.209261417388916, 1.250576376914978, 1.29189133644104, 1.3332064151763916, 1.3745213747024536, 1.4158363342285156, 1.4571514129638672]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 4.0, 11.0, 8.0, 7.0, 9.0, 9.0, 10.0, 20.0, 7.0, 22.0, 24.0, 21.0, 24.0, 32.0, 23.0, 31.0, 50.0, 46.0, 59.0, 71.0, 76.0, 72.0, 61.0, 45.0, 28.0, 32.0, 37.0, 27.0, 16.0, 21.0, 12.0, 13.0, 15.0, 10.0, 9.0, 12.0, 8.0, 6.0, 2.0, 3.0, 2.0, 0.0, 7.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.706863284111023, -0.6832928657531738, -0.6597223877906799, -0.6361519694328308, -0.6125814914703369, -0.5890110731124878, -0.5654406547546387, -0.5418702363967896, -0.5182997584342957, -0.49472931027412415, -0.47115886211395264, -0.4475884437561035, -0.424017995595932, -0.4004475474357605, -0.3768771290779114, -0.35330668091773987, -0.32973623275756836, -0.30616578459739685, -0.28259533643722534, -0.2590249180793762, -0.2354544699192047, -0.2118840217590332, -0.1883135885000229, -0.16474315524101257, -0.14117270708084106, -0.11760226637125015, -0.09403182566165924, -0.07046138495206833, -0.04689094424247742, -0.023320503532886505, 0.00024993717670440674, 0.02382037043571472, 0.04739081859588623, 0.07096125930547714, 0.09453170001506805, 0.11810214072465897, 0.14167258143424988, 0.1652430295944214, 0.1888134628534317, 0.21238389611244202, 0.23595434427261353, 0.25952479243278503, 0.28309524059295654, 0.30666565895080566, 0.3302361071109772, 0.3538065552711487, 0.3773769736289978, 0.4009474217891693, 0.4245178699493408, 0.44808831810951233, 0.47165876626968384, 0.49522918462753296, 0.5187996625900269, 0.542370080947876, 0.5659404993057251, 0.5895109176635742, 0.6130813956260681, 0.6366518139839172, 0.6602222919464111, 0.6837927103042603, 0.7073631286621094, 0.7309336066246033, 0.7545040249824524, 0.7780745029449463, 0.8016449213027954]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 2.0, 2.0, 6.0, 6.0, 8.0, 16.0, 23.0, 34.0, 45.0, 63.0, 133.0, 186.0, 326.0, 539.0, 944.0, 1787.0, 3716.0, 8684.0, 24871.0, 104970.0, 705011.0, 2558197.0, 650420.0, 95682.0, 22690.0, 8050.0, 3556.0, 1819.0, 946.0, 591.0, 378.0, 195.0, 121.0, 85.0, 64.0, 29.0, 34.0, 20.0, 19.0, 12.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06561279296875, -0.06322479248046875, -0.0608367919921875, -0.05844879150390625, -0.056060791015625, -0.05367279052734375, -0.0512847900390625, -0.04889678955078125, -0.0465087890625, -0.04412078857421875, -0.0417327880859375, -0.03934478759765625, -0.036956787109375, -0.03456878662109375, -0.0321807861328125, -0.02979278564453125, -0.02740478515625, -0.02501678466796875, -0.0226287841796875, -0.02024078369140625, -0.017852783203125, -0.01546478271484375, -0.0130767822265625, -0.01068878173828125, -0.00830078125, -0.00591278076171875, -0.0035247802734375, -0.00113677978515625, 0.001251220703125, 0.00363922119140625, 0.0060272216796875, 0.00841522216796875, 0.01080322265625, 0.01319122314453125, 0.0155792236328125, 0.01796722412109375, 0.020355224609375, 0.02274322509765625, 0.0251312255859375, 0.02751922607421875, 0.0299072265625, 0.03229522705078125, 0.0346832275390625, 0.03707122802734375, 0.039459228515625, 0.04184722900390625, 0.0442352294921875, 0.04662322998046875, 0.04901123046875, 0.05139923095703125, 0.0537872314453125, 0.05617523193359375, 0.058563232421875, 0.06095123291015625, 0.0633392333984375, 0.06572723388671875, 0.068115234375, 0.07050323486328125, 0.0728912353515625, 0.07527923583984375, 0.077667236328125, 0.08005523681640625, 0.0824432373046875, 0.08483123779296875, 0.08721923828125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 3.0, 2.0, 7.0, 6.0, 11.0, 11.0, 8.0, 13.0, 17.0, 21.0, 18.0, 22.0, 25.0, 30.0, 40.0, 48.0, 52.0, 44.0, 46.0, 34.0, 37.0, 49.0, 37.0, 31.0, 45.0, 45.0, 33.0, 39.0, 35.0, 25.0, 23.0, 13.0, 25.0, 20.0, 11.0, 10.0, 15.0, 10.0, 8.0, 8.0, 3.0, 3.0, 4.0, 7.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04779052734375, -0.04626941680908203, -0.04474830627441406, -0.043227195739746094, -0.041706085205078125, -0.040184974670410156, -0.03866386413574219, -0.03714275360107422, -0.03562164306640625, -0.03410053253173828, -0.03257942199707031, -0.031058311462402344, -0.029537200927734375, -0.028016090393066406, -0.026494979858398438, -0.02497386932373047, -0.0234527587890625, -0.02193164825439453, -0.020410537719726562, -0.018889427185058594, -0.017368316650390625, -0.015847206115722656, -0.014326095581054688, -0.012804985046386719, -0.01128387451171875, -0.009762763977050781, -0.008241653442382812, -0.006720542907714844, -0.005199432373046875, -0.0036783218383789062, -0.0021572113037109375, -0.0006361007690429688, 0.000885009765625, 0.0024061203002929688, 0.0039272308349609375, 0.005448341369628906, 0.006969451904296875, 0.008490562438964844, 0.010011672973632812, 0.011532783508300781, 0.01305389404296875, 0.014575004577636719, 0.016096115112304688, 0.017617225646972656, 0.019138336181640625, 0.020659446716308594, 0.022180557250976562, 0.02370166778564453, 0.0252227783203125, 0.02674388885498047, 0.028264999389648438, 0.029786109924316406, 0.031307220458984375, 0.032828330993652344, 0.03434944152832031, 0.03587055206298828, 0.03739166259765625, 0.03891277313232422, 0.04043388366699219, 0.041954994201660156, 0.043476104736328125, 0.044997215270996094, 0.04651832580566406, 0.04803943634033203, 0.049560546875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 9.0, 8.0, 16.0, 22.0, 42.0, 76.0, 134.0, 296.0, 890.0, 5281.0, 107682.0, 3944523.0, 127618.0, 6108.0, 970.0, 279.0, 138.0, 78.0, 47.0, 32.0, 12.0, 11.0, 4.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32763671875, -0.3197460174560547, -0.3118553161621094, -0.30396461486816406, -0.29607391357421875, -0.28818321228027344, -0.2802925109863281, -0.2724018096923828, -0.2645111083984375, -0.2566204071044922, -0.24872970581054688, -0.24083900451660156, -0.23294830322265625, -0.22505760192871094, -0.21716690063476562, -0.2092761993408203, -0.201385498046875, -0.1934947967529297, -0.18560409545898438, -0.17771339416503906, -0.16982269287109375, -0.16193199157714844, -0.15404129028320312, -0.1461505889892578, -0.1382598876953125, -0.1303691864013672, -0.12247848510742188, -0.11458778381347656, -0.10669708251953125, -0.09880638122558594, -0.09091567993164062, -0.08302497863769531, -0.07513427734375, -0.06724357604980469, -0.059352874755859375, -0.05146217346191406, -0.04357147216796875, -0.03568077087402344, -0.027790069580078125, -0.019899368286132812, -0.0120086669921875, -0.0041179656982421875, 0.003772735595703125, 0.011663436889648438, 0.01955413818359375, 0.027444839477539062, 0.035335540771484375, 0.04322624206542969, 0.051116943359375, 0.05900764465332031, 0.06689834594726562, 0.07478904724121094, 0.08267974853515625, 0.09057044982910156, 0.09846115112304688, 0.10635185241699219, 0.1142425537109375, 0.12213325500488281, 0.13002395629882812, 0.13791465759277344, 0.14580535888671875, 0.15369606018066406, 0.16158676147460938, 0.1694774627685547, 0.1773681640625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 6.0, 11.0, 10.0, 8.0, 18.0, 23.0, 29.0, 28.0, 45.0, 49.0, 92.0, 123.0, 151.0, 228.0, 352.0, 453.0, 594.0, 536.0, 402.0, 271.0, 189.0, 120.0, 74.0, 56.0, 49.0, 30.0, 24.0, 18.0, 22.0, 13.0, 9.0, 6.0, 7.0, 2.0, 5.0, 3.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08837890625, -0.0852975845336914, -0.08221626281738281, -0.07913494110107422, -0.07605361938476562, -0.07297229766845703, -0.06989097595214844, -0.06680965423583984, -0.06372833251953125, -0.060647010803222656, -0.05756568908691406, -0.05448436737060547, -0.051403045654296875, -0.04832172393798828, -0.04524040222167969, -0.042159080505371094, -0.0390777587890625, -0.035996437072753906, -0.03291511535644531, -0.02983379364013672, -0.026752471923828125, -0.02367115020751953, -0.020589828491210938, -0.017508506774902344, -0.01442718505859375, -0.011345863342285156, -0.008264541625976562, -0.005183219909667969, -0.002101898193359375, 0.0009794235229492188, 0.0040607452392578125, 0.007142066955566406, 0.010223388671875, 0.013304710388183594, 0.016386032104492188, 0.01946735382080078, 0.022548675537109375, 0.02562999725341797, 0.028711318969726562, 0.031792640686035156, 0.03487396240234375, 0.037955284118652344, 0.04103660583496094, 0.04411792755126953, 0.047199249267578125, 0.05028057098388672, 0.05336189270019531, 0.056443214416503906, 0.0595245361328125, 0.0626058578491211, 0.06568717956542969, 0.06876850128173828, 0.07184982299804688, 0.07493114471435547, 0.07801246643066406, 0.08109378814697266, 0.08417510986328125, 0.08725643157958984, 0.09033775329589844, 0.09341907501220703, 0.09650039672851562, 0.09958171844482422, 0.10266304016113281, 0.1057443618774414, 0.10882568359375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 4.0, 5.0, 12.0, 17.0, 34.0, 61.0, 100.0, 141.0, 157.0, 165.0, 119.0, 74.0, 45.0, 23.0, 13.0, 12.0, 7.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3923041820526123, -1.3603432178497314, -1.3283822536468506, -1.2964212894439697, -1.2644603252410889, -1.2324994802474976, -1.2005385160446167, -1.1685775518417358, -1.136616587638855, -1.1046556234359741, -1.0726946592330933, -1.0407336950302124, -1.008772850036621, -0.9768118262290955, -0.9448509216308594, -0.9128899574279785, -0.8809289932250977, -0.8489680290222168, -0.8170070648193359, -0.7850461602210999, -0.753085196018219, -0.7211242318153381, -0.689163327217102, -0.6572023630142212, -0.6252413988113403, -0.5932804346084595, -0.5613194704055786, -0.5293585658073425, -0.49739760160446167, -0.4654366374015808, -0.43347570300102234, -0.40151476860046387, -0.3695538640022278, -0.3375928997993469, -0.30563196539878845, -0.27367103099823, -0.24171006679534912, -0.20974911749362946, -0.1777881681919098, -0.14582721889019012, -0.11386626958847046, -0.0819053202867508, -0.04994437098503113, -0.017983421683311462, 0.013977527618408203, 0.04593847692012787, 0.07789942622184753, 0.1098603755235672, 0.14182132482528687, 0.17378227412700653, 0.2057432234287262, 0.23770417273044586, 0.2696651220321655, 0.3016260862350464, 0.33358702063560486, 0.36554795503616333, 0.3975089192390442, 0.42946988344192505, 0.4614308178424835, 0.493391752243042, 0.5253527164459229, 0.5573136806488037, 0.5892746448516846, 0.6212355494499207, 0.6531965136528015]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 7.0, 6.0, 1.0, 5.0, 3.0, 7.0, 14.0, 7.0, 15.0, 10.0, 18.0, 14.0, 22.0, 21.0, 29.0, 26.0, 23.0, 29.0, 37.0, 41.0, 39.0, 55.0, 42.0, 37.0, 44.0, 39.0, 44.0, 29.0, 34.0, 36.0, 29.0, 29.0, 26.0, 34.0, 22.0, 16.0, 21.0, 13.0, 16.0, 11.0, 14.0, 7.0, 9.0, 4.0, 5.0, 9.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.4441753029823303, -0.4309903681278229, -0.41780543327331543, -0.404620498418808, -0.39143556356430054, -0.3782505989074707, -0.36506566405296326, -0.3518807291984558, -0.33869579434394836, -0.3255108594894409, -0.31232592463493347, -0.299140989780426, -0.2859560251235962, -0.27277112007141113, -0.2595861554145813, -0.24640122056007385, -0.2332162857055664, -0.22003135085105896, -0.2068464159965515, -0.19366146624088287, -0.18047653138637543, -0.16729159653186798, -0.15410664677619934, -0.1409217119216919, -0.12773677706718445, -0.114551842212677, -0.10136689990758896, -0.08818195760250092, -0.07499702274799347, -0.06181208789348602, -0.04862714558839798, -0.035442203283309937, -0.02225726842880249, -0.009072329849004745, 0.004112608730792999, 0.017297547310590744, 0.03048248589038849, 0.043667420744895935, 0.05685236304998398, 0.07003730535507202, 0.08322224020957947, 0.09640717506408691, 0.10959211736917496, 0.122777059674263, 0.13596199452877045, 0.1491469293832779, 0.16233187913894653, 0.17551681399345398, 0.18870174884796143, 0.20188668370246887, 0.21507161855697632, 0.22825656831264496, 0.2414415031671524, 0.25462645292282104, 0.2678113877773285, 0.28099632263183594, 0.2941812574863434, 0.30736619234085083, 0.3205511271953583, 0.3337360620498657, 0.34692102670669556, 0.3601059317588806, 0.37329089641571045, 0.3864758312702179, 0.39966076612472534]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 9.0, 4.0, 8.0, 8.0, 18.0, 30.0, 36.0, 55.0, 81.0, 150.0, 208.0, 379.0, 642.0, 1222.0, 2377.0, 5110.0, 12100.0, 29815.0, 86796.0, 294932.0, 407995.0, 133728.0, 43036.0, 16380.0, 6750.0, 3156.0, 1563.0, 805.0, 456.0, 255.0, 163.0, 99.0, 69.0, 43.0, 30.0, 22.0, 16.0, 11.0, 4.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.09588623046875, -0.09323596954345703, -0.09058570861816406, -0.0879354476928711, -0.08528518676757812, -0.08263492584228516, -0.07998466491699219, -0.07733440399169922, -0.07468414306640625, -0.07203388214111328, -0.06938362121582031, -0.06673336029052734, -0.06408309936523438, -0.061432838439941406, -0.05878257751464844, -0.05613231658935547, -0.0534820556640625, -0.05083179473876953, -0.04818153381347656, -0.045531272888183594, -0.042881011962890625, -0.040230751037597656, -0.03758049011230469, -0.03493022918701172, -0.03227996826171875, -0.02962970733642578, -0.026979446411132812, -0.024329185485839844, -0.021678924560546875, -0.019028663635253906, -0.016378402709960938, -0.013728141784667969, -0.011077880859375, -0.008427619934082031, -0.0057773590087890625, -0.0031270980834960938, -0.000476837158203125, 0.0021734237670898438, 0.0048236846923828125, 0.007473945617675781, 0.01012420654296875, 0.012774467468261719, 0.015424728393554688, 0.018074989318847656, 0.020725250244140625, 0.023375511169433594, 0.026025772094726562, 0.02867603302001953, 0.0313262939453125, 0.03397655487060547, 0.03662681579589844, 0.039277076721191406, 0.041927337646484375, 0.044577598571777344, 0.04722785949707031, 0.04987812042236328, 0.05252838134765625, 0.05517864227294922, 0.05782890319824219, 0.060479164123535156, 0.06312942504882812, 0.0657796859741211, 0.06842994689941406, 0.07108020782470703, 0.07373046875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 4.0, 6.0, 9.0, 6.0, 7.0, 7.0, 8.0, 13.0, 12.0, 20.0, 12.0, 17.0, 24.0, 28.0, 22.0, 30.0, 34.0, 37.0, 39.0, 44.0, 41.0, 35.0, 51.0, 39.0, 37.0, 35.0, 42.0, 53.0, 39.0, 23.0, 32.0, 32.0, 19.0, 26.0, 15.0, 24.0, 10.0, 7.0, 11.0, 9.0, 11.0, 5.0, 7.0, 8.0, 3.0, 3.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04931640625, -0.04781532287597656, -0.046314239501953125, -0.04481315612792969, -0.04331207275390625, -0.04181098937988281, -0.040309906005859375, -0.03880882263183594, -0.0373077392578125, -0.03580665588378906, -0.034305572509765625, -0.03280448913574219, -0.03130340576171875, -0.029802322387695312, -0.028301239013671875, -0.026800155639648438, -0.025299072265625, -0.023797988891601562, -0.022296905517578125, -0.020795822143554688, -0.01929473876953125, -0.017793655395507812, -0.016292572021484375, -0.014791488647460938, -0.0132904052734375, -0.011789321899414062, -0.010288238525390625, -0.008787155151367188, -0.00728607177734375, -0.0057849884033203125, -0.004283905029296875, -0.0027828216552734375, -0.00128173828125, 0.0002193450927734375, 0.001720428466796875, 0.0032215118408203125, 0.00472259521484375, 0.0062236785888671875, 0.007724761962890625, 0.009225845336914062, 0.0107269287109375, 0.012228012084960938, 0.013729095458984375, 0.015230178833007812, 0.01673126220703125, 0.018232345581054688, 0.019733428955078125, 0.021234512329101562, 0.022735595703125, 0.024236679077148438, 0.025737762451171875, 0.027238845825195312, 0.02873992919921875, 0.030241012573242188, 0.031742095947265625, 0.03324317932128906, 0.0347442626953125, 0.03624534606933594, 0.037746429443359375, 0.03924751281738281, 0.04074859619140625, 0.04224967956542969, 0.043750762939453125, 0.04525184631347656, 0.0467529296875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 7.0, 6.0, 1.0, 12.0, 20.0, 21.0, 23.0, 32.0, 55.0, 95.0, 131.0, 214.0, 344.0, 651.0, 1283.0, 3048.0, 8928.0, 34519.0, 219314.0, 690311.0, 67077.0, 14234.0, 4379.0, 1830.0, 828.0, 448.0, 241.0, 185.0, 119.0, 57.0, 44.0, 33.0, 26.0, 13.0, 6.0, 8.0, 4.0, 3.0, 4.0, 6.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1431884765625, -0.13923263549804688, -0.13527679443359375, -0.13132095336914062, -0.1273651123046875, -0.12340927124023438, -0.11945343017578125, -0.11549758911132812, -0.111541748046875, -0.10758590698242188, -0.10363006591796875, -0.09967422485351562, -0.0957183837890625, -0.09176254272460938, -0.08780670166015625, -0.08385086059570312, -0.07989501953125, -0.07593917846679688, -0.07198333740234375, -0.06802749633789062, -0.0640716552734375, -0.060115814208984375, -0.05615997314453125, -0.052204132080078125, -0.048248291015625, -0.044292449951171875, -0.04033660888671875, -0.036380767822265625, -0.0324249267578125, -0.028469085693359375, -0.02451324462890625, -0.020557403564453125, -0.0166015625, -0.012645721435546875, -0.00868988037109375, -0.004734039306640625, -0.0007781982421875, 0.003177642822265625, 0.00713348388671875, 0.011089324951171875, 0.015045166015625, 0.019001007080078125, 0.02295684814453125, 0.026912689208984375, 0.0308685302734375, 0.034824371337890625, 0.03878021240234375, 0.042736053466796875, 0.04669189453125, 0.050647735595703125, 0.05460357666015625, 0.058559417724609375, 0.0625152587890625, 0.06647109985351562, 0.07042694091796875, 0.07438278198242188, 0.078338623046875, 0.08229446411132812, 0.08625030517578125, 0.09020614624023438, 0.0941619873046875, 0.09811782836914062, 0.10207366943359375, 0.10602951049804688, 0.1099853515625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 10.0, 5.0, 8.0, 10.0, 13.0, 14.0, 23.0, 26.0, 27.0, 38.0, 49.0, 55.0, 60.0, 62.0, 59.0, 73.0, 65.0, 52.0, 50.0, 62.0, 31.0, 45.0, 36.0, 29.0, 29.0, 25.0, 6.0, 9.0, 9.0, 3.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.314208984375, -0.3063220977783203, -0.2984352111816406, -0.29054832458496094, -0.28266143798828125, -0.27477455139160156, -0.2668876647949219, -0.2590007781982422, -0.2511138916015625, -0.2432270050048828, -0.23534011840820312, -0.22745323181152344, -0.21956634521484375, -0.21167945861816406, -0.20379257202148438, -0.1959056854248047, -0.188018798828125, -0.1801319122314453, -0.17224502563476562, -0.16435813903808594, -0.15647125244140625, -0.14858436584472656, -0.14069747924804688, -0.1328105926513672, -0.1249237060546875, -0.11703681945800781, -0.10914993286132812, -0.10126304626464844, -0.09337615966796875, -0.08548927307128906, -0.07760238647460938, -0.06971549987792969, -0.06182861328125, -0.05394172668457031, -0.046054840087890625, -0.03816795349121094, -0.03028106689453125, -0.022394180297851562, -0.014507293701171875, -0.0066204071044921875, 0.0012664794921875, 0.009153366088867188, 0.017040252685546875, 0.024927139282226562, 0.03281402587890625, 0.04070091247558594, 0.048587799072265625, 0.05647468566894531, 0.064361572265625, 0.07224845886230469, 0.08013534545898438, 0.08802223205566406, 0.09590911865234375, 0.10379600524902344, 0.11168289184570312, 0.11956977844238281, 0.1274566650390625, 0.1353435516357422, 0.14323043823242188, 0.15111732482910156, 0.15900421142578125, 0.16689109802246094, 0.17477798461914062, 0.1826648712158203, 0.1905517578125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 6.0, 9.0, 14.0, 13.0, 28.0, 38.0, 54.0, 86.0, 128.0, 245.0, 538.0, 1256.0, 3009.0, 8354.0, 27160.0, 117923.0, 702873.0, 140075.0, 31250.0, 9512.0, 3307.0, 1379.0, 582.0, 290.0, 156.0, 90.0, 60.0, 37.0, 26.0, 15.0, 7.0, 9.0, 8.0, 4.0, 1.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034759521484375, -0.033621788024902344, -0.03248405456542969, -0.03134632110595703, -0.030208587646484375, -0.02907085418701172, -0.027933120727539062, -0.026795387268066406, -0.02565765380859375, -0.024519920349121094, -0.023382186889648438, -0.02224445343017578, -0.021106719970703125, -0.01996898651123047, -0.018831253051757812, -0.017693519592285156, -0.0165557861328125, -0.015418052673339844, -0.014280319213867188, -0.013142585754394531, -0.012004852294921875, -0.010867118835449219, -0.009729385375976562, -0.008591651916503906, -0.00745391845703125, -0.006316184997558594, -0.0051784515380859375, -0.004040718078613281, -0.002902984619140625, -0.0017652511596679688, -0.0006275177001953125, 0.0005102157592773438, 0.00164794921875, 0.0027856826782226562, 0.0039234161376953125, 0.005061149597167969, 0.006198883056640625, 0.007336616516113281, 0.008474349975585938, 0.009612083435058594, 0.01074981689453125, 0.011887550354003906, 0.013025283813476562, 0.014163017272949219, 0.015300750732421875, 0.01643848419189453, 0.017576217651367188, 0.018713951110839844, 0.0198516845703125, 0.020989418029785156, 0.022127151489257812, 0.02326488494873047, 0.024402618408203125, 0.02554035186767578, 0.026678085327148438, 0.027815818786621094, 0.02895355224609375, 0.030091285705566406, 0.031229019165039062, 0.03236675262451172, 0.033504486083984375, 0.03464221954345703, 0.03577995300292969, 0.036917686462402344, 0.038055419921875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 4.0, 6.0, 4.0, 7.0, 7.0, 11.0, 14.0, 16.0, 22.0, 24.0, 48.0, 53.0, 85.0, 88.0, 92.0, 103.0, 87.0, 80.0, 54.0, 51.0, 27.0, 21.0, 26.0, 11.0, 13.0, 5.0, 9.0, 12.0, 6.0, 7.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.531839370727539e-05, -1.471489667892456e-05, -1.411139965057373e-05, -1.35079026222229e-05, -1.290440559387207e-05, -1.230090856552124e-05, -1.169741153717041e-05, -1.109391450881958e-05, -1.049041748046875e-05, -9.88692045211792e-06, -9.28342342376709e-06, -8.67992639541626e-06, -8.07642936706543e-06, -7.4729323387146e-06, -6.8694353103637695e-06, -6.2659382820129395e-06, -5.662441253662109e-06, -5.058944225311279e-06, -4.455447196960449e-06, -3.851950168609619e-06, -3.248453140258789e-06, -2.644956111907959e-06, -2.041459083557129e-06, -1.4379620552062988e-06, -8.344650268554688e-07, -2.3096799850463867e-07, 3.725290298461914e-07, 9.760260581970215e-07, 1.5795230865478516e-06, 2.1830201148986816e-06, 2.7865171432495117e-06, 3.390014171600342e-06, 3.993511199951172e-06, 4.597008228302002e-06, 5.200505256652832e-06, 5.804002285003662e-06, 6.407499313354492e-06, 7.010996341705322e-06, 7.614493370056152e-06, 8.217990398406982e-06, 8.821487426757812e-06, 9.424984455108643e-06, 1.0028481483459473e-05, 1.0631978511810303e-05, 1.1235475540161133e-05, 1.1838972568511963e-05, 1.2442469596862793e-05, 1.3045966625213623e-05, 1.3649463653564453e-05, 1.4252960681915283e-05, 1.4856457710266113e-05, 1.5459954738616943e-05, 1.6063451766967773e-05, 1.6666948795318604e-05, 1.7270445823669434e-05, 1.7873942852020264e-05, 1.8477439880371094e-05, 1.9080936908721924e-05, 1.9684433937072754e-05, 2.0287930965423584e-05, 2.0891427993774414e-05, 2.1494925022125244e-05, 2.2098422050476074e-05, 2.2701919078826904e-05, 2.3305416107177734e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 4.0, 10.0, 12.0, 16.0, 23.0, 33.0, 36.0, 52.0, 100.0, 149.0, 267.0, 445.0, 803.0, 1574.0, 3428.0, 8035.0, 21706.0, 72809.0, 416582.0, 412823.0, 72797.0, 21791.0, 8140.0, 3464.0, 1519.0, 763.0, 424.0, 262.0, 152.0, 117.0, 92.0, 36.0, 19.0, 19.0, 7.0, 10.0, 7.0, 5.0, 10.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0295562744140625, -0.02860283851623535, -0.027649402618408203, -0.026695966720581055, -0.025742530822753906, -0.024789094924926758, -0.02383565902709961, -0.02288222312927246, -0.021928787231445312, -0.020975351333618164, -0.020021915435791016, -0.019068479537963867, -0.01811504364013672, -0.01716160774230957, -0.016208171844482422, -0.015254735946655273, -0.014301300048828125, -0.013347864151000977, -0.012394428253173828, -0.01144099235534668, -0.010487556457519531, -0.009534120559692383, -0.008580684661865234, -0.007627248764038086, -0.0066738128662109375, -0.005720376968383789, -0.004766941070556641, -0.003813505172729492, -0.0028600692749023438, -0.0019066333770751953, -0.0009531974792480469, 2.384185791015625e-07, 0.00095367431640625, 0.0019071102142333984, 0.002860546112060547, 0.0038139820098876953, 0.004767417907714844, 0.005720853805541992, 0.006674289703369141, 0.007627725601196289, 0.008581161499023438, 0.009534597396850586, 0.010488033294677734, 0.011441469192504883, 0.012394905090332031, 0.01334834098815918, 0.014301776885986328, 0.015255212783813477, 0.016208648681640625, 0.017162084579467773, 0.018115520477294922, 0.01906895637512207, 0.02002239227294922, 0.020975828170776367, 0.021929264068603516, 0.022882699966430664, 0.023836135864257812, 0.02478957176208496, 0.02574300765991211, 0.026696443557739258, 0.027649879455566406, 0.028603315353393555, 0.029556751251220703, 0.03051018714904785, 0.031463623046875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 3.0, 6.0, 6.0, 2.0, 17.0, 8.0, 23.0, 20.0, 27.0, 30.0, 43.0, 54.0, 61.0, 92.0, 84.0, 94.0, 74.0, 76.0, 64.0, 48.0, 45.0, 27.0, 21.0, 10.0, 15.0, 5.0, 14.0, 13.0, 5.0, 3.0, 2.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034423828125, -0.033111572265625, -0.03179931640625, -0.030487060546875, -0.0291748046875, -0.027862548828125, -0.02655029296875, -0.025238037109375, -0.02392578125, -0.022613525390625, -0.02130126953125, -0.019989013671875, -0.0186767578125, -0.017364501953125, -0.01605224609375, -0.014739990234375, -0.013427734375, -0.012115478515625, -0.01080322265625, -0.009490966796875, -0.0081787109375, -0.006866455078125, -0.00555419921875, -0.004241943359375, -0.0029296875, -0.001617431640625, -0.00030517578125, 0.001007080078125, 0.0023193359375, 0.003631591796875, 0.00494384765625, 0.006256103515625, 0.007568359375, 0.008880615234375, 0.01019287109375, 0.011505126953125, 0.0128173828125, 0.014129638671875, 0.01544189453125, 0.016754150390625, 0.01806640625, 0.019378662109375, 0.02069091796875, 0.022003173828125, 0.0233154296875, 0.024627685546875, 0.02593994140625, 0.027252197265625, 0.028564453125, 0.029876708984375, 0.03118896484375, 0.032501220703125, 0.0338134765625, 0.035125732421875, 0.03643798828125, 0.037750244140625, 0.0390625, 0.040374755859375, 0.04168701171875, 0.042999267578125, 0.0443115234375, 0.045623779296875, 0.04693603515625, 0.048248291015625, 0.049560546875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 7.0, 18.0, 29.0, 70.0, 205.0, 399.0, 148.0, 75.0, 29.0, 11.0, 4.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.105802059173584, -2.052506923675537, -1.9992116689682007, -1.9459164142608643, -1.8926211595535278, -1.8393259048461914, -1.7860307693481445, -1.732735514640808, -1.6794402599334717, -1.6261450052261353, -1.5728498697280884, -1.519554615020752, -1.4662593603134155, -1.412964105606079, -1.3596689701080322, -1.3063737154006958, -1.253078579902649, -1.1997833251953125, -1.1464881896972656, -1.0931929349899292, -1.0398976802825928, -0.9866024851799011, -0.9333072900772095, -0.880012035369873, -0.8267168402671814, -0.7734216451644897, -0.7201263904571533, -0.6668311953544617, -0.61353600025177, -0.5602407455444336, -0.5069455504417419, -0.4536503255367279, -0.4003552198410034, -0.3470599949359894, -0.29376477003097534, -0.2404695749282837, -0.18717435002326965, -0.13387912511825562, -0.08058393001556396, -0.027288705110549927, 0.02600651979446411, 0.07930173724889755, 0.132596954703331, 0.18589216470718384, 0.23918738961219788, 0.2924826145172119, 0.34577780961990356, 0.3990730345249176, 0.45236825942993164, 0.5056634545326233, 0.5589587092399597, 0.6122539043426514, 0.6655491590499878, 0.7188443541526794, 0.7721395492553711, 0.8254348039627075, 0.8787299990653992, 0.9320251941680908, 0.9853204488754272, 1.0386157035827637, 1.0919108390808105, 1.145206093788147, 1.1985013484954834, 1.2517964839935303, 1.3050917387008667]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 4.0, 8.0, 4.0, 9.0, 8.0, 11.0, 14.0, 19.0, 20.0, 28.0, 22.0, 29.0, 28.0, 49.0, 59.0, 80.0, 94.0, 89.0, 78.0, 50.0, 37.0, 40.0, 32.0, 23.0, 27.0, 16.0, 23.0, 13.0, 21.0, 10.0, 10.0, 7.0, 11.0, 7.0, 4.0, 2.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.8954162001609802, -0.8705326318740845, -0.845649003982544, -0.8207653760910034, -0.7958818078041077, -0.7709982395172119, -0.7461146116256714, -0.7212309837341309, -0.6963474154472351, -0.6714638471603394, -0.6465802192687988, -0.6216965913772583, -0.5968130230903625, -0.5719294548034668, -0.5470458269119263, -0.5221621990203857, -0.49727863073349, -0.47239503264427185, -0.4475114345550537, -0.42262783646583557, -0.39774423837661743, -0.3728606402873993, -0.34797704219818115, -0.323093444108963, -0.2982098460197449, -0.27332624793052673, -0.2484426498413086, -0.22355905175209045, -0.19867545366287231, -0.17379185557365417, -0.14890825748443604, -0.1240246593952179, -0.09914106130599976, -0.07425746321678162, -0.04937386512756348, -0.024490267038345337, 0.00039333105087280273, 0.025276929140090942, 0.05016052722930908, 0.07504412531852722, 0.09992772340774536, 0.1248113214969635, 0.14969491958618164, 0.17457851767539978, 0.19946211576461792, 0.22434571385383606, 0.2492293119430542, 0.27411291003227234, 0.2989965081214905, 0.3238801062107086, 0.34876370429992676, 0.3736473023891449, 0.39853090047836304, 0.4234144985675812, 0.4482980966567993, 0.47318169474601746, 0.4980652928352356, 0.5229488611221313, 0.5478324890136719, 0.5727161169052124, 0.5975996851921082, 0.6224832534790039, 0.6473668813705444, 0.672250509262085, 0.6971340775489807]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 10.0, 13.0, 10.0, 21.0, 38.0, 55.0, 83.0, 155.0, 250.0, 396.0, 760.0, 1435.0, 2897.0, 6542.0, 17188.0, 54241.0, 223531.0, 1077675.0, 2029715.0, 600563.0, 122850.0, 33320.0, 12165.0, 4974.0, 2381.0, 1245.0, 649.0, 371.0, 255.0, 163.0, 105.0, 75.0, 45.0, 38.0, 19.0, 17.0, 6.0, 11.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.099365234375, -0.0961923599243164, -0.09301948547363281, -0.08984661102294922, -0.08667373657226562, -0.08350086212158203, -0.08032798767089844, -0.07715511322021484, -0.07398223876953125, -0.07080936431884766, -0.06763648986816406, -0.06446361541748047, -0.061290740966796875, -0.05811786651611328, -0.05494499206542969, -0.051772117614746094, -0.0485992431640625, -0.045426368713378906, -0.04225349426269531, -0.03908061981201172, -0.035907745361328125, -0.03273487091064453, -0.029561996459960938, -0.026389122009277344, -0.02321624755859375, -0.020043373107910156, -0.016870498657226562, -0.013697624206542969, -0.010524749755859375, -0.007351875305175781, -0.0041790008544921875, -0.0010061264038085938, 0.002166748046875, 0.005339622497558594, 0.008512496948242188, 0.011685371398925781, 0.014858245849609375, 0.01803112030029297, 0.021203994750976562, 0.024376869201660156, 0.02754974365234375, 0.030722618103027344, 0.03389549255371094, 0.03706836700439453, 0.040241241455078125, 0.04341411590576172, 0.04658699035644531, 0.049759864807128906, 0.0529327392578125, 0.056105613708496094, 0.05927848815917969, 0.06245136260986328, 0.06562423706054688, 0.06879711151123047, 0.07196998596191406, 0.07514286041259766, 0.07831573486328125, 0.08148860931396484, 0.08466148376464844, 0.08783435821533203, 0.09100723266601562, 0.09418010711669922, 0.09735298156738281, 0.1005258560180664, 0.10369873046875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 3.0, 3.0, 4.0, 3.0, 7.0, 8.0, 7.0, 12.0, 10.0, 13.0, 17.0, 24.0, 20.0, 22.0, 32.0, 33.0, 28.0, 37.0, 44.0, 38.0, 42.0, 41.0, 39.0, 46.0, 50.0, 50.0, 37.0, 36.0, 36.0, 31.0, 29.0, 34.0, 24.0, 26.0, 18.0, 24.0, 9.0, 11.0, 12.0, 7.0, 14.0, 5.0, 2.0, 1.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04644775390625, -0.044939517974853516, -0.04343128204345703, -0.04192304611206055, -0.04041481018066406, -0.03890657424926758, -0.037398338317871094, -0.03589010238647461, -0.034381866455078125, -0.03287363052368164, -0.031365394592285156, -0.029857158660888672, -0.028348922729492188, -0.026840686798095703, -0.02533245086669922, -0.023824214935302734, -0.02231597900390625, -0.020807743072509766, -0.01929950714111328, -0.017791271209716797, -0.016283035278320312, -0.014774799346923828, -0.013266563415527344, -0.01175832748413086, -0.010250091552734375, -0.00874185562133789, -0.007233619689941406, -0.005725383758544922, -0.0042171478271484375, -0.002708911895751953, -0.0012006759643554688, 0.0003075599670410156, 0.0018157958984375, 0.0033240318298339844, 0.004832267761230469, 0.006340503692626953, 0.007848739624023438, 0.009356975555419922, 0.010865211486816406, 0.01237344741821289, 0.013881683349609375, 0.01538991928100586, 0.016898155212402344, 0.018406391143798828, 0.019914627075195312, 0.021422863006591797, 0.02293109893798828, 0.024439334869384766, 0.02594757080078125, 0.027455806732177734, 0.02896404266357422, 0.030472278594970703, 0.03198051452636719, 0.03348875045776367, 0.034996986389160156, 0.03650522232055664, 0.038013458251953125, 0.03952169418334961, 0.041029930114746094, 0.04253816604614258, 0.04404640197753906, 0.04555463790893555, 0.04706287384033203, 0.048571109771728516, 0.050079345703125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 6.0, 14.0, 15.0, 20.0, 40.0, 44.0, 88.0, 108.0, 175.0, 262.0, 508.0, 1131.0, 3232.0, 16470.0, 776648.0, 3353766.0, 34159.0, 4675.0, 1392.0, 663.0, 318.0, 176.0, 110.0, 83.0, 52.0, 24.0, 28.0, 16.0, 12.0, 15.0, 8.0, 3.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.434326171875, -0.4223060607910156, -0.41028594970703125, -0.3982658386230469, -0.3862457275390625, -0.3742256164550781, -0.36220550537109375, -0.3501853942871094, -0.338165283203125, -0.3261451721191406, -0.31412506103515625, -0.3021049499511719, -0.2900848388671875, -0.2780647277832031, -0.26604461669921875, -0.2540245056152344, -0.24200439453125, -0.22998428344726562, -0.21796417236328125, -0.20594406127929688, -0.1939239501953125, -0.18190383911132812, -0.16988372802734375, -0.15786361694335938, -0.145843505859375, -0.13382339477539062, -0.12180328369140625, -0.10978317260742188, -0.0977630615234375, -0.08574295043945312, -0.07372283935546875, -0.061702728271484375, -0.0496826171875, -0.037662506103515625, -0.02564239501953125, -0.013622283935546875, -0.0016021728515625, 0.010417938232421875, 0.02243804931640625, 0.034458160400390625, 0.046478271484375, 0.058498382568359375, 0.07051849365234375, 0.08253860473632812, 0.0945587158203125, 0.10657882690429688, 0.11859893798828125, 0.13061904907226562, 0.14263916015625, 0.15465927124023438, 0.16667938232421875, 0.17869949340820312, 0.1907196044921875, 0.20273971557617188, 0.21475982666015625, 0.22677993774414062, 0.238800048828125, 0.2508201599121094, 0.26284027099609375, 0.2748603820800781, 0.2868804931640625, 0.2989006042480469, 0.31092071533203125, 0.3229408264160156, 0.3349609375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 5.0, 5.0, 2.0, 9.0, 11.0, 19.0, 17.0, 25.0, 49.0, 43.0, 48.0, 78.0, 129.0, 163.0, 189.0, 273.0, 369.0, 402.0, 450.0, 400.0, 321.0, 269.0, 184.0, 149.0, 108.0, 73.0, 81.0, 45.0, 36.0, 32.0, 22.0, 17.0, 16.0, 6.0, 10.0, 2.0, 2.0, 7.0, 2.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1507568359375, -0.1457843780517578, -0.14081192016601562, -0.13583946228027344, -0.13086700439453125, -0.12589454650878906, -0.12092208862304688, -0.11594963073730469, -0.1109771728515625, -0.10600471496582031, -0.10103225708007812, -0.09605979919433594, -0.09108734130859375, -0.08611488342285156, -0.08114242553710938, -0.07616996765136719, -0.071197509765625, -0.06622505187988281, -0.061252593994140625, -0.05628013610839844, -0.05130767822265625, -0.04633522033691406, -0.041362762451171875, -0.03639030456542969, -0.0314178466796875, -0.026445388793945312, -0.021472930908203125, -0.016500473022460938, -0.01152801513671875, -0.0065555572509765625, -0.001583099365234375, 0.0033893585205078125, 0.00836181640625, 0.013334274291992188, 0.018306732177734375, 0.023279190063476562, 0.02825164794921875, 0.03322410583496094, 0.038196563720703125, 0.04316902160644531, 0.0481414794921875, 0.05311393737792969, 0.058086395263671875, 0.06305885314941406, 0.06803131103515625, 0.07300376892089844, 0.07797622680664062, 0.08294868469238281, 0.087921142578125, 0.09289360046386719, 0.09786605834960938, 0.10283851623535156, 0.10781097412109375, 0.11278343200683594, 0.11775588989257812, 0.12272834777832031, 0.1277008056640625, 0.1326732635498047, 0.13764572143554688, 0.14261817932128906, 0.14759063720703125, 0.15256309509277344, 0.15753555297851562, 0.1625080108642578, 0.16748046875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 11.0, 7.0, 7.0, 17.0, 37.0, 88.0, 161.0, 213.0, 223.0, 115.0, 69.0, 23.0, 10.0, 6.0, 7.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.9089221954345703, -3.8128654956817627, -3.716808557510376, -3.6207518577575684, -3.5246949195861816, -3.428638219833374, -3.3325815200805664, -3.2365245819091797, -3.140467882156372, -3.0444111824035645, -2.9483542442321777, -2.85229754447937, -2.7562408447265625, -2.660183906555176, -2.564127206802368, -2.4680705070495605, -2.372013568878174, -2.275956869125366, -2.1798999309539795, -2.083843231201172, -1.9877864122390747, -1.8917295932769775, -1.79567289352417, -1.6996160745620728, -1.6035592555999756, -1.5075024366378784, -1.4114456176757812, -1.3153889179229736, -1.2193320989608765, -1.1232752799987793, -1.0272185802459717, -0.9311617612838745, -0.8351047039031982, -0.7390478849411011, -0.6429911255836487, -0.5469343662261963, -0.4508775472640991, -0.35482075810432434, -0.25876396894454956, -0.16270720958709717, -0.066650390625, 0.02940639853477478, 0.12546318769454956, 0.22151997685432434, 0.3175767660140991, 0.4136335551738739, 0.5096903443336487, 0.6057471036911011, 0.7018039226531982, 0.7978607416152954, 0.8939175009727478, 0.9899742603302002, 1.0860310792922974, 1.1820878982543945, 1.2781445980072021, 1.3742014169692993, 1.4702582359313965, 1.5663150548934937, 1.6623718738555908, 1.7584285736083984, 1.8544853925704956, 1.9505422115325928, 2.0465989112854004, 2.142655849456787, 2.2387125492095947]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 4.0, 7.0, 3.0, 11.0, 8.0, 8.0, 13.0, 15.0, 13.0, 11.0, 24.0, 24.0, 36.0, 25.0, 25.0, 33.0, 34.0, 26.0, 45.0, 46.0, 46.0, 52.0, 43.0, 46.0, 43.0, 45.0, 26.0, 43.0, 26.0, 26.0, 21.0, 30.0, 17.0, 17.0, 13.0, 16.0, 10.0, 10.0, 10.0, 10.0, 10.0, 6.0, 10.0, 3.0, 3.0, 1.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.8835044503211975, -0.854857861995697, -0.8262112140655518, -0.7975646257400513, -0.7689180374145508, -0.7402713894844055, -0.711624801158905, -0.6829781532287598, -0.6543315649032593, -0.6256849765777588, -0.5970383286476135, -0.568391740322113, -0.5397450923919678, -0.5110985040664673, -0.4824519157409668, -0.4538052976131439, -0.42515867948532104, -0.39651206135749817, -0.3678654432296753, -0.3392188549041748, -0.31057223677635193, -0.28192561864852905, -0.25327903032302856, -0.2246324121952057, -0.1959857940673828, -0.16733917593955994, -0.13869257271289825, -0.11004596203565598, -0.0813993513584137, -0.05275273323059082, -0.024106130003929138, 0.004540473222732544, 0.033187150955200195, 0.061833761632442474, 0.09048037230968475, 0.11912698298692703, 0.1477735936641693, 0.1764202117919922, 0.20506681501865387, 0.23371341824531555, 0.2623600363731384, 0.2910066545009613, 0.3196532726287842, 0.34829986095428467, 0.37694647908210754, 0.4055930972099304, 0.4342396855354309, 0.4628863036632538, 0.49153292179107666, 0.5201795101165771, 0.5488261580467224, 0.5774727463722229, 0.6061193943023682, 0.6347659826278687, 0.6634125709533691, 0.6920591592788696, 0.7207058072090149, 0.7493523955345154, 0.7779990434646606, 0.8066456317901611, 0.8352922201156616, 0.8639388680458069, 0.8925854563713074, 0.9212321043014526, 0.9498786926269531]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 4.0, 7.0, 6.0, 10.0, 16.0, 25.0, 43.0, 62.0, 75.0, 127.0, 195.0, 298.0, 429.0, 691.0, 1036.0, 1720.0, 3027.0, 5328.0, 10033.0, 20578.0, 45123.0, 112434.0, 395497.0, 288356.0, 88842.0, 37225.0, 17237.0, 8750.0, 4583.0, 2639.0, 1540.0, 903.0, 605.0, 346.0, 239.0, 164.0, 121.0, 76.0, 43.0, 38.0, 28.0, 26.0, 11.0, 9.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0731201171875, -0.07096195220947266, -0.06880378723144531, -0.06664562225341797, -0.06448745727539062, -0.06232929229736328, -0.06017112731933594, -0.058012962341308594, -0.05585479736328125, -0.053696632385253906, -0.05153846740722656, -0.04938030242919922, -0.047222137451171875, -0.04506397247314453, -0.04290580749511719, -0.040747642517089844, -0.0385894775390625, -0.036431312561035156, -0.03427314758300781, -0.03211498260498047, -0.029956817626953125, -0.02779865264892578, -0.025640487670898438, -0.023482322692871094, -0.02132415771484375, -0.019165992736816406, -0.017007827758789062, -0.014849662780761719, -0.012691497802734375, -0.010533332824707031, -0.008375167846679688, -0.006217002868652344, -0.004058837890625, -0.0019006729125976562, 0.0002574920654296875, 0.0024156570434570312, 0.004573822021484375, 0.006731986999511719, 0.008890151977539062, 0.011048316955566406, 0.01320648193359375, 0.015364646911621094, 0.017522811889648438, 0.01968097686767578, 0.021839141845703125, 0.02399730682373047, 0.026155471801757812, 0.028313636779785156, 0.0304718017578125, 0.032629966735839844, 0.03478813171386719, 0.03694629669189453, 0.039104461669921875, 0.04126262664794922, 0.04342079162597656, 0.045578956604003906, 0.04773712158203125, 0.049895286560058594, 0.05205345153808594, 0.05421161651611328, 0.056369781494140625, 0.05852794647216797, 0.06068611145019531, 0.06284427642822266, 0.06500244140625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 4.0, 4.0, 6.0, 9.0, 5.0, 11.0, 14.0, 8.0, 10.0, 21.0, 21.0, 20.0, 36.0, 41.0, 40.0, 39.0, 44.0, 42.0, 56.0, 45.0, 39.0, 47.0, 41.0, 45.0, 47.0, 31.0, 36.0, 34.0, 35.0, 24.0, 21.0, 26.0, 12.0, 16.0, 16.0, 11.0, 8.0, 8.0, 4.0, 5.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0726318359375, -0.07026100158691406, -0.06789016723632812, -0.06551933288574219, -0.06314849853515625, -0.06077766418457031, -0.058406829833984375, -0.05603599548339844, -0.0536651611328125, -0.05129432678222656, -0.048923492431640625, -0.04655265808105469, -0.04418182373046875, -0.04181098937988281, -0.039440155029296875, -0.03706932067871094, -0.034698486328125, -0.03232765197753906, -0.029956817626953125, -0.027585983276367188, -0.02521514892578125, -0.022844314575195312, -0.020473480224609375, -0.018102645874023438, -0.0157318115234375, -0.013360977172851562, -0.010990142822265625, -0.008619308471679688, -0.00624847412109375, -0.0038776397705078125, -0.001506805419921875, 0.0008640289306640625, 0.00323486328125, 0.0056056976318359375, 0.007976531982421875, 0.010347366333007812, 0.01271820068359375, 0.015089035034179688, 0.017459869384765625, 0.019830703735351562, 0.0222015380859375, 0.024572372436523438, 0.026943206787109375, 0.029314041137695312, 0.03168487548828125, 0.03405570983886719, 0.036426544189453125, 0.03879737854003906, 0.041168212890625, 0.04353904724121094, 0.045909881591796875, 0.04828071594238281, 0.05065155029296875, 0.05302238464355469, 0.055393218994140625, 0.05776405334472656, 0.0601348876953125, 0.06250572204589844, 0.06487655639648438, 0.06724739074707031, 0.06961822509765625, 0.07198905944824219, 0.07435989379882812, 0.07673072814941406, 0.0791015625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 6.0, 8.0, 13.0, 20.0, 38.0, 59.0, 133.0, 227.0, 400.0, 1135.0, 4488.0, 33634.0, 924628.0, 74031.0, 7163.0, 1577.0, 537.0, 221.0, 108.0, 53.0, 29.0, 15.0, 12.0, 9.0, 5.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.255859375, -0.24847412109375, -0.2410888671875, -0.23370361328125, -0.226318359375, -0.21893310546875, -0.2115478515625, -0.20416259765625, -0.19677734375, -0.18939208984375, -0.1820068359375, -0.17462158203125, -0.167236328125, -0.15985107421875, -0.1524658203125, -0.14508056640625, -0.1376953125, -0.13031005859375, -0.1229248046875, -0.11553955078125, -0.108154296875, -0.10076904296875, -0.0933837890625, -0.08599853515625, -0.07861328125, -0.07122802734375, -0.0638427734375, -0.05645751953125, -0.049072265625, -0.04168701171875, -0.0343017578125, -0.02691650390625, -0.01953125, -0.01214599609375, -0.0047607421875, 0.00262451171875, 0.010009765625, 0.01739501953125, 0.0247802734375, 0.03216552734375, 0.03955078125, 0.04693603515625, 0.0543212890625, 0.06170654296875, 0.069091796875, 0.07647705078125, 0.0838623046875, 0.09124755859375, 0.0986328125, 0.10601806640625, 0.1134033203125, 0.12078857421875, 0.128173828125, 0.13555908203125, 0.1429443359375, 0.15032958984375, 0.15771484375, 0.16510009765625, 0.1724853515625, 0.17987060546875, 0.187255859375, 0.19464111328125, 0.2020263671875, 0.20941162109375, 0.216796875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 2.0, 2.0, 3.0, 12.0, 7.0, 4.0, 8.0, 9.0, 10.0, 10.0, 14.0, 16.0, 22.0, 25.0, 29.0, 34.0, 41.0, 47.0, 72.0, 66.0, 78.0, 84.0, 69.0, 81.0, 50.0, 38.0, 23.0, 25.0, 24.0, 20.0, 16.0, 13.0, 12.0, 11.0, 5.0, 6.0, 3.0, 3.0, 3.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34814453125, -0.3368034362792969, -0.32546234130859375, -0.3141212463378906, -0.3027801513671875, -0.2914390563964844, -0.28009796142578125, -0.2687568664550781, -0.257415771484375, -0.24607467651367188, -0.23473358154296875, -0.22339248657226562, -0.2120513916015625, -0.20071029663085938, -0.18936920166015625, -0.17802810668945312, -0.16668701171875, -0.15534591674804688, -0.14400482177734375, -0.13266372680664062, -0.1213226318359375, -0.10998153686523438, -0.09864044189453125, -0.08729934692382812, -0.075958251953125, -0.06461715698242188, -0.05327606201171875, -0.041934967041015625, -0.0305938720703125, -0.019252777099609375, -0.00791168212890625, 0.003429412841796875, 0.0147705078125, 0.026111602783203125, 0.03745269775390625, 0.048793792724609375, 0.0601348876953125, 0.07147598266601562, 0.08281707763671875, 0.09415817260742188, 0.105499267578125, 0.11684036254882812, 0.12818145751953125, 0.13952255249023438, 0.1508636474609375, 0.16220474243164062, 0.17354583740234375, 0.18488693237304688, 0.19622802734375, 0.20756912231445312, 0.21891021728515625, 0.23025131225585938, 0.2415924072265625, 0.2529335021972656, 0.26427459716796875, 0.2756156921386719, 0.286956787109375, 0.2982978820800781, 0.30963897705078125, 0.3209800720214844, 0.3323211669921875, 0.3436622619628906, 0.35500335693359375, 0.3663444519042969, 0.377685546875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 6.0, 5.0, 2.0, 9.0, 11.0, 6.0, 20.0, 14.0, 18.0, 37.0, 42.0, 50.0, 76.0, 117.0, 166.0, 279.0, 464.0, 1062.0, 2347.0, 6899.0, 30214.0, 762292.0, 211221.0, 23247.0, 5779.0, 2014.0, 858.0, 469.0, 249.0, 163.0, 116.0, 74.0, 62.0, 36.0, 28.0, 25.0, 20.0, 15.0, 9.0, 7.0, 10.0, 3.0, 4.0, 1.0, 7.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04010009765625, -0.03871345520019531, -0.037326812744140625, -0.03594017028808594, -0.03455352783203125, -0.03316688537597656, -0.031780242919921875, -0.030393600463867188, -0.0290069580078125, -0.027620315551757812, -0.026233673095703125, -0.024847030639648438, -0.02346038818359375, -0.022073745727539062, -0.020687103271484375, -0.019300460815429688, -0.017913818359375, -0.016527175903320312, -0.015140533447265625, -0.013753890991210938, -0.01236724853515625, -0.010980606079101562, -0.009593963623046875, -0.008207321166992188, -0.0068206787109375, -0.0054340362548828125, -0.004047393798828125, -0.0026607513427734375, -0.00127410888671875, 0.0001125335693359375, 0.001499176025390625, 0.0028858184814453125, 0.0042724609375, 0.0056591033935546875, 0.007045745849609375, 0.008432388305664062, 0.00981903076171875, 0.011205673217773438, 0.012592315673828125, 0.013978958129882812, 0.0153656005859375, 0.016752243041992188, 0.018138885498046875, 0.019525527954101562, 0.02091217041015625, 0.022298812866210938, 0.023685455322265625, 0.025072097778320312, 0.026458740234375, 0.027845382690429688, 0.029232025146484375, 0.030618667602539062, 0.03200531005859375, 0.03339195251464844, 0.034778594970703125, 0.03616523742675781, 0.0375518798828125, 0.03893852233886719, 0.040325164794921875, 0.04171180725097656, 0.04309844970703125, 0.04448509216308594, 0.045871734619140625, 0.04725837707519531, 0.04864501953125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 6.0, 9.0, 9.0, 9.0, 11.0, 11.0, 19.0, 24.0, 20.0, 30.0, 33.0, 49.0, 54.0, 63.0, 87.0, 70.0, 72.0, 72.0, 63.0, 57.0, 32.0, 44.0, 32.0, 29.0, 16.0, 18.0, 8.0, 13.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 6.0, 2.0, 5.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4185905456542969e-05, -1.3763085007667542e-05, -1.3340264558792114e-05, -1.2917444109916687e-05, -1.249462366104126e-05, -1.2071803212165833e-05, -1.1648982763290405e-05, -1.1226162314414978e-05, -1.080334186553955e-05, -1.0380521416664124e-05, -9.957700967788696e-06, -9.534880518913269e-06, -9.112060070037842e-06, -8.689239621162415e-06, -8.266419172286987e-06, -7.84359872341156e-06, -7.420778274536133e-06, -6.9979578256607056e-06, -6.575137376785278e-06, -6.152316927909851e-06, -5.729496479034424e-06, -5.306676030158997e-06, -4.883855581283569e-06, -4.461035132408142e-06, -4.038214683532715e-06, -3.6153942346572876e-06, -3.1925737857818604e-06, -2.769753336906433e-06, -2.346932888031006e-06, -1.9241124391555786e-06, -1.5012919902801514e-06, -1.0784715414047241e-06, -6.556510925292969e-07, -2.3283064365386963e-07, 1.8998980522155762e-07, 6.128102540969849e-07, 1.0356307029724121e-06, 1.4584511518478394e-06, 1.8812716007232666e-06, 2.304092049598694e-06, 2.726912498474121e-06, 3.1497329473495483e-06, 3.5725533962249756e-06, 3.995373845100403e-06, 4.41819429397583e-06, 4.841014742851257e-06, 5.2638351917266846e-06, 5.686655640602112e-06, 6.109476089477539e-06, 6.532296538352966e-06, 6.9551169872283936e-06, 7.377937436103821e-06, 7.800757884979248e-06, 8.223578333854675e-06, 8.646398782730103e-06, 9.06921923160553e-06, 9.492039680480957e-06, 9.914860129356384e-06, 1.0337680578231812e-05, 1.0760501027107239e-05, 1.1183321475982666e-05, 1.1606141924858093e-05, 1.202896237373352e-05, 1.2451782822608948e-05, 1.2874603271484375e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 5.0, 7.0, 9.0, 13.0, 18.0, 29.0, 60.0, 132.0, 290.0, 878.0, 3826.0, 24295.0, 889860.0, 115957.0, 10274.0, 1957.0, 527.0, 202.0, 88.0, 41.0, 28.0, 22.0, 15.0, 5.0, 9.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0736083984375, -0.07149219512939453, -0.06937599182128906, -0.0672597885131836, -0.06514358520507812, -0.06302738189697266, -0.06091117858886719, -0.05879497528076172, -0.05667877197265625, -0.05456256866455078, -0.05244636535644531, -0.050330162048339844, -0.048213958740234375, -0.046097755432128906, -0.04398155212402344, -0.04186534881591797, -0.0397491455078125, -0.03763294219970703, -0.03551673889160156, -0.033400535583496094, -0.031284332275390625, -0.029168128967285156, -0.027051925659179688, -0.02493572235107422, -0.02281951904296875, -0.02070331573486328, -0.018587112426757812, -0.016470909118652344, -0.014354705810546875, -0.012238502502441406, -0.010122299194335938, -0.008006095886230469, -0.005889892578125, -0.0037736892700195312, -0.0016574859619140625, 0.00045871734619140625, 0.002574920654296875, 0.004691123962402344, 0.0068073272705078125, 0.008923530578613281, 0.01103973388671875, 0.013155937194824219, 0.015272140502929688, 0.017388343811035156, 0.019504547119140625, 0.021620750427246094, 0.023736953735351562, 0.02585315704345703, 0.0279693603515625, 0.03008556365966797, 0.03220176696777344, 0.034317970275878906, 0.036434173583984375, 0.038550376892089844, 0.04066658020019531, 0.04278278350830078, 0.04489898681640625, 0.04701519012451172, 0.04913139343261719, 0.051247596740722656, 0.053363800048828125, 0.055480003356933594, 0.05759620666503906, 0.05971240997314453, 0.06182861328125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 4.0, 4.0, 4.0, 9.0, 10.0, 9.0, 7.0, 9.0, 11.0, 9.0, 15.0, 15.0, 28.0, 54.0, 58.0, 84.0, 107.0, 110.0, 119.0, 80.0, 59.0, 47.0, 18.0, 19.0, 23.0, 24.0, 10.0, 8.0, 11.0, 9.0, 10.0, 9.0, 6.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.04913330078125, -0.047570228576660156, -0.04600715637207031, -0.04444408416748047, -0.042881011962890625, -0.04131793975830078, -0.03975486755371094, -0.038191795349121094, -0.03662872314453125, -0.035065650939941406, -0.03350257873535156, -0.03193950653076172, -0.030376434326171875, -0.02881336212158203, -0.027250289916992188, -0.025687217712402344, -0.0241241455078125, -0.022561073303222656, -0.020998001098632812, -0.01943492889404297, -0.017871856689453125, -0.01630878448486328, -0.014745712280273438, -0.013182640075683594, -0.01161956787109375, -0.010056495666503906, -0.008493423461914062, -0.006930351257324219, -0.005367279052734375, -0.0038042068481445312, -0.0022411346435546875, -0.0006780624389648438, 0.000885009765625, 0.0024480819702148438, 0.0040111541748046875, 0.005574226379394531, 0.007137298583984375, 0.008700370788574219, 0.010263442993164062, 0.011826515197753906, 0.01338958740234375, 0.014952659606933594, 0.016515731811523438, 0.01807880401611328, 0.019641876220703125, 0.02120494842529297, 0.022768020629882812, 0.024331092834472656, 0.0258941650390625, 0.027457237243652344, 0.029020309448242188, 0.03058338165283203, 0.032146453857421875, 0.03370952606201172, 0.03527259826660156, 0.036835670471191406, 0.03839874267578125, 0.039961814880371094, 0.04152488708496094, 0.04308795928955078, 0.044651031494140625, 0.04621410369873047, 0.04777717590332031, 0.049340248107910156, 0.0509033203125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 4.0, 8.0, 9.0, 18.0, 43.0, 80.0, 268.0, 363.0, 107.0, 38.0, 33.0, 14.0, 10.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0455381870269775, -1.9872790575027466, -1.9290199279785156, -1.8707609176635742, -1.8125017881393433, -1.7542426586151123, -1.695983648300171, -1.63772451877594, -1.579465389251709, -1.521206259727478, -1.462947130203247, -1.4046881198883057, -1.3464289903640747, -1.2881698608398438, -1.2299108505249023, -1.1716517210006714, -1.1133925914764404, -1.0551334619522095, -0.9968743920326233, -0.9386153221130371, -0.8803561925888062, -0.8220970630645752, -0.763837993144989, -0.7055789232254028, -0.6473197937011719, -0.5890606641769409, -0.5308015942573547, -0.47254249453544617, -0.4142833948135376, -0.35602429509162903, -0.29776519536972046, -0.2395060956478119, -0.18124699592590332, -0.12298789620399475, -0.06472879648208618, -0.006469696760177612, 0.05178940296173096, 0.11004850268363953, 0.1683076024055481, 0.22656670212745667, 0.28482580184936523, 0.3430849015712738, 0.4013440012931824, 0.45960310101509094, 0.5178622007369995, 0.5761213302612305, 0.6343804001808167, 0.6926394701004028, 0.7508985996246338, 0.8091577291488647, 0.8674167990684509, 0.9256758689880371, 0.9839349985122681, 1.042194128036499, 1.1004531383514404, 1.1587122678756714, 1.2169713973999023, 1.2752305269241333, 1.3334896564483643, 1.3917486667633057, 1.4500077962875366, 1.5082669258117676, 1.566525936126709, 1.62478506565094, 1.683044195175171]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 1.0, 3.0, 6.0, 8.0, 4.0, 10.0, 10.0, 11.0, 17.0, 25.0, 21.0, 20.0, 41.0, 45.0, 63.0, 73.0, 87.0, 88.0, 71.0, 78.0, 51.0, 46.0, 32.0, 24.0, 25.0, 26.0, 17.0, 10.0, 7.0, 16.0, 11.0, 9.0, 5.0, 11.0, 6.0, 3.0, 3.0, 1.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.0160033702850342, -0.9856521487236023, -0.9553009271621704, -0.9249496459960938, -0.8945984244346619, -0.86424720287323, -0.8338959813117981, -0.8035447597503662, -0.7731934785842896, -0.7428422570228577, -0.7124910354614258, -0.6821397542953491, -0.6517885327339172, -0.6214373111724854, -0.5910860896110535, -0.5607348680496216, -0.5303835868835449, -0.500032365322113, -0.46968111395835876, -0.4393298923969269, -0.4089786410331726, -0.3786274194717407, -0.34827619791030884, -0.31792494654655457, -0.28757375478744507, -0.2572225332260132, -0.2268712818622589, -0.19652006030082703, -0.16616880893707275, -0.13581758737564087, -0.10546635091304779, -0.07511511445045471, -0.04476386308670044, -0.01441262848675251, 0.01593860611319542, 0.0462898388504982, 0.07664107531309128, 0.10699230432510376, 0.13734354078769684, 0.16769477725028992, 0.198046013712883, 0.22839725017547607, 0.25874847173690796, 0.28909972310066223, 0.3194509446620941, 0.3498021960258484, 0.3801534175872803, 0.41050463914871216, 0.44085589051246643, 0.4712071120738983, 0.5015583634376526, 0.5319095849990845, 0.5622608065605164, 0.5926120281219482, 0.6229633092880249, 0.6533145308494568, 0.6836657524108887, 0.7140169739723206, 0.7443681955337524, 0.7747194766998291, 0.805070698261261, 0.8354219198226929, 0.8657731413841248, 0.8961243629455566, 0.9264756441116333]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 8.0, 7.0, 18.0, 15.0, 11.0, 25.0, 21.0, 12.0, 24.0, 26.0, 29.0, 33.0, 15.0, 43.0, 65.0, 124.0, 151.0, 70.0, 39.0, 30.0, 36.0, 23.0, 20.0, 24.0, 23.0, 23.0, 15.0, 10.0, 8.0, 8.0, 11.0, 8.0, 8.0, 5.0, 5.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0712890625, -0.06891536712646484, -0.06654167175292969, -0.06416797637939453, -0.061794281005859375, -0.05942058563232422, -0.05704689025878906, -0.054673194885253906, -0.05229949951171875, -0.049925804138183594, -0.04755210876464844, -0.04517841339111328, -0.042804718017578125, -0.04043102264404297, -0.03805732727050781, -0.035683631896972656, -0.0333099365234375, -0.030936241149902344, -0.028562545776367188, -0.02618885040283203, -0.023815155029296875, -0.02144145965576172, -0.019067764282226562, -0.016694068908691406, -0.01432037353515625, -0.011946678161621094, -0.009572982788085938, -0.007199287414550781, -0.004825592041015625, -0.0024518966674804688, -7.82012939453125e-05, 0.0022954940795898438, 0.004669189453125, 0.007042884826660156, 0.009416580200195312, 0.011790275573730469, 0.014163970947265625, 0.01653766632080078, 0.018911361694335938, 0.021285057067871094, 0.02365875244140625, 0.026032447814941406, 0.028406143188476562, 0.03077983856201172, 0.033153533935546875, 0.03552722930908203, 0.03790092468261719, 0.040274620056152344, 0.0426483154296875, 0.045022010803222656, 0.04739570617675781, 0.04976940155029297, 0.052143096923828125, 0.05451679229736328, 0.05689048767089844, 0.059264183044433594, 0.06163787841796875, 0.0640115737915039, 0.06638526916503906, 0.06875896453857422, 0.07113265991210938, 0.07350635528564453, 0.07588005065917969, 0.07825374603271484, 0.08062744140625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 2.0, 6.0, 3.0, 4.0, 1.0, 7.0, 1.0, 5.0, 5.0, 9.0, 20.0, 13.0, 25.0, 33.0, 45.0, 53.0, 103.0, 132.0, 247.0, 489.0, 1103.0, 2891.0, 9028.0, 154523.0, 8198933.0, 13901.0, 3907.0, 1548.0, 671.0, 303.0, 194.0, 97.0, 63.0, 56.0, 39.0, 22.0, 25.0, 23.0, 9.0, 7.0, 7.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 3.0, 5.0, 2.0, 2.0], "bins": [-0.4251953363418579, -0.4119632840156555, -0.3987312316894531, -0.3854992091655731, -0.3722671568393707, -0.35903510451316833, -0.34580308198928833, -0.33257102966308594, -0.31933897733688354, -0.30610692501068115, -0.29287487268447876, -0.27964285016059875, -0.26641079783439636, -0.25317874550819397, -0.23994670808315277, -0.22671467065811157, -0.21348261833190918, -0.2002505660057068, -0.1870185285806656, -0.1737864911556244, -0.160554438829422, -0.1473223865032196, -0.1340903490781784, -0.12085830420255661, -0.10762625932693481, -0.09439421445131302, -0.08116216957569122, -0.06793012470006943, -0.05469807982444763, -0.041466034948825836, -0.02823399007320404, -0.015001945197582245, -0.0017699003219604492, 0.011462144553661346, 0.024694189429283142, 0.03792623430490494, 0.05115827918052673, 0.06439032405614853, 0.07762236893177032, 0.09085441380739212, 0.10408645868301392, 0.11731850355863571, 0.1305505484342575, 0.1437825858592987, 0.1570146381855011, 0.1702466905117035, 0.1834787279367447, 0.1967107653617859, 0.20994281768798828, 0.22317487001419067, 0.23640690743923187, 0.24963894486427307, 0.26287099719047546, 0.27610304951667786, 0.28933507204055786, 0.30256712436676025, 0.31579917669296265, 0.32903122901916504, 0.34226328134536743, 0.35549530386924744, 0.36872735619544983, 0.3819594085216522, 0.3951914310455322, 0.4084234833717346, 0.421655535697937]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 6.0, 4.0, 7.0, 1.0, 3.0, 7.0, 4.0, 5.0, 6.0, 4.0, 1.0, 7.0, 2.0, 4.0, 4.0, 3.0, 4.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8421979546546936, -0.8183676600456238, -0.794537365436554, -0.7707071304321289, -0.7468768358230591, -0.7230465412139893, -0.6992162466049194, -0.6753859519958496, -0.6515556573867798, -0.62772536277771, -0.6038950681686401, -0.5800647735595703, -0.5562345385551453, -0.5324042439460754, -0.5085739493370056, -0.4847436547279358, -0.46091341972351074, -0.4370831251144409, -0.4132528603076935, -0.38942256569862366, -0.3655923008918762, -0.3417620062828064, -0.3179317116737366, -0.29410141706466675, -0.2702711522579193, -0.24644087255001068, -0.22261059284210205, -0.19878029823303223, -0.1749500185251236, -0.15111973881721497, -0.12728944420814514, -0.10345916450023651, -0.0796288251876831, -0.05579854175448418, -0.03196825832128525, -0.00813797116279602, 0.01569230854511261, 0.03952258825302124, 0.06335288286209106, 0.0871831625699997, 0.11101344227790833, 0.13484372198581696, 0.15867400169372559, 0.1825042963027954, 0.20633457601070404, 0.23016485571861267, 0.2539951503276825, 0.27782541513442993, 0.30165570974349976, 0.3254860043525696, 0.349316269159317, 0.37314656376838684, 0.3969768285751343, 0.4208071231842041, 0.4446374177932739, 0.46846771240234375, 0.4922979772090912, 0.5161282420158386, 0.5399585366249084, 0.5637888312339783, 0.5876191258430481, 0.6114493608474731, 0.635279655456543, 0.6591099500656128, 0.6829402446746826]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 11.0, 13.0, 17.0, 22.0, 40.0, 56.0, 71.0, 92.0, 96.0, 118.0, 97.0, 102.0, 85.0, 66.0, 38.0, 35.0, 16.0, 11.0, 8.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0726318359375, -0.06878089904785156, -0.06492996215820312, -0.06107902526855469, -0.05722808837890625, -0.05337715148925781, -0.049526214599609375, -0.04567527770996094, -0.0418243408203125, -0.03797340393066406, -0.034122467041015625, -0.030271530151367188, -0.02642059326171875, -0.022569656372070312, -0.018718719482421875, -0.014867782592773438, -0.011016845703125, -0.0071659088134765625, -0.003314971923828125, 0.0005359649658203125, 0.00438690185546875, 0.008237838745117188, 0.012088775634765625, 0.015939712524414062, 0.0197906494140625, 0.023641586303710938, 0.027492523193359375, 0.03134346008300781, 0.03519439697265625, 0.03904533386230469, 0.042896270751953125, 0.04674720764160156, 0.05059814453125, 0.05444908142089844, 0.058300018310546875, 0.06215095520019531, 0.06600189208984375, 0.06985282897949219, 0.07370376586914062, 0.07755470275878906, 0.0814056396484375, 0.08525657653808594, 0.08910751342773438, 0.09295845031738281, 0.09680938720703125, 0.10066032409667969, 0.10451126098632812, 0.10836219787597656, 0.112213134765625, 0.11606407165527344, 0.11991500854492188, 0.12376594543457031, 0.12761688232421875, 0.1314678192138672, 0.13531875610351562, 0.13916969299316406, 0.1430206298828125, 0.14687156677246094, 0.15072250366210938, 0.1545734405517578, 0.15842437744140625, 0.1622753143310547, 0.16612625122070312, 0.16997718811035156, 0.173828125]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 7.0, 2.0, 4.0, 16.0, 22.0, 32.0, 50.0, 72.0, 175.0, 334.0, 817.0, 2804.0, 12739.0, 75737.0, 306130.0, 103090.0, 16722.0, 3654.0, 1044.0, 381.0, 191.0, 93.0, 62.0, 35.0, 23.0, 5.0, 8.0, 4.0, 3.0, 1.0, 6.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.78271484375, -0.7553253173828125, -0.727935791015625, -0.7005462646484375, -0.67315673828125, -0.6457672119140625, -0.618377685546875, -0.5909881591796875, -0.5635986328125, -0.5362091064453125, -0.508819580078125, -0.4814300537109375, -0.45404052734375, -0.4266510009765625, -0.399261474609375, -0.3718719482421875, -0.344482421875, -0.3170928955078125, -0.289703369140625, -0.2623138427734375, -0.23492431640625, -0.2075347900390625, -0.180145263671875, -0.1527557373046875, -0.1253662109375, -0.0979766845703125, -0.070587158203125, -0.0431976318359375, -0.01580810546875, 0.0115814208984375, 0.038970947265625, 0.0663604736328125, 0.09375, 0.1211395263671875, 0.148529052734375, 0.1759185791015625, 0.20330810546875, 0.2306976318359375, 0.258087158203125, 0.2854766845703125, 0.3128662109375, 0.3402557373046875, 0.367645263671875, 0.3950347900390625, 0.42242431640625, 0.4498138427734375, 0.477203369140625, 0.5045928955078125, 0.531982421875, 0.5593719482421875, 0.586761474609375, 0.6141510009765625, 0.64154052734375, 0.6689300537109375, 0.696319580078125, 0.7237091064453125, 0.7510986328125, 0.7784881591796875, 0.805877685546875, 0.8332672119140625, 0.86065673828125, 0.8880462646484375, 0.915435791015625, 0.9428253173828125, 0.97021484375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 7.0, 4.0, 4.0, 7.0, 15.0, 8.0, 17.0, 16.0, 14.0, 32.0, 26.0, 39.0, 56.0, 61.0, 47.0, 52.0, 77.0, 61.0, 59.0, 76.0, 56.0, 47.0, 39.0, 35.0, 26.0, 27.0, 17.0, 18.0, 9.0, 13.0, 6.0, 9.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0771484375, -0.07456493377685547, -0.07198143005371094, -0.0693979263305664, -0.06681442260742188, -0.06423091888427734, -0.06164741516113281, -0.05906391143798828, -0.05648040771484375, -0.05389690399169922, -0.05131340026855469, -0.048729896545410156, -0.046146392822265625, -0.043562889099121094, -0.04097938537597656, -0.03839588165283203, -0.0358123779296875, -0.03322887420654297, -0.030645370483398438, -0.028061866760253906, -0.025478363037109375, -0.022894859313964844, -0.020311355590820312, -0.01772785186767578, -0.01514434814453125, -0.012560844421386719, -0.009977340698242188, -0.007393836975097656, -0.004810333251953125, -0.0022268295288085938, 0.0003566741943359375, 0.0029401779174804688, 0.005523681640625, 0.008107185363769531, 0.010690689086914062, 0.013274192810058594, 0.015857696533203125, 0.018441200256347656, 0.021024703979492188, 0.02360820770263672, 0.02619171142578125, 0.02877521514892578, 0.03135871887207031, 0.033942222595214844, 0.036525726318359375, 0.039109230041503906, 0.04169273376464844, 0.04427623748779297, 0.0468597412109375, 0.04944324493408203, 0.05202674865722656, 0.054610252380371094, 0.057193756103515625, 0.059777259826660156, 0.06236076354980469, 0.06494426727294922, 0.06752777099609375, 0.07011127471923828, 0.07269477844238281, 0.07527828216552734, 0.07786178588867188, 0.0804452896118164, 0.08302879333496094, 0.08561229705810547, 0.08819580078125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 5.0, 13.0, 18.0, 30.0, 88.0, 122.0, 93.0, 51.0, 22.0, 11.0, 11.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8101673722267151, -0.7868161201477051, -0.7634648680686951, -0.7401136159896851, -0.7167624235153198, -0.6934111714363098, -0.6700599193572998, -0.6467086672782898, -0.6233574151992798, -0.6000061631202698, -0.5766549110412598, -0.5533036589622498, -0.5299524068832397, -0.5066012144088745, -0.4832499623298645, -0.4598987102508545, -0.4365474581718445, -0.4131962060928345, -0.38984495401382446, -0.36649373173713684, -0.34314247965812683, -0.3197912275791168, -0.2964400053024292, -0.2730887532234192, -0.24973750114440918, -0.22638624906539917, -0.20303501188755035, -0.17968377470970154, -0.15633252263069153, -0.13298127055168152, -0.1096300333738327, -0.08627879619598389, -0.0629274845123291, -0.03957623988389969, -0.016224995255470276, 0.007126249372959137, 0.03047749400138855, 0.05382873862981796, 0.07717998325824738, 0.10053122043609619, 0.1238824725151062, 0.1472337245941162, 0.17058496177196503, 0.19393619894981384, 0.21728745102882385, 0.24063870310783386, 0.2639899253845215, 0.2873411774635315, 0.3106924295425415, 0.3340436816215515, 0.3573949337005615, 0.38074615597724915, 0.40409740805625916, 0.42744866013526917, 0.4507998824119568, 0.4741511344909668, 0.4975023865699768, 0.5208536386489868, 0.5442048907279968, 0.5675561428070068, 0.5909073352813721, 0.6142585873603821, 0.6376098394393921, 0.6609610915184021, 0.6843123435974121]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 0.0, 4.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 5.0, 5.0, 7.0, 6.0, 4.0, 8.0, 12.0, 18.0, 34.0, 55.0, 63.0, 63.0, 65.0, 52.0, 21.0, 14.0, 12.0, 6.0, 4.0, 1.0, 4.0, 3.0, 3.0, 1.0, 3.0, 0.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4378100037574768, -0.4249344766139984, -0.41205894947052, -0.39918339252471924, -0.38630786538124084, -0.37343233823776245, -0.36055681109428406, -0.34768128395080566, -0.3348057270050049, -0.3219301998615265, -0.3090546727180481, -0.2961791157722473, -0.2833035886287689, -0.2704280614852905, -0.25755253434181213, -0.24467700719833374, -0.23180148005485535, -0.21892595291137695, -0.20605041086673737, -0.19317488372325897, -0.18029934167861938, -0.167423814535141, -0.1545482873916626, -0.1416727602481842, -0.12879721820354462, -0.11592168360948563, -0.10304614901542664, -0.09017062187194824, -0.07729508727788925, -0.06441955268383026, -0.05154402554035187, -0.03866849094629288, -0.025792956352233887, -0.012917423620820045, -4.1890889406204224e-05, 0.012833639979362488, 0.02570917457342148, 0.03858470916748047, 0.05146023631095886, 0.06433577090501785, 0.07721130549907684, 0.09008684009313583, 0.10296237468719482, 0.11583790183067322, 0.1287134289741516, 0.1415889710187912, 0.1544644981622696, 0.16734004020690918, 0.18021556735038757, 0.19309109449386597, 0.20596663653850555, 0.21884216368198395, 0.23171770572662354, 0.24459323287010193, 0.2574687600135803, 0.2703442871570587, 0.2832198143005371, 0.2960953414440155, 0.3089708685874939, 0.3218464255332947, 0.33472195267677307, 0.34759747982025146, 0.36047300696372986, 0.37334853410720825, 0.38622409105300903]}, "eval/loss": 0.309664785861969, "eval/wer": 0.09321697738992463, "eval/runtime": 583.4014, "eval/samples_per_second": 4.529, "eval/steps_per_second": 0.567, "train/train_runtime": 27349.9818, "train/train_samples_per_second": 5.217, "train/train_steps_per_second": 0.082, "train/total_flos": 0.0, "train/train_loss": 1.4829948718221064} \ No newline at end of file