diff --git "a/wandb/run-20220322_163235-2yj5gh94/files/wandb-summary.json" "b/wandb/run-20220322_163235-2yj5gh94/files/wandb-summary.json" --- "a/wandb/run-20220322_163235-2yj5gh94/files/wandb-summary.json" +++ "b/wandb/run-20220322_163235-2yj5gh94/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 0.1199, "train/learning_rate": 6.936416184971098e-07, "train/epoch": 5.0, "train/global_step": 2230, "_runtime": 27349, "_timestamp": 1647994104, "_step": 2234, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 12.0, 56.0, 279.0, 497.0, 140.0, 30.0, 5.0], "bins": [-7.940925598144531, -7.809273719787598, -7.677621841430664, -7.5459699630737305, -7.414318084716797, -7.282666206359863, -7.15101432800293, -7.019362449645996, -6.8877105712890625, -6.756058692932129, -6.624406814575195, -6.492754936218262, -6.361103057861328, -6.2294511795043945, -6.097799301147461, -5.966147422790527, -5.834495544433594, -5.70284366607666, -5.571191787719727, -5.439539909362793, -5.307888031005859, -5.176236152648926, -5.044584274291992, -4.912932395935059, -4.781280517578125, -4.649628639221191, -4.517976760864258, -4.386324882507324, -4.254673004150391, -4.123021125793457, -3.9913692474365234, -3.85971736907959, -3.728065013885498, -3.5964131355285645, -3.464761257171631, -3.3331093788146973, -3.2014575004577637, -3.06980562210083, -2.9381537437438965, -2.806501865386963, -2.6748499870300293, -2.5431981086730957, -2.411546230316162, -2.2798943519592285, -2.148242473602295, -2.0165905952453613, -1.8849387168884277, -1.7532868385314941, -1.62163507938385, -1.4899832010269165, -1.358331322669983, -1.2266794443130493, -1.0950275659561157, -0.9633756875991821, -0.8317238092422485, -0.7000719308853149, -0.5684200525283813, -0.43676817417144775, -0.30511629581451416, -0.17346441745758057, -0.04181253910064697, 0.08983933925628662, 0.22149121761322021, 0.3531430959701538, 0.4847949743270874]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 5.0, 3.0, 6.0, 2.0, 5.0, 9.0, 10.0, 15.0, 12.0, 17.0, 16.0, 22.0, 29.0, 39.0, 28.0, 36.0, 29.0, 35.0, 38.0, 45.0, 62.0, 45.0, 49.0, 48.0, 51.0, 40.0, 45.0, 43.0, 33.0, 29.0, 31.0, 30.0, 21.0, 16.0, 17.0, 14.0, 10.0, 9.0, 5.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4662081003189087, -0.44751691818237305, -0.4288257360458374, -0.41013455390930176, -0.3914433717727661, -0.37275218963623047, -0.35406097769737244, -0.3353697955608368, -0.31667861342430115, -0.2979874312877655, -0.27929624915122986, -0.2606050670146942, -0.24191386997699738, -0.22322268784046173, -0.2045314908027649, -0.18584030866622925, -0.1671491265296936, -0.14845794439315796, -0.12976676225662231, -0.11107556521892548, -0.09238438308238983, -0.07369320094585419, -0.055002011358737946, -0.036310821771621704, -0.01761963963508606, 0.0010715462267398834, 0.019762732088565826, 0.03845391795039177, 0.05714510381221771, 0.07583628594875336, 0.0945274755358696, 0.11321866512298584, 0.13190990686416626, 0.1506010890007019, 0.16929227113723755, 0.1879834681749344, 0.20667465031147003, 0.22536583244800568, 0.24405702948570251, 0.26274821162223816, 0.2814393937587738, 0.30013057589530945, 0.3188217580318451, 0.33751294016838074, 0.35620415210723877, 0.3748953342437744, 0.39358651638031006, 0.4122776985168457, 0.43096888065338135, 0.449660062789917, 0.46835124492645264, 0.4870424270629883, 0.5057336091995239, 0.5244247913360596, 0.5431159734725952, 0.5618071556091309, 0.5804983377456665, 0.5991895198822021, 0.6178807020187378, 0.6365718841552734, 0.6552630662918091, 0.6739542484283447, 0.6926454305648804, 0.711336612701416, 0.7300278544425964]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 0.0, 2.0, 4.0, 6.0, 8.0, 7.0, 15.0, 12.0, 27.0, 27.0, 51.0, 58.0, 97.0, 154.0, 252.0, 420.0, 743.0, 1437.0, 3148.0, 8260.0, 35352.0, 952590.0, 3075218.0, 95395.0, 12498.0, 4388.0, 1911.0, 942.0, 493.0, 251.0, 183.0, 104.0, 56.0, 47.0, 33.0, 32.0, 8.0, 18.0, 9.0, 7.0, 7.0, 3.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.841796875, -2.753509521484375, -2.66522216796875, -2.576934814453125, -2.4886474609375, -2.400360107421875, -2.31207275390625, -2.223785400390625, -2.135498046875, -2.047210693359375, -1.95892333984375, -1.870635986328125, -1.7823486328125, -1.694061279296875, -1.60577392578125, -1.517486572265625, -1.42919921875, -1.340911865234375, -1.25262451171875, -1.164337158203125, -1.0760498046875, -0.987762451171875, -0.89947509765625, -0.811187744140625, -0.722900390625, -0.634613037109375, -0.54632568359375, -0.458038330078125, -0.3697509765625, -0.281463623046875, -0.19317626953125, -0.104888916015625, -0.0166015625, 0.071685791015625, 0.15997314453125, 0.248260498046875, 0.3365478515625, 0.424835205078125, 0.51312255859375, 0.601409912109375, 0.689697265625, 0.777984619140625, 0.86627197265625, 0.954559326171875, 1.0428466796875, 1.131134033203125, 1.21942138671875, 1.307708740234375, 1.39599609375, 1.484283447265625, 1.57257080078125, 1.660858154296875, 1.7491455078125, 1.837432861328125, 1.92572021484375, 2.014007568359375, 2.102294921875, 2.190582275390625, 2.27886962890625, 2.367156982421875, 2.4554443359375, 2.543731689453125, 2.63201904296875, 2.720306396484375, 2.80859375]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 7.0, 8.0, 10.0, 4.0, 10.0, 13.0, 10.0, 15.0, 26.0, 12.0, 29.0, 26.0, 29.0, 19.0, 31.0, 37.0, 31.0, 38.0, 52.0, 48.0, 44.0, 45.0, 49.0, 38.0, 35.0, 44.0, 37.0, 35.0, 36.0, 31.0, 20.0, 26.0, 24.0, 19.0, 10.0, 16.0, 10.0, 9.0, 7.0, 6.0, 5.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.87841796875, -0.8500137329101562, -0.8216094970703125, -0.7932052612304688, -0.764801025390625, -0.7363967895507812, -0.7079925537109375, -0.6795883178710938, -0.65118408203125, -0.6227798461914062, -0.5943756103515625, -0.5659713745117188, -0.537567138671875, -0.5091629028320312, -0.4807586669921875, -0.45235443115234375, -0.4239501953125, -0.39554595947265625, -0.3671417236328125, -0.33873748779296875, -0.310333251953125, -0.28192901611328125, -0.2535247802734375, -0.22512054443359375, -0.19671630859375, -0.16831207275390625, -0.1399078369140625, -0.11150360107421875, -0.083099365234375, -0.05469512939453125, -0.0262908935546875, 0.00211334228515625, 0.030517578125, 0.05892181396484375, 0.0873260498046875, 0.11573028564453125, 0.144134521484375, 0.17253875732421875, 0.2009429931640625, 0.22934722900390625, 0.25775146484375, 0.28615570068359375, 0.3145599365234375, 0.34296417236328125, 0.371368408203125, 0.39977264404296875, 0.4281768798828125, 0.45658111572265625, 0.4849853515625, 0.5133895874023438, 0.5417938232421875, 0.5701980590820312, 0.598602294921875, 0.6270065307617188, 0.6554107666015625, 0.6838150024414062, 0.71221923828125, 0.7406234741210938, 0.7690277099609375, 0.7974319458007812, 0.825836181640625, 0.8542404174804688, 0.8826446533203125, 0.9110488891601562, 0.939453125]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 4.0, 13.0, 18.0, 28.0, 46.0, 120.0, 245.0, 876.0, 3459606.0, 732161.0, 799.0, 164.0, 90.0, 37.0, 28.0, 21.0, 6.0, 3.0, 6.0, 2.0, 0.0, 5.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-22.125, -21.6102294921875, -21.095458984375, -20.5806884765625, -20.06591796875, -19.5511474609375, -19.036376953125, -18.5216064453125, -18.0068359375, -17.4920654296875, -16.977294921875, -16.4625244140625, -15.94775390625, -15.4329833984375, -14.918212890625, -14.4034423828125, -13.888671875, -13.3739013671875, -12.859130859375, -12.3443603515625, -11.82958984375, -11.3148193359375, -10.800048828125, -10.2852783203125, -9.7705078125, -9.2557373046875, -8.740966796875, -8.2261962890625, -7.71142578125, -7.1966552734375, -6.681884765625, -6.1671142578125, -5.65234375, -5.1375732421875, -4.622802734375, -4.1080322265625, -3.59326171875, -3.0784912109375, -2.563720703125, -2.0489501953125, -1.5341796875, -1.0194091796875, -0.504638671875, 0.0101318359375, 0.52490234375, 1.0396728515625, 1.554443359375, 2.0692138671875, 2.583984375, 3.0987548828125, 3.613525390625, 4.1282958984375, 4.64306640625, 5.1578369140625, 5.672607421875, 6.1873779296875, 6.7021484375, 7.2169189453125, 7.731689453125, 8.2464599609375, 8.76123046875, 9.2760009765625, 9.790771484375, 10.3055419921875, 10.8203125]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 7.0, 15.0, 14.0, 27.0, 67.0, 102.0, 190.0, 681.0, 1946.0, 665.0, 165.0, 80.0, 41.0, 27.0, 20.0, 9.0, 7.0, 2.0, 4.0, 2.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2822265625, -1.2540359497070312, -1.2258453369140625, -1.1976547241210938, -1.169464111328125, -1.1412734985351562, -1.1130828857421875, -1.0848922729492188, -1.05670166015625, -1.0285110473632812, -1.0003204345703125, -0.9721298217773438, -0.943939208984375, -0.9157485961914062, -0.8875579833984375, -0.8593673706054688, -0.8311767578125, -0.8029861450195312, -0.7747955322265625, -0.7466049194335938, -0.718414306640625, -0.6902236938476562, -0.6620330810546875, -0.6338424682617188, -0.60565185546875, -0.5774612426757812, -0.5492706298828125, -0.5210800170898438, -0.492889404296875, -0.46469879150390625, -0.4365081787109375, -0.40831756591796875, -0.380126953125, -0.35193634033203125, -0.3237457275390625, -0.29555511474609375, -0.267364501953125, -0.23917388916015625, -0.2109832763671875, -0.18279266357421875, -0.15460205078125, -0.12641143798828125, -0.0982208251953125, -0.07003021240234375, -0.041839599609375, -0.01364898681640625, 0.0145416259765625, 0.04273223876953125, 0.0709228515625, 0.09911346435546875, 0.1273040771484375, 0.15549468994140625, 0.183685302734375, 0.21187591552734375, 0.2400665283203125, 0.26825714111328125, 0.29644775390625, 0.32463836669921875, 0.3528289794921875, 0.38101959228515625, 0.409210205078125, 0.43740081787109375, 0.4655914306640625, 0.49378204345703125, 0.52197265625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 2.0, 7.0, 11.0, 11.0, 8.0, 12.0, 24.0, 24.0, 36.0, 47.0, 53.0, 70.0, 79.0, 89.0, 98.0, 87.0, 70.0, 58.0, 48.0, 44.0, 30.0, 24.0, 14.0, 18.0, 13.0, 10.0, 7.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9769927263259888, -0.9347792863845825, -0.8925658464431763, -0.8503524661064148, -0.8081390261650085, -0.7659255862236023, -0.7237122058868408, -0.6814987659454346, -0.6392853260040283, -0.5970718860626221, -0.5548584461212158, -0.5126450657844543, -0.4704316258430481, -0.42821818590164185, -0.386004775762558, -0.3437913656234741, -0.30157792568206787, -0.2593644857406616, -0.21715107560157776, -0.1749376505613327, -0.13272422552108765, -0.09051080048084259, -0.048297375440597534, -0.006083965301513672, 0.03612947463989258, 0.07834289968013763, 0.12055632472038269, 0.16276974976062775, 0.2049831748008728, 0.24719659984111786, 0.2894100248813629, 0.3316234350204468, 0.3738369941711426, 0.41605043411254883, 0.4582638442516327, 0.5004772543907166, 0.5426906943321228, 0.584904134273529, 0.6271175146102905, 0.6693309545516968, 0.711544394493103, 0.7537578344345093, 0.7959712743759155, 0.838184654712677, 0.8803980946540833, 0.9226115345954895, 0.964824914932251, 1.0070383548736572, 1.0492517948150635, 1.0914652347564697, 1.133678674697876, 1.1758921146392822, 1.2181055545806885, 1.2603188753128052, 1.3025323152542114, 1.3447457551956177, 1.386959195137024, 1.4291726350784302, 1.4713860750198364, 1.5135995149612427, 1.5558128356933594, 1.5980262756347656, 1.6402397155761719, 1.6824531555175781, 1.7246665954589844]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 10.0, 8.0, 11.0, 10.0, 11.0, 15.0, 19.0, 12.0, 19.0, 28.0, 28.0, 28.0, 23.0, 36.0, 41.0, 44.0, 36.0, 31.0, 44.0, 47.0, 41.0, 46.0, 37.0, 35.0, 35.0, 35.0, 34.0, 33.0, 26.0, 28.0, 29.0, 26.0, 15.0, 15.0, 17.0, 13.0, 14.0, 10.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7832375168800354, -0.7575938701629639, -0.7319502830505371, -0.7063066363334656, -0.680662989616394, -0.6550193428993225, -0.629375696182251, -0.6037321090698242, -0.5780884623527527, -0.5524448156356812, -0.5268012285232544, -0.5011575818061829, -0.47551393508911133, -0.4498702883720398, -0.42422667145729065, -0.3985830545425415, -0.37293940782546997, -0.34729576110839844, -0.3216521441936493, -0.29600852727890015, -0.2703648805618286, -0.24472124874591827, -0.21907761693000793, -0.1934339851140976, -0.16779035329818726, -0.14214672148227692, -0.11650308966636658, -0.09085945785045624, -0.0652158260345459, -0.03957219421863556, -0.01392856240272522, 0.01171506941318512, 0.037358641624450684, 0.06300227344036102, 0.08864590525627136, 0.1142895370721817, 0.13993316888809204, 0.16557680070400238, 0.19122043251991272, 0.21686406433582306, 0.2425076961517334, 0.26815134286880493, 0.2937949597835541, 0.3194385766983032, 0.34508222341537476, 0.3707258701324463, 0.39636948704719543, 0.4220131039619446, 0.4476567506790161, 0.47330039739608765, 0.4989440143108368, 0.5245876312255859, 0.5502312779426575, 0.575874924659729, 0.6015185117721558, 0.6271621584892273, 0.6528058052062988, 0.6784494519233704, 0.7040930986404419, 0.7297366857528687, 0.7553803324699402, 0.7810239791870117, 0.8066675662994385, 0.83231121301651, 0.8579548597335815]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 4.0, 12.0, 8.0, 31.0, 29.0, 40.0, 50.0, 84.0, 139.0, 185.0, 251.0, 369.0, 555.0, 753.0, 1155.0, 1643.0, 2561.0, 3756.0, 5780.0, 8996.0, 14705.0, 24379.0, 43156.0, 80441.0, 171793.0, 311438.0, 179636.0, 84756.0, 44890.0, 25105.0, 14985.0, 9146.0, 5832.0, 3889.0, 2508.0, 1682.0, 1156.0, 848.0, 535.0, 408.0, 258.0, 189.0, 131.0, 87.0, 62.0, 44.0, 25.0, 19.0, 20.0, 11.0, 9.0, 6.0, 6.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.397216796875, -0.3850059509277344, -0.37279510498046875, -0.3605842590332031, -0.3483734130859375, -0.3361625671386719, -0.32395172119140625, -0.3117408752441406, -0.299530029296875, -0.2873191833496094, -0.27510833740234375, -0.2628974914550781, -0.2506866455078125, -0.23847579956054688, -0.22626495361328125, -0.21405410766601562, -0.20184326171875, -0.18963241577148438, -0.17742156982421875, -0.16521072387695312, -0.1529998779296875, -0.14078903198242188, -0.12857818603515625, -0.11636734008789062, -0.104156494140625, -0.09194564819335938, -0.07973480224609375, -0.06752395629882812, -0.0553131103515625, -0.043102264404296875, -0.03089141845703125, -0.018680572509765625, -0.0064697265625, 0.005741119384765625, 0.01795196533203125, 0.030162811279296875, 0.0423736572265625, 0.054584503173828125, 0.06679534912109375, 0.07900619506835938, 0.091217041015625, 0.10342788696289062, 0.11563873291015625, 0.12784957885742188, 0.1400604248046875, 0.15227127075195312, 0.16448211669921875, 0.17669296264648438, 0.18890380859375, 0.20111465454101562, 0.21332550048828125, 0.22553634643554688, 0.2377471923828125, 0.24995803833007812, 0.26216888427734375, 0.2743797302246094, 0.286590576171875, 0.2988014221191406, 0.31101226806640625, 0.3232231140136719, 0.3354339599609375, 0.3476448059082031, 0.35985565185546875, 0.3720664978027344, 0.38427734375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 6.0, 2.0, 8.0, 6.0, 8.0, 9.0, 7.0, 14.0, 15.0, 21.0, 21.0, 18.0, 28.0, 31.0, 33.0, 24.0, 31.0, 38.0, 44.0, 43.0, 27.0, 45.0, 46.0, 45.0, 40.0, 46.0, 23.0, 39.0, 32.0, 41.0, 31.0, 36.0, 26.0, 21.0, 19.0, 13.0, 10.0, 9.0, 10.0, 10.0, 6.0, 9.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.467529296875, -0.4515571594238281, -0.43558502197265625, -0.4196128845214844, -0.4036407470703125, -0.3876686096191406, -0.37169647216796875, -0.3557243347167969, -0.339752197265625, -0.3237800598144531, -0.30780792236328125, -0.2918357849121094, -0.2758636474609375, -0.2598915100097656, -0.24391937255859375, -0.22794723510742188, -0.21197509765625, -0.19600296020507812, -0.18003082275390625, -0.16405868530273438, -0.1480865478515625, -0.13211441040039062, -0.11614227294921875, -0.10017013549804688, -0.084197998046875, -0.06822586059570312, -0.05225372314453125, -0.036281585693359375, -0.0203094482421875, -0.004337310791015625, 0.01163482666015625, 0.027606964111328125, 0.0435791015625, 0.059551239013671875, 0.07552337646484375, 0.09149551391601562, 0.1074676513671875, 0.12343978881835938, 0.13941192626953125, 0.15538406372070312, 0.171356201171875, 0.18732833862304688, 0.20330047607421875, 0.21927261352539062, 0.2352447509765625, 0.2512168884277344, 0.26718902587890625, 0.2831611633300781, 0.29913330078125, 0.3151054382324219, 0.33107757568359375, 0.3470497131347656, 0.3630218505859375, 0.3789939880371094, 0.39496612548828125, 0.4109382629394531, 0.426910400390625, 0.4428825378417969, 0.45885467529296875, 0.4748268127441406, 0.4907989501953125, 0.5067710876464844, 0.5227432250976562, 0.5387153625488281, 0.5546875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 10.0, 11.0, 15.0, 19.0, 25.0, 40.0, 50.0, 87.0, 121.0, 226.0, 393.0, 770.0, 1604.0, 4019.0, 11302.0, 38684.0, 175614.0, 592346.0, 167750.0, 37173.0, 10984.0, 3846.0, 1645.0, 757.0, 422.0, 216.0, 130.0, 82.0, 70.0, 45.0, 36.0, 21.0, 11.0, 4.0, 9.0, 4.0, 4.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6591796875, -0.6368255615234375, -0.614471435546875, -0.5921173095703125, -0.56976318359375, -0.5474090576171875, -0.525054931640625, -0.5027008056640625, -0.4803466796875, -0.4579925537109375, -0.435638427734375, -0.4132843017578125, -0.39093017578125, -0.3685760498046875, -0.346221923828125, -0.3238677978515625, -0.301513671875, -0.2791595458984375, -0.256805419921875, -0.2344512939453125, -0.21209716796875, -0.1897430419921875, -0.167388916015625, -0.1450347900390625, -0.1226806640625, -0.1003265380859375, -0.077972412109375, -0.0556182861328125, -0.03326416015625, -0.0109100341796875, 0.011444091796875, 0.0337982177734375, 0.05615234375, 0.0785064697265625, 0.100860595703125, 0.1232147216796875, 0.14556884765625, 0.1679229736328125, 0.190277099609375, 0.2126312255859375, 0.2349853515625, 0.2573394775390625, 0.279693603515625, 0.3020477294921875, 0.32440185546875, 0.3467559814453125, 0.369110107421875, 0.3914642333984375, 0.413818359375, 0.4361724853515625, 0.458526611328125, 0.4808807373046875, 0.50323486328125, 0.5255889892578125, 0.547943115234375, 0.5702972412109375, 0.5926513671875, 0.6150054931640625, 0.637359619140625, 0.6597137451171875, 0.68206787109375, 0.7044219970703125, 0.726776123046875, 0.7491302490234375, 0.771484375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 8.0, 2.0, 3.0, 5.0, 4.0, 9.0, 3.0, 15.0, 16.0, 16.0, 11.0, 18.0, 21.0, 20.0, 22.0, 34.0, 28.0, 31.0, 40.0, 30.0, 30.0, 52.0, 46.0, 31.0, 36.0, 37.0, 42.0, 42.0, 39.0, 35.0, 29.0, 35.0, 33.0, 25.0, 22.0, 22.0, 16.0, 12.0, 18.0, 12.0, 11.0, 10.0, 9.0, 7.0, 8.0, 4.0, 3.0, 3.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.97998046875, -0.9475173950195312, -0.9150543212890625, -0.8825912475585938, -0.850128173828125, -0.8176651000976562, -0.7852020263671875, -0.7527389526367188, -0.72027587890625, -0.6878128051757812, -0.6553497314453125, -0.6228866577148438, -0.590423583984375, -0.5579605102539062, -0.5254974365234375, -0.49303436279296875, -0.4605712890625, -0.42810821533203125, -0.3956451416015625, -0.36318206787109375, -0.330718994140625, -0.29825592041015625, -0.2657928466796875, -0.23332977294921875, -0.20086669921875, -0.16840362548828125, -0.1359405517578125, -0.10347747802734375, -0.071014404296875, -0.03855133056640625, -0.0060882568359375, 0.02637481689453125, 0.058837890625, 0.09130096435546875, 0.1237640380859375, 0.15622711181640625, 0.188690185546875, 0.22115325927734375, 0.2536163330078125, 0.28607940673828125, 0.31854248046875, 0.35100555419921875, 0.3834686279296875, 0.41593170166015625, 0.448394775390625, 0.48085784912109375, 0.5133209228515625, 0.5457839965820312, 0.5782470703125, 0.6107101440429688, 0.6431732177734375, 0.6756362915039062, 0.708099365234375, 0.7405624389648438, 0.7730255126953125, 0.8054885864257812, 0.83795166015625, 0.8704147338867188, 0.9028778076171875, 0.9353408813476562, 0.967803955078125, 1.0002670288085938, 1.0327301025390625, 1.0651931762695312, 1.09765625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 2.0, 5.0, 10.0, 9.0, 11.0, 20.0, 26.0, 41.0, 63.0, 89.0, 133.0, 236.0, 383.0, 614.0, 1075.0, 2224.0, 4633.0, 10843.0, 30540.0, 125972.0, 622456.0, 185615.0, 38995.0, 13142.0, 5604.0, 2588.0, 1322.0, 717.0, 435.0, 263.0, 167.0, 99.0, 58.0, 57.0, 30.0, 29.0, 14.0, 12.0, 6.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1253662109375, -0.12152099609375, -0.11767578125, -0.11383056640625, -0.1099853515625, -0.10614013671875, -0.102294921875, -0.09844970703125, -0.0946044921875, -0.09075927734375, -0.0869140625, -0.08306884765625, -0.0792236328125, -0.07537841796875, -0.071533203125, -0.06768798828125, -0.0638427734375, -0.05999755859375, -0.05615234375, -0.05230712890625, -0.0484619140625, -0.04461669921875, -0.040771484375, -0.03692626953125, -0.0330810546875, -0.02923583984375, -0.025390625, -0.02154541015625, -0.0177001953125, -0.01385498046875, -0.010009765625, -0.00616455078125, -0.0023193359375, 0.00152587890625, 0.00537109375, 0.00921630859375, 0.0130615234375, 0.01690673828125, 0.020751953125, 0.02459716796875, 0.0284423828125, 0.03228759765625, 0.0361328125, 0.03997802734375, 0.0438232421875, 0.04766845703125, 0.051513671875, 0.05535888671875, 0.0592041015625, 0.06304931640625, 0.06689453125, 0.07073974609375, 0.0745849609375, 0.07843017578125, 0.082275390625, 0.08612060546875, 0.0899658203125, 0.09381103515625, 0.09765625, 0.10150146484375, 0.1053466796875, 0.10919189453125, 0.113037109375, 0.11688232421875, 0.1207275390625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 3.0, 8.0, 7.0, 22.0, 24.0, 38.0, 94.0, 202.0, 280.0, 168.0, 66.0, 29.0, 17.0, 17.0, 6.0, 8.0, 4.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014853477478027344, -0.0001431051641702652, -0.00013767555356025696, -0.00013224594295024872, -0.00012681633234024048, -0.00012138672173023224, -0.000115957111120224, -0.00011052750051021576, -0.00010509788990020752, -9.966827929019928e-05, -9.423866868019104e-05, -8.88090580701828e-05, -8.337944746017456e-05, -7.794983685016632e-05, -7.252022624015808e-05, -6.709061563014984e-05, -6.16610050201416e-05, -5.623139441013336e-05, -5.080178380012512e-05, -4.537217319011688e-05, -3.994256258010864e-05, -3.45129519701004e-05, -2.9083341360092163e-05, -2.3653730750083923e-05, -1.8224120140075684e-05, -1.2794509530067444e-05, -7.364898920059204e-06, -1.9352883100509644e-06, 3.4943222999572754e-06, 8.923932909965515e-06, 1.4353543519973755e-05, 1.9783154129981995e-05, 2.5212764739990234e-05, 3.0642375349998474e-05, 3.6071985960006714e-05, 4.1501596570014954e-05, 4.693120718002319e-05, 5.236081779003143e-05, 5.779042840003967e-05, 6.322003901004791e-05, 6.864964962005615e-05, 7.407926023006439e-05, 7.950887084007263e-05, 8.493848145008087e-05, 9.036809206008911e-05, 9.579770267009735e-05, 0.00010122731328010559, 0.00010665692389011383, 0.00011208653450012207, 0.00011751614511013031, 0.00012294575572013855, 0.0001283753663301468, 0.00013380497694015503, 0.00013923458755016327, 0.0001446641981601715, 0.00015009380877017975, 0.000155523419380188, 0.00016095302999019623, 0.00016638264060020447, 0.0001718122512102127, 0.00017724186182022095, 0.0001826714724302292, 0.00018810108304023743, 0.00019353069365024567, 0.0001989603042602539]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 2.0, 3.0, 6.0, 9.0, 12.0, 12.0, 20.0, 26.0, 44.0, 53.0, 93.0, 163.0, 472.0, 1708.0, 9062.0, 84776.0, 867065.0, 74046.0, 8568.0, 1576.0, 383.0, 185.0, 83.0, 46.0, 38.0, 23.0, 15.0, 7.0, 10.0, 16.0, 8.0, 1.0, 1.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.255126953125, -0.24584197998046875, -0.2365570068359375, -0.22727203369140625, -0.217987060546875, -0.20870208740234375, -0.1994171142578125, -0.19013214111328125, -0.18084716796875, -0.17156219482421875, -0.1622772216796875, -0.15299224853515625, -0.143707275390625, -0.13442230224609375, -0.1251373291015625, -0.11585235595703125, -0.1065673828125, -0.09728240966796875, -0.0879974365234375, -0.07871246337890625, -0.069427490234375, -0.06014251708984375, -0.0508575439453125, -0.04157257080078125, -0.03228759765625, -0.02300262451171875, -0.0137176513671875, -0.00443267822265625, 0.004852294921875, 0.01413726806640625, 0.0234222412109375, 0.03270721435546875, 0.0419921875, 0.05127716064453125, 0.0605621337890625, 0.06984710693359375, 0.079132080078125, 0.08841705322265625, 0.0977020263671875, 0.10698699951171875, 0.11627197265625, 0.12555694580078125, 0.1348419189453125, 0.14412689208984375, 0.153411865234375, 0.16269683837890625, 0.1719818115234375, 0.18126678466796875, 0.1905517578125, 0.19983673095703125, 0.2091217041015625, 0.21840667724609375, 0.227691650390625, 0.23697662353515625, 0.2462615966796875, 0.25554656982421875, 0.26483154296875, 0.27411651611328125, 0.2834014892578125, 0.29268646240234375, 0.301971435546875, 0.31125640869140625, 0.3205413818359375, 0.32982635498046875, 0.339111328125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 8.0, 0.0, 3.0, 5.0, 6.0, 3.0, 6.0, 9.0, 7.0, 14.0, 17.0, 20.0, 32.0, 38.0, 49.0, 77.0, 86.0, 109.0, 104.0, 98.0, 79.0, 57.0, 52.0, 40.0, 15.0, 7.0, 9.0, 12.0, 5.0, 6.0, 7.0, 7.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0423583984375, -0.040851593017578125, -0.03934478759765625, -0.037837982177734375, -0.0363311767578125, -0.034824371337890625, -0.03331756591796875, -0.031810760498046875, -0.030303955078125, -0.028797149658203125, -0.02729034423828125, -0.025783538818359375, -0.0242767333984375, -0.022769927978515625, -0.02126312255859375, -0.019756317138671875, -0.01824951171875, -0.016742706298828125, -0.01523590087890625, -0.013729095458984375, -0.0122222900390625, -0.010715484619140625, -0.00920867919921875, -0.007701873779296875, -0.006195068359375, -0.004688262939453125, -0.00318145751953125, -0.001674652099609375, -0.0001678466796875, 0.001338958740234375, 0.00284576416015625, 0.004352569580078125, 0.005859375, 0.007366180419921875, 0.00887298583984375, 0.010379791259765625, 0.0118865966796875, 0.013393402099609375, 0.01490020751953125, 0.016407012939453125, 0.017913818359375, 0.019420623779296875, 0.02092742919921875, 0.022434234619140625, 0.0239410400390625, 0.025447845458984375, 0.02695465087890625, 0.028461456298828125, 0.02996826171875, 0.031475067138671875, 0.03298187255859375, 0.034488677978515625, 0.0359954833984375, 0.037502288818359375, 0.03900909423828125, 0.040515899658203125, 0.042022705078125, 0.043529510498046875, 0.04503631591796875, 0.046543121337890625, 0.0480499267578125, 0.049556732177734375, 0.05106353759765625, 0.052570343017578125, 0.0540771484375]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 6.0, 10.0, 13.0, 48.0, 138.0, 300.0, 284.0, 140.0, 53.0, 13.0, 6.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7234145402908325, -1.645379662513733, -1.5673447847366333, -1.4893099069595337, -1.411275029182434, -1.3332401514053345, -1.2552051544189453, -1.1771702766418457, -1.099135398864746, -1.0211005210876465, -0.9430656433105469, -0.8650307655334473, -0.7869958877563477, -0.708961009979248, -0.6309260725975037, -0.552891194820404, -0.4748563766479492, -0.3968214988708496, -0.31878662109375, -0.240751713514328, -0.1627168357372284, -0.08468195796012878, -0.006647050380706787, 0.07138782739639282, 0.14942270517349243, 0.22745758295059204, 0.30549246072769165, 0.38352736830711365, 0.46156224608421326, 0.5395971536636353, 0.6176320314407349, 0.6956669092178345, 0.7737016677856445, 0.8517365455627441, 0.9297714233398438, 1.0078063011169434, 1.085841178894043, 1.1638760566711426, 1.2419109344482422, 1.3199458122253418, 1.3979806900024414, 1.476015567779541, 1.5540504455566406, 1.6320853233337402, 1.7101202011108398, 1.7881550788879395, 1.866189956665039, 1.9442248344421387, 2.0222597122192383, 2.100294589996338, 2.1783294677734375, 2.256364345550537, 2.3343992233276367, 2.4124341011047363, 2.490468978881836, 2.5685038566589355, 2.6465389728546143, 2.724573850631714, 2.8026087284088135, 2.880643606185913, 2.9586784839630127, 3.0367133617401123, 3.114748239517212, 3.1927831172943115, 3.270817995071411]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 7.0, 5.0, 6.0, 10.0, 6.0, 13.0, 22.0, 14.0, 22.0, 17.0, 27.0, 28.0, 24.0, 36.0, 47.0, 33.0, 30.0, 47.0, 44.0, 42.0, 52.0, 45.0, 36.0, 32.0, 32.0, 45.0, 42.0, 34.0, 36.0, 32.0, 35.0, 24.0, 14.0, 12.0, 13.0, 11.0, 11.0, 10.0, 1.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.49540552496910095, -0.47856956720352173, -0.4617336094379425, -0.4448976516723633, -0.42806169390678406, -0.41122573614120483, -0.394389808177948, -0.3775538206100464, -0.36071789264678955, -0.3438819348812103, -0.3270459771156311, -0.3102100193500519, -0.29337406158447266, -0.27653810381889343, -0.2597021460533142, -0.24286620318889618, -0.22603023052215576, -0.20919427275657654, -0.19235831499099731, -0.1755223572254181, -0.15868639945983887, -0.14185044169425964, -0.1250144988298416, -0.10817854106426239, -0.09134258329868317, -0.07450662553310394, -0.05767067149281502, -0.04083471745252609, -0.02399875968694687, -0.007162801921367645, 0.009673148393630981, 0.026509106159210205, 0.043345093727111816, 0.06018105149269104, 0.07701700925827026, 0.09385295957326889, 0.11068891733884811, 0.12752488255500793, 0.14436082541942596, 0.1611967831850052, 0.1780327409505844, 0.19486869871616364, 0.21170465648174286, 0.2285405993461609, 0.2453765571117401, 0.26221251487731934, 0.27904847264289856, 0.2958844304084778, 0.312720388174057, 0.32955634593963623, 0.34639230370521545, 0.3632282614707947, 0.3800642192363739, 0.3969001770019531, 0.41373610496520996, 0.4305720925331116, 0.4474080204963684, 0.46424397826194763, 0.48107993602752686, 0.4979158937931061, 0.5147518515586853, 0.5315877795219421, 0.5484237670898438, 0.5652596950531006, 0.5820956826210022]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 6.0, 8.0, 12.0, 19.0, 17.0, 45.0, 47.0, 66.0, 95.0, 139.0, 223.0, 298.0, 400.0, 542.0, 805.0, 1194.0, 1783.0, 2511.0, 3643.0, 5385.0, 8093.0, 12271.0, 18494.0, 28566.0, 44604.0, 73856.0, 133460.0, 280382.0, 183934.0, 92881.0, 54460.0, 34101.0, 21735.0, 14236.0, 9588.0, 6459.0, 4417.0, 3087.0, 2124.0, 1389.0, 975.0, 658.0, 496.0, 311.0, 253.0, 135.0, 122.0, 72.0, 58.0, 38.0, 29.0, 13.0, 8.0, 9.0, 4.0, 5.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.1849365234375, -0.17910385131835938, -0.17327117919921875, -0.16743850708007812, -0.1616058349609375, -0.15577316284179688, -0.14994049072265625, -0.14410781860351562, -0.138275146484375, -0.13244247436523438, -0.12660980224609375, -0.12077713012695312, -0.1149444580078125, -0.10911178588867188, -0.10327911376953125, -0.09744644165039062, -0.09161376953125, -0.08578109741210938, -0.07994842529296875, -0.07411575317382812, -0.0682830810546875, -0.062450408935546875, -0.05661773681640625, -0.050785064697265625, -0.044952392578125, -0.039119720458984375, -0.03328704833984375, -0.027454376220703125, -0.0216217041015625, -0.015789031982421875, -0.00995635986328125, -0.004123687744140625, 0.001708984375, 0.007541656494140625, 0.01337432861328125, 0.019207000732421875, 0.0250396728515625, 0.030872344970703125, 0.03670501708984375, 0.042537689208984375, 0.048370361328125, 0.054203033447265625, 0.06003570556640625, 0.06586837768554688, 0.0717010498046875, 0.07753372192382812, 0.08336639404296875, 0.08919906616210938, 0.09503173828125, 0.10086441040039062, 0.10669708251953125, 0.11252975463867188, 0.1183624267578125, 0.12419509887695312, 0.13002777099609375, 0.13586044311523438, 0.141693115234375, 0.14752578735351562, 0.15335845947265625, 0.15919113159179688, 0.1650238037109375, 0.17085647583007812, 0.17668914794921875, 0.18252182006835938, 0.1883544921875]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 5.0, 4.0, 9.0, 10.0, 15.0, 11.0, 17.0, 23.0, 22.0, 12.0, 27.0, 16.0, 20.0, 21.0, 24.0, 36.0, 17.0, 36.0, 28.0, 41.0, 52.0, 61.0, 45.0, 36.0, 38.0, 33.0, 45.0, 31.0, 28.0, 22.0, 35.0, 24.0, 24.0, 18.0, 21.0, 17.0, 11.0, 11.0, 10.0, 9.0, 8.0, 7.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.353515625, -3.24029541015625, -3.1270751953125, -3.01385498046875, -2.900634765625, -2.78741455078125, -2.6741943359375, -2.56097412109375, -2.44775390625, -2.33453369140625, -2.2213134765625, -2.10809326171875, -1.994873046875, -1.88165283203125, -1.7684326171875, -1.65521240234375, -1.5419921875, -1.42877197265625, -1.3155517578125, -1.20233154296875, -1.089111328125, -0.97589111328125, -0.8626708984375, -0.74945068359375, -0.63623046875, -0.52301025390625, -0.4097900390625, -0.29656982421875, -0.183349609375, -0.07012939453125, 0.0430908203125, 0.15631103515625, 0.26953125, 0.38275146484375, 0.4959716796875, 0.60919189453125, 0.722412109375, 0.83563232421875, 0.9488525390625, 1.06207275390625, 1.17529296875, 1.28851318359375, 1.4017333984375, 1.51495361328125, 1.628173828125, 1.74139404296875, 1.8546142578125, 1.96783447265625, 2.0810546875, 2.19427490234375, 2.3074951171875, 2.42071533203125, 2.533935546875, 2.64715576171875, 2.7603759765625, 2.87359619140625, 2.98681640625, 3.10003662109375, 3.2132568359375, 3.32647705078125, 3.439697265625, 3.55291748046875, 3.6661376953125, 3.77935791015625, 3.892578125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 2.0, 3.0, 2.0, 4.0, 4.0, 12.0, 9.0, 18.0, 22.0, 19.0, 22.0, 28.0, 30.0, 32.0, 46.0, 62.0, 80.0, 105.0, 150.0, 305.0, 827.0, 15270.0, 1017048.0, 12811.0, 744.0, 322.0, 138.0, 109.0, 56.0, 55.0, 43.0, 34.0, 23.0, 28.0, 19.0, 11.0, 12.0, 10.0, 5.0, 14.0, 4.0, 4.0, 4.0, 2.0, 5.0, 0.0, 1.0, 2.0, 0.0, 3.0], "bins": [-3.357421875, -3.265411376953125, -3.17340087890625, -3.081390380859375, -2.9893798828125, -2.897369384765625, -2.80535888671875, -2.713348388671875, -2.621337890625, -2.529327392578125, -2.43731689453125, -2.345306396484375, -2.2532958984375, -2.161285400390625, -2.06927490234375, -1.977264404296875, -1.88525390625, -1.793243408203125, -1.70123291015625, -1.609222412109375, -1.5172119140625, -1.425201416015625, -1.33319091796875, -1.241180419921875, -1.149169921875, -1.057159423828125, -0.96514892578125, -0.873138427734375, -0.7811279296875, -0.689117431640625, -0.59710693359375, -0.505096435546875, -0.4130859375, -0.321075439453125, -0.22906494140625, -0.137054443359375, -0.0450439453125, 0.046966552734375, 0.13897705078125, 0.230987548828125, 0.322998046875, 0.415008544921875, 0.50701904296875, 0.599029541015625, 0.6910400390625, 0.783050537109375, 0.87506103515625, 0.967071533203125, 1.05908203125, 1.151092529296875, 1.24310302734375, 1.335113525390625, 1.4271240234375, 1.519134521484375, 1.61114501953125, 1.703155517578125, 1.795166015625, 1.887176513671875, 1.97918701171875, 2.071197509765625, 2.1632080078125, 2.255218505859375, 2.34722900390625, 2.439239501953125, 2.53125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 1.0, 3.0, 2.0, 4.0, 5.0, 13.0, 12.0, 16.0, 20.0, 14.0, 26.0, 27.0, 17.0, 28.0, 37.0, 31.0, 35.0, 39.0, 28.0, 46.0, 40.0, 52.0, 53.0, 36.0, 47.0, 45.0, 33.0, 42.0, 28.0, 32.0, 29.0, 27.0, 22.0, 23.0, 19.0, 11.0, 9.0, 10.0, 7.0, 13.0, 4.0, 3.0, 5.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-4.75390625, -4.6231689453125, -4.492431640625, -4.3616943359375, -4.23095703125, -4.1002197265625, -3.969482421875, -3.8387451171875, -3.7080078125, -3.5772705078125, -3.446533203125, -3.3157958984375, -3.18505859375, -3.0543212890625, -2.923583984375, -2.7928466796875, -2.662109375, -2.5313720703125, -2.400634765625, -2.2698974609375, -2.13916015625, -2.0084228515625, -1.877685546875, -1.7469482421875, -1.6162109375, -1.4854736328125, -1.354736328125, -1.2239990234375, -1.09326171875, -0.9625244140625, -0.831787109375, -0.7010498046875, -0.5703125, -0.4395751953125, -0.308837890625, -0.1781005859375, -0.04736328125, 0.0833740234375, 0.214111328125, 0.3448486328125, 0.4755859375, 0.6063232421875, 0.737060546875, 0.8677978515625, 0.99853515625, 1.1292724609375, 1.260009765625, 1.3907470703125, 1.521484375, 1.6522216796875, 1.782958984375, 1.9136962890625, 2.04443359375, 2.1751708984375, 2.305908203125, 2.4366455078125, 2.5673828125, 2.6981201171875, 2.828857421875, 2.9595947265625, 3.09033203125, 3.2210693359375, 3.351806640625, 3.4825439453125, 3.61328125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 6.0, 6.0, 11.0, 17.0, 22.0, 25.0, 34.0, 49.0, 116.0, 174.0, 272.0, 488.0, 868.0, 1627.0, 3866.0, 14039.0, 894249.0, 116665.0, 9632.0, 3118.0, 1449.0, 718.0, 424.0, 255.0, 154.0, 74.0, 55.0, 35.0, 38.0, 18.0, 15.0, 12.0, 3.0, 5.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.2314453125, -0.22517013549804688, -0.21889495849609375, -0.21261978149414062, -0.2063446044921875, -0.20006942749023438, -0.19379425048828125, -0.18751907348632812, -0.181243896484375, -0.17496871948242188, -0.16869354248046875, -0.16241836547851562, -0.1561431884765625, -0.14986801147460938, -0.14359283447265625, -0.13731765747070312, -0.13104248046875, -0.12476730346679688, -0.11849212646484375, -0.11221694946289062, -0.1059417724609375, -0.09966659545898438, -0.09339141845703125, -0.08711624145507812, -0.080841064453125, -0.07456588745117188, -0.06829071044921875, -0.062015533447265625, -0.0557403564453125, -0.049465179443359375, -0.04319000244140625, -0.036914825439453125, -0.0306396484375, -0.024364471435546875, -0.01808929443359375, -0.011814117431640625, -0.0055389404296875, 0.000736236572265625, 0.00701141357421875, 0.013286590576171875, 0.019561767578125, 0.025836944580078125, 0.03211212158203125, 0.038387298583984375, 0.0446624755859375, 0.050937652587890625, 0.05721282958984375, 0.06348800659179688, 0.06976318359375, 0.07603836059570312, 0.08231353759765625, 0.08858871459960938, 0.0948638916015625, 0.10113906860351562, 0.10741424560546875, 0.11368942260742188, 0.119964599609375, 0.12623977661132812, 0.13251495361328125, 0.13879013061523438, 0.1450653076171875, 0.15134048461914062, 0.15761566162109375, 0.16389083862304688, 0.170166015625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 7.0, 8.0, 17.0, 32.0, 215.0, 595.0, 67.0, 20.0, 9.0, 7.0, 8.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5510787963867188e-05, -2.436526119709015e-05, -2.321973443031311e-05, -2.2074207663536072e-05, -2.0928680896759033e-05, -1.9783154129981995e-05, -1.8637627363204956e-05, -1.7492100596427917e-05, -1.634657382965088e-05, -1.520104706287384e-05, -1.4055520296096802e-05, -1.2909993529319763e-05, -1.1764466762542725e-05, -1.0618939995765686e-05, -9.473413228988647e-06, -8.327886462211609e-06, -7.18235969543457e-06, -6.036832928657532e-06, -4.891306161880493e-06, -3.7457793951034546e-06, -2.600252628326416e-06, -1.4547258615493774e-06, -3.0919909477233887e-07, 8.363276720046997e-07, 1.9818544387817383e-06, 3.127381205558777e-06, 4.2729079723358154e-06, 5.418434739112854e-06, 6.563961505889893e-06, 7.709488272666931e-06, 8.85501503944397e-06, 1.0000541806221008e-05, 1.1146068572998047e-05, 1.2291595339775085e-05, 1.3437122106552124e-05, 1.4582648873329163e-05, 1.57281756401062e-05, 1.687370240688324e-05, 1.801922917366028e-05, 1.9164755940437317e-05, 2.0310282707214355e-05, 2.1455809473991394e-05, 2.2601336240768433e-05, 2.374686300754547e-05, 2.489238977432251e-05, 2.603791654109955e-05, 2.7183443307876587e-05, 2.8328970074653625e-05, 2.9474496841430664e-05, 3.06200236082077e-05, 3.176555037498474e-05, 3.291107714176178e-05, 3.405660390853882e-05, 3.520213067531586e-05, 3.6347657442092896e-05, 3.7493184208869934e-05, 3.863871097564697e-05, 3.978423774242401e-05, 4.092976450920105e-05, 4.207529127597809e-05, 4.322081804275513e-05, 4.4366344809532166e-05, 4.5511871576309204e-05, 4.665739834308624e-05, 4.780292510986328e-05]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 12.0, 21.0, 24.0, 21.0, 49.0, 80.0, 103.0, 195.0, 479.0, 973.0, 2485.0, 10857.0, 992173.0, 34409.0, 4017.0, 1347.0, 625.0, 278.0, 170.0, 57.0, 54.0, 38.0, 37.0, 17.0, 12.0, 3.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.3642578125, -0.353759765625, -0.34326171875, -0.332763671875, -0.322265625, -0.311767578125, -0.30126953125, -0.290771484375, -0.2802734375, -0.269775390625, -0.25927734375, -0.248779296875, -0.23828125, -0.227783203125, -0.21728515625, -0.206787109375, -0.1962890625, -0.185791015625, -0.17529296875, -0.164794921875, -0.154296875, -0.143798828125, -0.13330078125, -0.122802734375, -0.1123046875, -0.101806640625, -0.09130859375, -0.080810546875, -0.0703125, -0.059814453125, -0.04931640625, -0.038818359375, -0.0283203125, -0.017822265625, -0.00732421875, 0.003173828125, 0.013671875, 0.024169921875, 0.03466796875, 0.045166015625, 0.0556640625, 0.066162109375, 0.07666015625, 0.087158203125, 0.09765625, 0.108154296875, 0.11865234375, 0.129150390625, 0.1396484375, 0.150146484375, 0.16064453125, 0.171142578125, 0.181640625, 0.192138671875, 0.20263671875, 0.213134765625, 0.2236328125, 0.234130859375, 0.24462890625, 0.255126953125, 0.265625, 0.276123046875, 0.28662109375, 0.297119140625, 0.3076171875]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 15.0, 33.0, 88.0, 694.0, 93.0, 32.0, 20.0, 6.0, 4.0, 4.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.145263671875, -0.14129066467285156, -0.13731765747070312, -0.1333446502685547, -0.12937164306640625, -0.1253986358642578, -0.12142562866210938, -0.11745262145996094, -0.1134796142578125, -0.10950660705566406, -0.10553359985351562, -0.10156059265136719, -0.09758758544921875, -0.09361457824707031, -0.08964157104492188, -0.08566856384277344, -0.081695556640625, -0.07772254943847656, -0.07374954223632812, -0.06977653503417969, -0.06580352783203125, -0.06183052062988281, -0.057857513427734375, -0.05388450622558594, -0.0499114990234375, -0.04593849182128906, -0.041965484619140625, -0.03799247741699219, -0.03401947021484375, -0.030046463012695312, -0.026073455810546875, -0.022100448608398438, -0.01812744140625, -0.014154434204101562, -0.010181427001953125, -0.0062084197998046875, -0.00223541259765625, 0.0017375946044921875, 0.005710601806640625, 0.009683609008789062, 0.0136566162109375, 0.017629623413085938, 0.021602630615234375, 0.025575637817382812, 0.02954864501953125, 0.03352165222167969, 0.037494659423828125, 0.04146766662597656, 0.045440673828125, 0.04941368103027344, 0.053386688232421875, 0.05735969543457031, 0.06133270263671875, 0.06530570983886719, 0.06927871704101562, 0.07325172424316406, 0.0772247314453125, 0.08119773864746094, 0.08517074584960938, 0.08914375305175781, 0.09311676025390625, 0.09708976745605469, 0.10106277465820312, 0.10503578186035156, 0.1090087890625]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 26.0, 929.0, 67.0, 0.0, 0.0, 1.0], "bins": [-40.947471618652344, -40.26072311401367, -39.573974609375, -38.887229919433594, -38.20048141479492, -37.51373291015625, -36.82698440551758, -36.140235900878906, -35.453487396240234, -34.76673889160156, -34.07999038696289, -33.39324188232422, -32.70649719238281, -32.01974868774414, -31.33300018310547, -30.646251678466797, -29.959505081176758, -29.272756576538086, -28.586009979248047, -27.899261474609375, -27.212512969970703, -26.52576446533203, -25.839017868041992, -25.15226936340332, -24.46552276611328, -23.77877426147461, -23.09202766418457, -22.4052791595459, -21.718530654907227, -21.031784057617188, -20.345035552978516, -19.658287048339844, -18.971540451049805, -18.284791946411133, -17.598045349121094, -16.911296844482422, -16.22454833984375, -15.537800788879395, -14.851053237915039, -14.164304733276367, -13.477556228637695, -12.79080867767334, -12.104060173034668, -11.417312622070312, -10.73056411743164, -10.043816566467285, -9.35706901550293, -8.670320510864258, -7.9835734367370605, -7.296825408935547, -6.610077857971191, -5.923329830169678, -5.236581802368164, -4.54983377456665, -3.863086223602295, -3.1763381958007812, -2.4895901679992676, -1.8028422594070435, -1.1160943508148193, -0.42934656143188477, 0.2574014663696289, 0.9441494941711426, 1.630897045135498, 2.3176450729370117, 3.0043931007385254]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 5.0, 5.0, 2.0, 8.0, 7.0, 12.0, 12.0, 14.0, 18.0, 22.0, 21.0, 28.0, 25.0, 21.0, 26.0, 33.0, 38.0, 40.0, 43.0, 43.0, 41.0, 40.0, 46.0, 50.0, 37.0, 35.0, 47.0, 24.0, 43.0, 27.0, 20.0, 29.0, 26.0, 24.0, 17.0, 17.0, 11.0, 8.0, 8.0, 12.0, 5.0, 4.0, 3.0, 1.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.156064033508301, -5.960081100463867, -5.764098644256592, -5.568115711212158, -5.372132778167725, -5.176150321960449, -4.980167388916016, -4.784184455871582, -4.588201999664307, -4.392219066619873, -4.196236610412598, -4.000253677368164, -3.8042709827423096, -3.608288288116455, -3.4123053550720215, -3.216322660446167, -3.0203397274017334, -2.824357032775879, -2.6283740997314453, -2.432391405105591, -2.2364087104797363, -2.0404257774353027, -1.8444430828094482, -1.6484603881835938, -1.4524775743484497, -1.2564947605133057, -1.0605120658874512, -0.8645292520523071, -0.6685464978218079, -0.4725637435913086, -0.27658092975616455, -0.08059823513031006, 0.11538457870483398, 0.31136733293533325, 0.5073500871658325, 0.7033329010009766, 0.8993156552314758, 1.095298409461975, 1.2912812232971191, 1.4872639179229736, 1.6832467317581177, 1.8792295455932617, 2.075212240219116, 2.2711949348449707, 2.4671778678894043, 2.663160562515259, 2.8591432571411133, 3.055126190185547, 3.2511088848114014, 3.447091579437256, 3.6430745124816895, 3.839057207107544, 4.035039901733398, 4.231022834777832, 4.427005767822266, 4.622988224029541, 4.818971157073975, 5.014954090118408, 5.210936546325684, 5.406919479370117, 5.602902412414551, 5.798884868621826, 5.99486780166626, 6.190850257873535, 6.386833190917969]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 1.0, 4.0, 2.0, 6.0, 4.0, 10.0, 8.0, 14.0, 13.0, 18.0, 24.0, 22.0, 26.0, 24.0, 50.0, 47.0, 87.0, 184.0, 441.0, 1176.0, 4386.0, 21286.0, 874982.0, 3238203.0, 43019.0, 7062.0, 1899.0, 622.0, 256.0, 109.0, 60.0, 41.0, 36.0, 35.0, 21.0, 19.0, 19.0, 17.0, 13.0, 8.0, 5.0, 5.0, 3.0, 7.0, 3.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.84375, -1.782623291015625, -1.72149658203125, -1.660369873046875, -1.5992431640625, -1.538116455078125, -1.47698974609375, -1.415863037109375, -1.354736328125, -1.293609619140625, -1.23248291015625, -1.171356201171875, -1.1102294921875, -1.049102783203125, -0.98797607421875, -0.926849365234375, -0.86572265625, -0.804595947265625, -0.74346923828125, -0.682342529296875, -0.6212158203125, -0.560089111328125, -0.49896240234375, -0.437835693359375, -0.376708984375, -0.315582275390625, -0.25445556640625, -0.193328857421875, -0.1322021484375, -0.071075439453125, -0.00994873046875, 0.051177978515625, 0.1123046875, 0.173431396484375, 0.23455810546875, 0.295684814453125, 0.3568115234375, 0.417938232421875, 0.47906494140625, 0.540191650390625, 0.601318359375, 0.662445068359375, 0.72357177734375, 0.784698486328125, 0.8458251953125, 0.906951904296875, 0.96807861328125, 1.029205322265625, 1.09033203125, 1.151458740234375, 1.21258544921875, 1.273712158203125, 1.3348388671875, 1.395965576171875, 1.45709228515625, 1.518218994140625, 1.579345703125, 1.640472412109375, 1.70159912109375, 1.762725830078125, 1.8238525390625, 1.884979248046875, 1.94610595703125, 2.007232666015625, 2.068359375]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 11.0, 14.0, 9.0, 14.0, 15.0, 17.0, 20.0, 29.0, 35.0, 44.0, 47.0, 39.0, 52.0, 54.0, 61.0, 56.0, 50.0, 67.0, 56.0, 51.0, 57.0, 40.0, 38.0, 32.0, 24.0, 14.0, 19.0, 12.0, 9.0, 7.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.447998046875, -0.4272346496582031, -0.40647125244140625, -0.3857078552246094, -0.3649444580078125, -0.3441810607910156, -0.32341766357421875, -0.3026542663574219, -0.281890869140625, -0.2611274719238281, -0.24036407470703125, -0.21960067749023438, -0.1988372802734375, -0.17807388305664062, -0.15731048583984375, -0.13654708862304688, -0.11578369140625, -0.09502029418945312, -0.07425689697265625, -0.053493499755859375, -0.0327301025390625, -0.011966705322265625, 0.00879669189453125, 0.029560089111328125, 0.050323486328125, 0.07108688354492188, 0.09185028076171875, 0.11261367797851562, 0.1333770751953125, 0.15414047241210938, 0.17490386962890625, 0.19566726684570312, 0.2164306640625, 0.23719406127929688, 0.25795745849609375, 0.2787208557128906, 0.2994842529296875, 0.3202476501464844, 0.34101104736328125, 0.3617744445800781, 0.382537841796875, 0.4033012390136719, 0.42406463623046875, 0.4448280334472656, 0.4655914306640625, 0.4863548278808594, 0.5071182250976562, 0.5278816223144531, 0.54864501953125, 0.5694084167480469, 0.5901718139648438, 0.6109352111816406, 0.6316986083984375, 0.6524620056152344, 0.6732254028320312, 0.6939888000488281, 0.714752197265625, 0.7355155944824219, 0.7562789916992188, 0.7770423889160156, 0.7978057861328125, 0.8185691833496094, 0.8393325805664062, 0.8600959777832031, 0.880859375]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 8.0, 22.0, 101.0, 4193788.0, 310.0, 37.0, 11.0, 11.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.2421875, -13.4971923828125, -11.752197265625, -10.0072021484375, -8.26220703125, -6.5172119140625, -4.772216796875, -3.0272216796875, -1.2822265625, 0.4627685546875, 2.207763671875, 3.9527587890625, 5.69775390625, 7.4427490234375, 9.187744140625, 10.9327392578125, 12.677734375, 14.4227294921875, 16.167724609375, 17.9127197265625, 19.65771484375, 21.4027099609375, 23.147705078125, 24.8927001953125, 26.6376953125, 28.3826904296875, 30.127685546875, 31.8726806640625, 33.61767578125, 35.3626708984375, 37.107666015625, 38.8526611328125, 40.59765625, 42.3426513671875, 44.087646484375, 45.8326416015625, 47.57763671875, 49.3226318359375, 51.067626953125, 52.8126220703125, 54.5576171875, 56.3026123046875, 58.047607421875, 59.7926025390625, 61.53759765625, 63.2825927734375, 65.027587890625, 66.7725830078125, 68.517578125, 70.2625732421875, 72.007568359375, 73.7525634765625, 75.49755859375, 77.2425537109375, 78.987548828125, 80.7325439453125, 82.4775390625, 84.2225341796875, 85.967529296875, 87.7125244140625, 89.45751953125, 91.2025146484375, 92.947509765625, 94.6925048828125, 96.4375]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 5.0, 7.0, 21.0, 21.0, 30.0, 39.0, 74.0, 127.0, 311.0, 957.0, 1422.0, 588.0, 196.0, 113.0, 62.0, 38.0, 26.0, 17.0, 10.0, 6.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.296875, -0.282928466796875, -0.26898193359375, -0.255035400390625, -0.2410888671875, -0.227142333984375, -0.21319580078125, -0.199249267578125, -0.185302734375, -0.171356201171875, -0.15740966796875, -0.143463134765625, -0.1295166015625, -0.115570068359375, -0.10162353515625, -0.087677001953125, -0.07373046875, -0.059783935546875, -0.04583740234375, -0.031890869140625, -0.0179443359375, -0.003997802734375, 0.00994873046875, 0.023895263671875, 0.037841796875, 0.051788330078125, 0.06573486328125, 0.079681396484375, 0.0936279296875, 0.107574462890625, 0.12152099609375, 0.135467529296875, 0.1494140625, 0.163360595703125, 0.17730712890625, 0.191253662109375, 0.2052001953125, 0.219146728515625, 0.23309326171875, 0.247039794921875, 0.260986328125, 0.274932861328125, 0.28887939453125, 0.302825927734375, 0.3167724609375, 0.330718994140625, 0.34466552734375, 0.358612060546875, 0.37255859375, 0.386505126953125, 0.40045166015625, 0.414398193359375, 0.4283447265625, 0.442291259765625, 0.45623779296875, 0.470184326171875, 0.484130859375, 0.498077392578125, 0.51202392578125, 0.525970458984375, 0.5399169921875, 0.553863525390625, 0.56781005859375, 0.581756591796875, 0.595703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 5.0, 4.0, 9.0, 15.0, 27.0, 42.0, 60.0, 104.0, 142.0, 186.0, 165.0, 99.0, 57.0, 31.0, 26.0, 23.0, 12.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5449100136756897, -0.5015302300453186, -0.4581504464149475, -0.4147706627845764, -0.3713908791542053, -0.32801109552383423, -0.28463128209114075, -0.24125149846076965, -0.19787171483039856, -0.15449193120002747, -0.11111214011907578, -0.06773234903812408, -0.02435256540775299, 0.019027218222618103, 0.06240701675415039, 0.10578680038452148, 0.14916658401489258, 0.19254636764526367, 0.23592615127563477, 0.27930593490600586, 0.32268571853637695, 0.36606550216674805, 0.40944531559944153, 0.4528250992298126, 0.4962048828601837, 0.5395846962928772, 0.5829644799232483, 0.6263442635536194, 0.6697240471839905, 0.7131038308143616, 0.7564836144447327, 0.7998633980751038, 0.8432432413101196, 0.8866230249404907, 0.9300028085708618, 0.9733825922012329, 1.016762375831604, 1.060142159461975, 1.1035219430923462, 1.1469017267227173, 1.1902815103530884, 1.2336612939834595, 1.2770410776138306, 1.3204208612442017, 1.3638006448745728, 1.4071804285049438, 1.450560212135315, 1.493939995765686, 1.5373198986053467, 1.5806996822357178, 1.6240794658660889, 1.66745924949646, 1.710839033126831, 1.7542188167572021, 1.7975986003875732, 1.8409783840179443, 1.8843581676483154, 1.9277379512786865, 1.9711177349090576, 2.0144975185394287, 2.0578773021698, 2.101257085800171, 2.144636869430542, 2.188016653060913, 2.231396436691284]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 5.0, 3.0, 6.0, 10.0, 10.0, 11.0, 15.0, 19.0, 23.0, 24.0, 32.0, 35.0, 34.0, 31.0, 29.0, 32.0, 49.0, 38.0, 44.0, 48.0, 57.0, 48.0, 34.0, 43.0, 50.0, 33.0, 27.0, 40.0, 30.0, 24.0, 20.0, 18.0, 16.0, 17.0, 8.0, 11.0, 12.0, 4.0, 5.0, 3.0, 3.0, 1.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5113065838813782, -0.49378257989883423, -0.47625860571861267, -0.4587346315383911, -0.44121062755584717, -0.4236866235733032, -0.40616264939308167, -0.3886386752128601, -0.37111467123031616, -0.3535906672477722, -0.33606669306755066, -0.3185427188873291, -0.30101871490478516, -0.2834947109222412, -0.26597073674201965, -0.2484467476606369, -0.23092275857925415, -0.2133987694978714, -0.19587478041648865, -0.1783507913351059, -0.16082680225372314, -0.1433028131723404, -0.12577882409095764, -0.10825483500957489, -0.09073084592819214, -0.07320685684680939, -0.055682867765426636, -0.038158878684043884, -0.020634889602661133, -0.0031109005212783813, 0.01441308856010437, 0.03193707764148712, 0.0494610071182251, 0.06698499619960785, 0.0845089852809906, 0.10203297436237335, 0.1195569634437561, 0.13708095252513885, 0.1546049416065216, 0.17212893068790436, 0.1896529197692871, 0.20717690885066986, 0.2247008979320526, 0.24222488701343536, 0.2597488760948181, 0.27727288007736206, 0.2947968542575836, 0.3123208284378052, 0.3298448324203491, 0.34736883640289307, 0.3648928105831146, 0.3824167847633362, 0.3999407887458801, 0.4174647927284241, 0.43498876690864563, 0.4525127410888672, 0.47003674507141113, 0.4875607490539551, 0.505084753036499, 0.5226086974143982, 0.5401327013969421, 0.5576567053794861, 0.5751806497573853, 0.5927046537399292, 0.6102286577224731]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 9.0, 11.0, 11.0, 20.0, 30.0, 35.0, 60.0, 91.0, 157.0, 229.0, 345.0, 525.0, 852.0, 1356.0, 2300.0, 3898.0, 7022.0, 13536.0, 28545.0, 64499.0, 172676.0, 395900.0, 211852.0, 76748.0, 32839.0, 15962.0, 8160.0, 4315.0, 2485.0, 1489.0, 932.0, 587.0, 385.0, 228.0, 147.0, 100.0, 73.0, 49.0, 35.0, 23.0, 19.0, 9.0, 10.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.293212890625, -0.28421783447265625, -0.2752227783203125, -0.26622772216796875, -0.257232666015625, -0.24823760986328125, -0.2392425537109375, -0.23024749755859375, -0.22125244140625, -0.21225738525390625, -0.2032623291015625, -0.19426727294921875, -0.185272216796875, -0.17627716064453125, -0.1672821044921875, -0.15828704833984375, -0.1492919921875, -0.14029693603515625, -0.1313018798828125, -0.12230682373046875, -0.113311767578125, -0.10431671142578125, -0.0953216552734375, -0.08632659912109375, -0.07733154296875, -0.06833648681640625, -0.0593414306640625, -0.05034637451171875, -0.041351318359375, -0.03235626220703125, -0.0233612060546875, -0.01436614990234375, -0.00537109375, 0.00362396240234375, 0.0126190185546875, 0.02161407470703125, 0.030609130859375, 0.03960418701171875, 0.0485992431640625, 0.05759429931640625, 0.06658935546875, 0.07558441162109375, 0.0845794677734375, 0.09357452392578125, 0.102569580078125, 0.11156463623046875, 0.1205596923828125, 0.12955474853515625, 0.1385498046875, 0.14754486083984375, 0.1565399169921875, 0.16553497314453125, 0.174530029296875, 0.18352508544921875, 0.1925201416015625, 0.20151519775390625, 0.21051025390625, 0.21950531005859375, 0.2285003662109375, 0.23749542236328125, 0.246490478515625, 0.25548553466796875, 0.2644805908203125, 0.27347564697265625, 0.282470703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 5.0, 2.0, 8.0, 10.0, 9.0, 17.0, 12.0, 21.0, 24.0, 31.0, 41.0, 33.0, 31.0, 36.0, 36.0, 34.0, 57.0, 59.0, 59.0, 41.0, 53.0, 45.0, 51.0, 41.0, 34.0, 35.0, 43.0, 30.0, 20.0, 19.0, 18.0, 7.0, 18.0, 3.0, 9.0, 3.0, 3.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.339111328125, -0.32689666748046875, -0.3146820068359375, -0.30246734619140625, -0.290252685546875, -0.27803802490234375, -0.2658233642578125, -0.25360870361328125, -0.24139404296875, -0.22917938232421875, -0.2169647216796875, -0.20475006103515625, -0.192535400390625, -0.18032073974609375, -0.1681060791015625, -0.15589141845703125, -0.1436767578125, -0.13146209716796875, -0.1192474365234375, -0.10703277587890625, -0.094818115234375, -0.08260345458984375, -0.0703887939453125, -0.05817413330078125, -0.04595947265625, -0.03374481201171875, -0.0215301513671875, -0.00931549072265625, 0.002899169921875, 0.01511383056640625, 0.0273284912109375, 0.03954315185546875, 0.0517578125, 0.06397247314453125, 0.0761871337890625, 0.08840179443359375, 0.100616455078125, 0.11283111572265625, 0.1250457763671875, 0.13726043701171875, 0.14947509765625, 0.16168975830078125, 0.1739044189453125, 0.18611907958984375, 0.198333740234375, 0.21054840087890625, 0.2227630615234375, 0.23497772216796875, 0.2471923828125, 0.25940704345703125, 0.2716217041015625, 0.28383636474609375, 0.296051025390625, 0.30826568603515625, 0.3204803466796875, 0.33269500732421875, 0.34490966796875, 0.35712432861328125, 0.3693389892578125, 0.38155364990234375, 0.393768310546875, 0.40598297119140625, 0.4181976318359375, 0.43041229248046875, 0.442626953125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 2.0, 3.0, 4.0, 4.0, 6.0, 14.0, 11.0, 8.0, 22.0, 33.0, 49.0, 95.0, 123.0, 216.0, 392.0, 681.0, 1404.0, 3334.0, 8996.0, 28500.0, 113722.0, 499199.0, 299948.0, 63492.0, 17577.0, 5957.0, 2388.0, 1051.0, 529.0, 297.0, 171.0, 100.0, 68.0, 47.0, 26.0, 30.0, 14.0, 10.0, 9.0, 9.0, 6.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.392578125, -0.3812980651855469, -0.37001800537109375, -0.3587379455566406, -0.3474578857421875, -0.3361778259277344, -0.32489776611328125, -0.3136177062988281, -0.302337646484375, -0.2910575866699219, -0.27977752685546875, -0.2684974670410156, -0.2572174072265625, -0.24593734741210938, -0.23465728759765625, -0.22337722778320312, -0.21209716796875, -0.20081710815429688, -0.18953704833984375, -0.17825698852539062, -0.1669769287109375, -0.15569686889648438, -0.14441680908203125, -0.13313674926757812, -0.121856689453125, -0.11057662963867188, -0.09929656982421875, -0.08801651000976562, -0.0767364501953125, -0.06545639038085938, -0.05417633056640625, -0.042896270751953125, -0.0316162109375, -0.020336151123046875, -0.00905609130859375, 0.002223968505859375, 0.0135040283203125, 0.024784088134765625, 0.03606414794921875, 0.047344207763671875, 0.058624267578125, 0.06990432739257812, 0.08118438720703125, 0.09246444702148438, 0.1037445068359375, 0.11502456665039062, 0.12630462646484375, 0.13758468627929688, 0.14886474609375, 0.16014480590820312, 0.17142486572265625, 0.18270492553710938, 0.1939849853515625, 0.20526504516601562, 0.21654510498046875, 0.22782516479492188, 0.239105224609375, 0.2503852844238281, 0.26166534423828125, 0.2729454040527344, 0.2842254638671875, 0.2955055236816406, 0.30678558349609375, 0.3180656433105469, 0.329345703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 4.0, 8.0, 6.0, 10.0, 15.0, 10.0, 16.0, 14.0, 17.0, 17.0, 21.0, 32.0, 30.0, 32.0, 28.0, 33.0, 43.0, 42.0, 54.0, 40.0, 29.0, 47.0, 50.0, 30.0, 33.0, 33.0, 34.0, 29.0, 13.0, 19.0, 22.0, 21.0, 26.0, 16.0, 20.0, 14.0, 20.0, 9.0, 16.0, 13.0, 3.0, 12.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.57666015625, -0.5589218139648438, -0.5411834716796875, -0.5234451293945312, -0.505706787109375, -0.48796844482421875, -0.4702301025390625, -0.45249176025390625, -0.43475341796875, -0.41701507568359375, -0.3992767333984375, -0.38153839111328125, -0.363800048828125, -0.34606170654296875, -0.3283233642578125, -0.31058502197265625, -0.2928466796875, -0.27510833740234375, -0.2573699951171875, -0.23963165283203125, -0.221893310546875, -0.20415496826171875, -0.1864166259765625, -0.16867828369140625, -0.15093994140625, -0.13320159912109375, -0.1154632568359375, -0.09772491455078125, -0.079986572265625, -0.06224822998046875, -0.0445098876953125, -0.02677154541015625, -0.009033203125, 0.00870513916015625, 0.0264434814453125, 0.04418182373046875, 0.061920166015625, 0.07965850830078125, 0.0973968505859375, 0.11513519287109375, 0.13287353515625, 0.15061187744140625, 0.1683502197265625, 0.18608856201171875, 0.203826904296875, 0.22156524658203125, 0.2393035888671875, 0.25704193115234375, 0.2747802734375, 0.29251861572265625, 0.3102569580078125, 0.32799530029296875, 0.345733642578125, 0.36347198486328125, 0.3812103271484375, 0.39894866943359375, 0.41668701171875, 0.43442535400390625, 0.4521636962890625, 0.46990203857421875, 0.487640380859375, 0.5053787231445312, 0.5231170654296875, 0.5408554077148438, 0.55859375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 9.0, 12.0, 10.0, 20.0, 33.0, 41.0, 46.0, 79.0, 118.0, 180.0, 309.0, 586.0, 1259.0, 2802.0, 7479.0, 25836.0, 123278.0, 604784.0, 222153.0, 41322.0, 10983.0, 3818.0, 1578.0, 833.0, 389.0, 247.0, 121.0, 85.0, 50.0, 27.0, 16.0, 12.0, 17.0, 7.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.1011962890625, -0.09857845306396484, -0.09596061706542969, -0.09334278106689453, -0.09072494506835938, -0.08810710906982422, -0.08548927307128906, -0.0828714370727539, -0.08025360107421875, -0.0776357650756836, -0.07501792907714844, -0.07240009307861328, -0.06978225708007812, -0.06716442108154297, -0.06454658508300781, -0.061928749084472656, -0.0593109130859375, -0.056693077087402344, -0.05407524108886719, -0.05145740509033203, -0.048839569091796875, -0.04622173309326172, -0.04360389709472656, -0.040986061096191406, -0.03836822509765625, -0.035750389099121094, -0.03313255310058594, -0.03051471710205078, -0.027896881103515625, -0.02527904510498047, -0.022661209106445312, -0.020043373107910156, -0.017425537109375, -0.014807701110839844, -0.012189865112304688, -0.009572029113769531, -0.006954193115234375, -0.004336357116699219, -0.0017185211181640625, 0.0008993148803710938, 0.00351715087890625, 0.006134986877441406, 0.008752822875976562, 0.011370658874511719, 0.013988494873046875, 0.01660633087158203, 0.019224166870117188, 0.021842002868652344, 0.0244598388671875, 0.027077674865722656, 0.029695510864257812, 0.03231334686279297, 0.034931182861328125, 0.03754901885986328, 0.04016685485839844, 0.042784690856933594, 0.04540252685546875, 0.048020362854003906, 0.05063819885253906, 0.05325603485107422, 0.055873870849609375, 0.05849170684814453, 0.06110954284667969, 0.06372737884521484, 0.06634521484375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 6.0, 4.0, 10.0, 10.0, 10.0, 20.0, 24.0, 29.0, 38.0, 47.0, 88.0, 100.0, 136.0, 122.0, 86.0, 71.0, 53.0, 34.0, 36.0, 20.0, 9.0, 4.0, 6.0, 11.0, 3.0, 5.0, 10.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.404783248901367e-05, -4.2280182242393494e-05, -4.0512531995773315e-05, -3.874488174915314e-05, -3.697723150253296e-05, -3.520958125591278e-05, -3.34419310092926e-05, -3.1674280762672424e-05, -2.9906630516052246e-05, -2.8138980269432068e-05, -2.637133002281189e-05, -2.460367977619171e-05, -2.2836029529571533e-05, -2.1068379282951355e-05, -1.9300729036331177e-05, -1.7533078789711e-05, -1.576542854309082e-05, -1.3997778296470642e-05, -1.2230128049850464e-05, -1.0462477803230286e-05, -8.694827556610107e-06, -6.927177309989929e-06, -5.159527063369751e-06, -3.3918768167495728e-06, -1.6242265701293945e-06, 1.434236764907837e-07, 1.911073923110962e-06, 3.67872416973114e-06, 5.446374416351318e-06, 7.214024662971497e-06, 8.981674909591675e-06, 1.0749325156211853e-05, 1.2516975402832031e-05, 1.428462564945221e-05, 1.6052275896072388e-05, 1.7819926142692566e-05, 1.9587576389312744e-05, 2.1355226635932922e-05, 2.31228768825531e-05, 2.489052712917328e-05, 2.6658177375793457e-05, 2.8425827622413635e-05, 3.0193477869033813e-05, 3.196112811565399e-05, 3.372877836227417e-05, 3.549642860889435e-05, 3.7264078855514526e-05, 3.9031729102134705e-05, 4.079937934875488e-05, 4.256702959537506e-05, 4.433467984199524e-05, 4.610233008861542e-05, 4.7869980335235596e-05, 4.9637630581855774e-05, 5.140528082847595e-05, 5.317293107509613e-05, 5.494058132171631e-05, 5.670823156833649e-05, 5.8475881814956665e-05, 6.024353206157684e-05, 6.201118230819702e-05, 6.37788325548172e-05, 6.554648280143738e-05, 6.731413304805756e-05, 6.908178329467773e-05]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 8.0, 2.0, 7.0, 3.0, 4.0, 2.0, 5.0, 10.0, 25.0, 13.0, 21.0, 23.0, 22.0, 37.0, 51.0, 70.0, 241.0, 14388.0, 1029056.0, 4094.0, 149.0, 79.0, 48.0, 25.0, 34.0, 28.0, 15.0, 10.0, 14.0, 12.0, 7.0, 10.0, 6.0, 4.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.396484375, -0.38385772705078125, -0.3712310791015625, -0.35860443115234375, -0.345977783203125, -0.33335113525390625, -0.3207244873046875, -0.30809783935546875, -0.29547119140625, -0.28284454345703125, -0.2702178955078125, -0.25759124755859375, -0.244964599609375, -0.23233795166015625, -0.2197113037109375, -0.20708465576171875, -0.1944580078125, -0.18183135986328125, -0.1692047119140625, -0.15657806396484375, -0.143951416015625, -0.13132476806640625, -0.1186981201171875, -0.10607147216796875, -0.09344482421875, -0.08081817626953125, -0.0681915283203125, -0.05556488037109375, -0.042938232421875, -0.03031158447265625, -0.0176849365234375, -0.00505828857421875, 0.007568359375, 0.02019500732421875, 0.0328216552734375, 0.04544830322265625, 0.058074951171875, 0.07070159912109375, 0.0833282470703125, 0.09595489501953125, 0.10858154296875, 0.12120819091796875, 0.1338348388671875, 0.14646148681640625, 0.159088134765625, 0.17171478271484375, 0.1843414306640625, 0.19696807861328125, 0.2095947265625, 0.22222137451171875, 0.2348480224609375, 0.24747467041015625, 0.260101318359375, 0.27272796630859375, 0.2853546142578125, 0.29798126220703125, 0.31060791015625, 0.32323455810546875, 0.3358612060546875, 0.34848785400390625, 0.361114501953125, 0.37374114990234375, 0.3863677978515625, 0.39899444580078125, 0.41162109375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 1.0, 3.0, 4.0, 6.0, 14.0, 8.0, 7.0, 8.0, 13.0, 19.0, 27.0, 33.0, 33.0, 46.0, 49.0, 49.0, 55.0, 67.0, 53.0, 73.0, 59.0, 52.0, 61.0, 47.0, 34.0, 27.0, 24.0, 26.0, 17.0, 17.0, 13.0, 10.0, 9.0, 7.0, 8.0, 4.0, 6.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0164337158203125, -0.015799522399902344, -0.015165328979492188, -0.014531135559082031, -0.013896942138671875, -0.013262748718261719, -0.012628555297851562, -0.011994361877441406, -0.01136016845703125, -0.010725975036621094, -0.010091781616210938, -0.009457588195800781, -0.008823394775390625, -0.008189201354980469, -0.0075550079345703125, -0.006920814514160156, -0.00628662109375, -0.005652427673339844, -0.0050182342529296875, -0.004384040832519531, -0.003749847412109375, -0.0031156539916992188, -0.0024814605712890625, -0.0018472671508789062, -0.00121307373046875, -0.0005788803100585938, 5.53131103515625e-05, 0.0006895065307617188, 0.001323699951171875, 0.0019578933715820312, 0.0025920867919921875, 0.0032262802124023438, 0.0038604736328125, 0.004494667053222656, 0.0051288604736328125, 0.005763053894042969, 0.006397247314453125, 0.007031440734863281, 0.0076656341552734375, 0.008299827575683594, 0.00893402099609375, 0.009568214416503906, 0.010202407836914062, 0.010836601257324219, 0.011470794677734375, 0.012104988098144531, 0.012739181518554688, 0.013373374938964844, 0.014007568359375, 0.014641761779785156, 0.015275955200195312, 0.01591014862060547, 0.016544342041015625, 0.01717853546142578, 0.017812728881835938, 0.018446922302246094, 0.01908111572265625, 0.019715309143066406, 0.020349502563476562, 0.02098369598388672, 0.021617889404296875, 0.02225208282470703, 0.022886276245117188, 0.023520469665527344, 0.0241546630859375]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 3.0, 11.0, 14.0, 26.0, 35.0, 62.0, 100.0, 150.0, 172.0, 146.0, 123.0, 51.0, 53.0, 20.0, 13.0, 9.0, 7.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.477413535118103, -0.4553607404232025, -0.4333079755306244, -0.4112551808357239, -0.38920241594314575, -0.36714962124824524, -0.3450968265533447, -0.3230440616607666, -0.3009912669658661, -0.2789384722709656, -0.25688570737838745, -0.23483291268348694, -0.21278013288974762, -0.1907273530960083, -0.1686745584011078, -0.14662177860736847, -0.12456899881362915, -0.10251621901988983, -0.08046343177556992, -0.05841064453125, -0.03635786473751068, -0.014305084943771362, 0.00774770975112915, 0.02980048954486847, 0.05185326933860779, 0.0739060491323471, 0.09595883637666702, 0.11801162362098694, 0.14006440341472626, 0.16211718320846558, 0.1841699779033661, 0.2062227576971054, 0.22827553749084473, 0.25032833218574524, 0.27238109707832336, 0.2944338917732239, 0.316486656665802, 0.3385394513607025, 0.360592246055603, 0.38264501094818115, 0.40469780564308167, 0.4267506003379822, 0.4488033652305603, 0.4708561599254608, 0.49290895462036133, 0.5149617195129395, 0.5370144844055176, 0.5590673089027405, 0.5811200737953186, 0.6031728386878967, 0.6252256631851196, 0.6472784280776978, 0.6693311929702759, 0.691383957862854, 0.7134367823600769, 0.735489547252655, 0.7575423717498779, 0.779595136642456, 0.801647961139679, 0.8237007260322571, 0.8457534909248352, 0.8678063154220581, 0.8898590803146362, 0.9119118452072144, 0.9339646100997925]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 6.0, 7.0, 8.0, 10.0, 17.0, 19.0, 29.0, 29.0, 44.0, 30.0, 31.0, 44.0, 48.0, 46.0, 45.0, 49.0, 62.0, 52.0, 56.0, 59.0, 45.0, 50.0, 33.0, 34.0, 34.0, 25.0, 23.0, 19.0, 13.0, 11.0, 4.0, 11.0, 2.0, 2.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.374891996383667, -0.3621973395347595, -0.34950268268585205, -0.3368080258369446, -0.3241133689880371, -0.31141871213912964, -0.29872405529022217, -0.2860293984413147, -0.2733347415924072, -0.26064008474349976, -0.24794542789459229, -0.23525077104568481, -0.22255611419677734, -0.20986145734786987, -0.1971667855978012, -0.18447212874889374, -0.17177745699882507, -0.1590828001499176, -0.14638814330101013, -0.13369348645210266, -0.1209988221526146, -0.10830416530370712, -0.09560950100421906, -0.08291484415531158, -0.07022018730640411, -0.05752553045749664, -0.044830869883298874, -0.032136209309101105, -0.019441552460193634, -0.006746895611286163, 0.005947768688201904, 0.018642425537109375, 0.03133705258369446, 0.04403170943260193, 0.0567263700067997, 0.06942103058099747, 0.08211568742990494, 0.09481034427881241, 0.10750500857830048, 0.12019966542720795, 0.13289432227611542, 0.1455889791250229, 0.15828363597393036, 0.17097830772399902, 0.1836729645729065, 0.19636762142181396, 0.20906227827072144, 0.2217569351196289, 0.23445159196853638, 0.24714624881744385, 0.2598409056663513, 0.2725355625152588, 0.28523021936416626, 0.29792487621307373, 0.3106195330619812, 0.32331418991088867, 0.33600884675979614, 0.3487035036087036, 0.3613981604576111, 0.37409281730651855, 0.386787474155426, 0.3994821310043335, 0.41217678785324097, 0.42487144470214844, 0.4375661313533783]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 5.0, 4.0, 8.0, 5.0, 9.0, 18.0, 22.0, 28.0, 32.0, 46.0, 72.0, 92.0, 150.0, 230.0, 318.0, 502.0, 839.0, 1501.0, 2586.0, 4830.0, 9223.0, 18370.0, 38922.0, 87838.0, 220991.0, 365720.0, 165878.0, 67388.0, 30787.0, 14913.0, 7735.0, 3978.0, 2174.0, 1242.0, 721.0, 466.0, 297.0, 182.0, 133.0, 93.0, 53.0, 41.0, 40.0, 26.0, 19.0, 9.0, 9.0, 7.0, 5.0, 2.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1292724609375, -0.12514877319335938, -0.12102508544921875, -0.11690139770507812, -0.1127777099609375, -0.10865402221679688, -0.10453033447265625, -0.10040664672851562, -0.096282958984375, -0.09215927124023438, -0.08803558349609375, -0.08391189575195312, -0.0797882080078125, -0.07566452026367188, -0.07154083251953125, -0.06741714477539062, -0.06329345703125, -0.059169769287109375, -0.05504608154296875, -0.050922393798828125, -0.0467987060546875, -0.042675018310546875, -0.03855133056640625, -0.034427642822265625, -0.030303955078125, -0.026180267333984375, -0.02205657958984375, -0.017932891845703125, -0.0138092041015625, -0.009685516357421875, -0.00556182861328125, -0.001438140869140625, 0.002685546875, 0.006809234619140625, 0.01093292236328125, 0.015056610107421875, 0.0191802978515625, 0.023303985595703125, 0.02742767333984375, 0.031551361083984375, 0.035675048828125, 0.039798736572265625, 0.04392242431640625, 0.048046112060546875, 0.0521697998046875, 0.056293487548828125, 0.06041717529296875, 0.06454086303710938, 0.06866455078125, 0.07278823852539062, 0.07691192626953125, 0.08103561401367188, 0.0851593017578125, 0.08928298950195312, 0.09340667724609375, 0.09753036499023438, 0.101654052734375, 0.10577774047851562, 0.10990142822265625, 0.11402511596679688, 0.1181488037109375, 0.12227249145507812, 0.12639617919921875, 0.13051986694335938, 0.1346435546875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 8.0, 4.0, 9.0, 9.0, 18.0, 17.0, 13.0, 23.0, 13.0, 34.0, 33.0, 26.0, 36.0, 36.0, 46.0, 43.0, 54.0, 64.0, 57.0, 49.0, 42.0, 45.0, 52.0, 38.0, 36.0, 31.0, 29.0, 26.0, 23.0, 13.0, 13.0, 11.0, 11.0, 9.0, 6.0, 8.0, 5.0, 7.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8779296875, -1.8259124755859375, -1.773895263671875, -1.7218780517578125, -1.66986083984375, -1.6178436279296875, -1.565826416015625, -1.5138092041015625, -1.4617919921875, -1.4097747802734375, -1.357757568359375, -1.3057403564453125, -1.25372314453125, -1.2017059326171875, -1.149688720703125, -1.0976715087890625, -1.045654296875, -0.9936370849609375, -0.941619873046875, -0.8896026611328125, -0.83758544921875, -0.7855682373046875, -0.733551025390625, -0.6815338134765625, -0.6295166015625, -0.5774993896484375, -0.525482177734375, -0.4734649658203125, -0.42144775390625, -0.3694305419921875, -0.317413330078125, -0.2653961181640625, -0.21337890625, -0.1613616943359375, -0.109344482421875, -0.0573272705078125, -0.00531005859375, 0.0467071533203125, 0.098724365234375, 0.1507415771484375, 0.2027587890625, 0.2547760009765625, 0.306793212890625, 0.3588104248046875, 0.41082763671875, 0.4628448486328125, 0.514862060546875, 0.5668792724609375, 0.618896484375, 0.6709136962890625, 0.722930908203125, 0.7749481201171875, 0.82696533203125, 0.8789825439453125, 0.930999755859375, 0.9830169677734375, 1.0350341796875, 1.0870513916015625, 1.139068603515625, 1.1910858154296875, 1.24310302734375, 1.2951202392578125, 1.347137451171875, 1.3991546630859375, 1.451171875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 6.0, 4.0, 2.0, 5.0, 7.0, 16.0, 14.0, 24.0, 30.0, 51.0, 45.0, 57.0, 65.0, 80.0, 343.0, 1045766.0, 1505.0, 156.0, 78.0, 53.0, 48.0, 47.0, 44.0, 29.0, 19.0, 20.0, 10.0, 11.0, 8.0, 7.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.91796875, -6.7298583984375, -6.541748046875, -6.3536376953125, -6.16552734375, -5.9774169921875, -5.789306640625, -5.6011962890625, -5.4130859375, -5.2249755859375, -5.036865234375, -4.8487548828125, -4.66064453125, -4.4725341796875, -4.284423828125, -4.0963134765625, -3.908203125, -3.7200927734375, -3.531982421875, -3.3438720703125, -3.15576171875, -2.9676513671875, -2.779541015625, -2.5914306640625, -2.4033203125, -2.2152099609375, -2.027099609375, -1.8389892578125, -1.65087890625, -1.4627685546875, -1.274658203125, -1.0865478515625, -0.8984375, -0.7103271484375, -0.522216796875, -0.3341064453125, -0.14599609375, 0.0421142578125, 0.230224609375, 0.4183349609375, 0.6064453125, 0.7945556640625, 0.982666015625, 1.1707763671875, 1.35888671875, 1.5469970703125, 1.735107421875, 1.9232177734375, 2.111328125, 2.2994384765625, 2.487548828125, 2.6756591796875, 2.86376953125, 3.0518798828125, 3.239990234375, 3.4281005859375, 3.6162109375, 3.8043212890625, 3.992431640625, 4.1805419921875, 4.36865234375, 4.5567626953125, 4.744873046875, 4.9329833984375, 5.12109375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 6.0, 4.0, 2.0, 4.0, 8.0, 18.0, 12.0, 27.0, 31.0, 50.0, 50.0, 50.0, 50.0, 66.0, 67.0, 79.0, 61.0, 58.0, 63.0, 49.0, 49.0, 48.0, 43.0, 27.0, 21.0, 19.0, 10.0, 11.0, 8.0, 8.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.755859375, -2.6807861328125, -2.605712890625, -2.5306396484375, -2.45556640625, -2.3804931640625, -2.305419921875, -2.2303466796875, -2.1552734375, -2.0802001953125, -2.005126953125, -1.9300537109375, -1.85498046875, -1.7799072265625, -1.704833984375, -1.6297607421875, -1.5546875, -1.4796142578125, -1.404541015625, -1.3294677734375, -1.25439453125, -1.1793212890625, -1.104248046875, -1.0291748046875, -0.9541015625, -0.8790283203125, -0.803955078125, -0.7288818359375, -0.65380859375, -0.5787353515625, -0.503662109375, -0.4285888671875, -0.353515625, -0.2784423828125, -0.203369140625, -0.1282958984375, -0.05322265625, 0.0218505859375, 0.096923828125, 0.1719970703125, 0.2470703125, 0.3221435546875, 0.397216796875, 0.4722900390625, 0.54736328125, 0.6224365234375, 0.697509765625, 0.7725830078125, 0.84765625, 0.9227294921875, 0.997802734375, 1.0728759765625, 1.14794921875, 1.2230224609375, 1.298095703125, 1.3731689453125, 1.4482421875, 1.5233154296875, 1.598388671875, 1.6734619140625, 1.74853515625, 1.8236083984375, 1.898681640625, 1.9737548828125, 2.048828125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 3.0, 4.0, 13.0, 6.0, 10.0, 11.0, 16.0, 28.0, 56.0, 119.0, 909.0, 47024.0, 995990.0, 3841.0, 290.0, 99.0, 41.0, 22.0, 18.0, 11.0, 15.0, 12.0, 3.0, 4.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2939453125, -0.2842254638671875, -0.274505615234375, -0.2647857666015625, -0.25506591796875, -0.2453460693359375, -0.235626220703125, -0.2259063720703125, -0.2161865234375, -0.2064666748046875, -0.196746826171875, -0.1870269775390625, -0.17730712890625, -0.1675872802734375, -0.157867431640625, -0.1481475830078125, -0.138427734375, -0.1287078857421875, -0.118988037109375, -0.1092681884765625, -0.09954833984375, -0.0898284912109375, -0.080108642578125, -0.0703887939453125, -0.0606689453125, -0.0509490966796875, -0.041229248046875, -0.0315093994140625, -0.02178955078125, -0.0120697021484375, -0.002349853515625, 0.0073699951171875, 0.01708984375, 0.0268096923828125, 0.036529541015625, 0.0462493896484375, 0.05596923828125, 0.0656890869140625, 0.075408935546875, 0.0851287841796875, 0.0948486328125, 0.1045684814453125, 0.114288330078125, 0.1240081787109375, 0.13372802734375, 0.1434478759765625, 0.153167724609375, 0.1628875732421875, 0.172607421875, 0.1823272705078125, 0.192047119140625, 0.2017669677734375, 0.21148681640625, 0.2212066650390625, 0.230926513671875, 0.2406463623046875, 0.2503662109375, 0.2600860595703125, 0.269805908203125, 0.2795257568359375, 0.28924560546875, 0.2989654541015625, 0.308685302734375, 0.3184051513671875, 0.328125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 2.0, 9.0, 11.0, 11.0, 22.0, 24.0, 53.0, 76.0, 184.0, 223.0, 162.0, 68.0, 49.0, 29.0, 21.0, 7.0, 9.0, 12.0, 7.0, 5.0, 5.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.110004425048828e-05, -2.0592473447322845e-05, -2.008490264415741e-05, -1.9577331840991974e-05, -1.9069761037826538e-05, -1.8562190234661102e-05, -1.8054619431495667e-05, -1.754704862833023e-05, -1.7039477825164795e-05, -1.653190702199936e-05, -1.6024336218833923e-05, -1.5516765415668488e-05, -1.5009194612503052e-05, -1.4501623809337616e-05, -1.399405300617218e-05, -1.3486482203006744e-05, -1.2978911399841309e-05, -1.2471340596675873e-05, -1.1963769793510437e-05, -1.1456198990345001e-05, -1.0948628187179565e-05, -1.044105738401413e-05, -9.933486580848694e-06, -9.425915777683258e-06, -8.918344974517822e-06, -8.410774171352386e-06, -7.90320336818695e-06, -7.395632565021515e-06, -6.888061761856079e-06, -6.380490958690643e-06, -5.8729201555252075e-06, -5.365349352359772e-06, -4.857778549194336e-06, -4.3502077460289e-06, -3.842636942863464e-06, -3.3350661396980286e-06, -2.8274953365325928e-06, -2.319924533367157e-06, -1.8123537302017212e-06, -1.3047829270362854e-06, -7.972121238708496e-07, -2.896413207054138e-07, 2.1792948246002197e-07, 7.255002856254578e-07, 1.2330710887908936e-06, 1.7406418919563293e-06, 2.248212695121765e-06, 2.755783498287201e-06, 3.2633543014526367e-06, 3.7709251046180725e-06, 4.278495907783508e-06, 4.786066710948944e-06, 5.29363751411438e-06, 5.801208317279816e-06, 6.3087791204452515e-06, 6.816349923610687e-06, 7.323920726776123e-06, 7.831491529941559e-06, 8.339062333106995e-06, 8.84663313627243e-06, 9.354203939437866e-06, 9.861774742603302e-06, 1.0369345545768738e-05, 1.0876916348934174e-05, 1.138448715209961e-05]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 7.0, 8.0, 7.0, 6.0, 10.0, 31.0, 43.0, 45.0, 147.0, 408.0, 2067.0, 22442.0, 948740.0, 69620.0, 3908.0, 698.0, 151.0, 80.0, 50.0, 24.0, 16.0, 14.0, 8.0, 4.0, 1.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.177734375, -0.1726055145263672, -0.16747665405273438, -0.16234779357910156, -0.15721893310546875, -0.15209007263183594, -0.14696121215820312, -0.1418323516845703, -0.1367034912109375, -0.1315746307373047, -0.12644577026367188, -0.12131690979003906, -0.11618804931640625, -0.11105918884277344, -0.10593032836914062, -0.10080146789550781, -0.095672607421875, -0.09054374694824219, -0.08541488647460938, -0.08028602600097656, -0.07515716552734375, -0.07002830505371094, -0.06489944458007812, -0.05977058410644531, -0.0546417236328125, -0.04951286315917969, -0.044384002685546875, -0.03925514221191406, -0.03412628173828125, -0.028997421264648438, -0.023868560791015625, -0.018739700317382812, -0.01361083984375, -0.008481979370117188, -0.003353118896484375, 0.0017757415771484375, 0.00690460205078125, 0.012033462524414062, 0.017162322998046875, 0.022291183471679688, 0.0274200439453125, 0.03254890441894531, 0.037677764892578125, 0.04280662536621094, 0.04793548583984375, 0.05306434631347656, 0.058193206787109375, 0.06332206726074219, 0.068450927734375, 0.07357978820800781, 0.07870864868164062, 0.08383750915527344, 0.08896636962890625, 0.09409523010253906, 0.09922409057617188, 0.10435295104980469, 0.1094818115234375, 0.11461067199707031, 0.11973953247070312, 0.12486839294433594, 0.12999725341796875, 0.13512611389160156, 0.14025497436523438, 0.1453838348388672, 0.1505126953125]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 1.0, 4.0, 9.0, 14.0, 17.0, 22.0, 28.0, 41.0, 65.0, 91.0, 110.0, 137.0, 141.0, 91.0, 48.0, 44.0, 30.0, 21.0, 25.0, 11.0, 13.0, 12.0, 5.0, 5.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0243988037109375, -0.023578405380249023, -0.022758007049560547, -0.02193760871887207, -0.021117210388183594, -0.020296812057495117, -0.01947641372680664, -0.018656015396118164, -0.017835617065429688, -0.01701521873474121, -0.016194820404052734, -0.015374422073364258, -0.014554023742675781, -0.013733625411987305, -0.012913227081298828, -0.012092828750610352, -0.011272430419921875, -0.010452032089233398, -0.009631633758544922, -0.008811235427856445, -0.007990837097167969, -0.007170438766479492, -0.006350040435791016, -0.005529642105102539, -0.0047092437744140625, -0.003888845443725586, -0.0030684471130371094, -0.002248048782348633, -0.0014276504516601562, -0.0006072521209716797, 0.00021314620971679688, 0.0010335445404052734, 0.00185394287109375, 0.0026743412017822266, 0.003494739532470703, 0.00431513786315918, 0.005135536193847656, 0.005955934524536133, 0.006776332855224609, 0.007596731185913086, 0.008417129516601562, 0.009237527847290039, 0.010057926177978516, 0.010878324508666992, 0.011698722839355469, 0.012519121170043945, 0.013339519500732422, 0.014159917831420898, 0.014980316162109375, 0.01580071449279785, 0.016621112823486328, 0.017441511154174805, 0.01826190948486328, 0.019082307815551758, 0.019902706146240234, 0.02072310447692871, 0.021543502807617188, 0.022363901138305664, 0.02318429946899414, 0.024004697799682617, 0.024825096130371094, 0.02564549446105957, 0.026465892791748047, 0.027286291122436523, 0.028106689453125]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 13.0, 35.0, 115.0, 333.0, 351.0, 114.0, 38.0, 9.0, 8.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8259516954421997, -0.7229790091514587, -0.6200063228607178, -0.5170336365699768, -0.41406095027923584, -0.3110882639884949, -0.2081155776977539, -0.10514289140701294, -0.0021702051162719727, 0.100802481174469, 0.20377516746520996, 0.3067478537559509, 0.4097205400466919, 0.5126932263374329, 0.6156659126281738, 0.7186385989189148, 0.8216112852096558, 0.9245839715003967, 1.0275566577911377, 1.1305294036865234, 1.2335020303726196, 1.3364746570587158, 1.4394474029541016, 1.5424201488494873, 1.6453927755355835, 1.7483654022216797, 1.8513381481170654, 1.9543108940124512, 2.057283401489258, 2.1602561473846436, 2.2632288932800293, 2.366201639175415, 2.469174385070801, 2.5721471309661865, 2.6751198768615723, 2.778092384338379, 2.8810651302337646, 2.9840378761291504, 3.087010383605957, 3.1899831295013428, 3.2929558753967285, 3.3959286212921143, 3.4989013671875, 3.6018738746643066, 3.7048466205596924, 3.807819366455078, 3.9107918739318848, 4.01376485824585, 4.116737365722656, 4.219709873199463, 4.322682857513428, 4.425655364990234, 4.528628349304199, 4.631600856781006, 4.7345733642578125, 4.837546348571777, 4.940518856048584, 5.043491363525391, 5.1464643478393555, 5.249436855316162, 5.352409362792969, 5.455382347106934, 5.55835485458374, 5.661327838897705, 5.764300346374512]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 8.0, 7.0, 6.0, 11.0, 12.0, 17.0, 15.0, 17.0, 19.0, 30.0, 24.0, 31.0, 43.0, 29.0, 30.0, 38.0, 35.0, 40.0, 43.0, 50.0, 57.0, 40.0, 48.0, 33.0, 42.0, 33.0, 42.0, 26.0, 33.0, 34.0, 30.0, 16.0, 14.0, 15.0, 9.0, 8.0, 10.0, 4.0, 5.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4271254539489746, -2.3518643379211426, -2.2766032218933105, -2.2013418674468994, -2.1260807514190674, -2.0508196353912354, -1.9755585193634033, -1.9002974033355713, -1.8250361680984497, -1.7497750520706177, -1.674513816833496, -1.599252700805664, -1.523991584777832, -1.4487303495407104, -1.3734692335128784, -1.2982079982757568, -1.2229468822479248, -1.1476857662200928, -1.0724245309829712, -0.9971634149551392, -0.9219022393226624, -0.8466410636901855, -0.7713799476623535, -0.6961187720298767, -0.6208575963973999, -0.5455964207649231, -0.4703352749347687, -0.39507412910461426, -0.31981295347213745, -0.24455177783966064, -0.16929063200950623, -0.0940294861793518, -0.018768310546875, 0.05649285018444061, 0.13175401091575623, 0.20701517164707184, 0.28227633237838745, 0.35753750801086426, 0.4327986538410187, 0.5080597996711731, 0.5833209753036499, 0.6585821509361267, 0.7338433265686035, 0.8091044425964355, 0.8843656182289124, 0.9596267938613892, 1.0348879098892212, 1.1101491451263428, 1.1854102611541748, 1.2606713771820068, 1.3359326124191284, 1.4111937284469604, 1.486454963684082, 1.561716079711914, 1.636977195739746, 1.7122383117675781, 1.7874995470046997, 1.8627606630325317, 1.9380218982696533, 2.0132830142974854, 2.0885441303253174, 2.1638054847717285, 2.2390666007995605, 2.3143277168273926, 2.3895888328552246]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 5.0, 3.0, 5.0, 5.0, 14.0, 10.0, 8.0, 13.0, 13.0, 18.0, 24.0, 26.0, 31.0, 31.0, 69.0, 130.0, 366.0, 1186.0, 4414.0, 29050.0, 3083652.0, 1051195.0, 18500.0, 3691.0, 1058.0, 363.0, 123.0, 64.0, 47.0, 37.0, 28.0, 30.0, 14.0, 13.0, 14.0, 13.0, 7.0, 9.0, 5.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.89453125, -1.836944580078125, -1.77935791015625, -1.721771240234375, -1.6641845703125, -1.606597900390625, -1.54901123046875, -1.491424560546875, -1.433837890625, -1.376251220703125, -1.31866455078125, -1.261077880859375, -1.2034912109375, -1.145904541015625, -1.08831787109375, -1.030731201171875, -0.97314453125, -0.915557861328125, -0.85797119140625, -0.800384521484375, -0.7427978515625, -0.685211181640625, -0.62762451171875, -0.570037841796875, -0.512451171875, -0.454864501953125, -0.39727783203125, -0.339691162109375, -0.2821044921875, -0.224517822265625, -0.16693115234375, -0.109344482421875, -0.0517578125, 0.005828857421875, 0.06341552734375, 0.121002197265625, 0.1785888671875, 0.236175537109375, 0.29376220703125, 0.351348876953125, 0.408935546875, 0.466522216796875, 0.52410888671875, 0.581695556640625, 0.6392822265625, 0.696868896484375, 0.75445556640625, 0.812042236328125, 0.86962890625, 0.927215576171875, 0.98480224609375, 1.042388916015625, 1.0999755859375, 1.157562255859375, 1.21514892578125, 1.272735595703125, 1.330322265625, 1.387908935546875, 1.44549560546875, 1.503082275390625, 1.5606689453125, 1.618255615234375, 1.67584228515625, 1.733428955078125, 1.791015625]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 13.0, 15.0, 18.0, 22.0, 23.0, 29.0, 40.0, 31.0, 43.0, 69.0, 74.0, 64.0, 54.0, 61.0, 84.0, 58.0, 54.0, 56.0, 45.0, 30.0, 35.0, 22.0, 16.0, 9.0, 9.0, 7.0, 5.0, 4.0, 2.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2958984375, -0.2823486328125, -0.268798828125, -0.2552490234375, -0.24169921875, -0.2281494140625, -0.214599609375, -0.2010498046875, -0.1875, -0.1739501953125, -0.160400390625, -0.1468505859375, -0.13330078125, -0.1197509765625, -0.106201171875, -0.0926513671875, -0.0791015625, -0.0655517578125, -0.052001953125, -0.0384521484375, -0.02490234375, -0.0113525390625, 0.002197265625, 0.0157470703125, 0.029296875, 0.0428466796875, 0.056396484375, 0.0699462890625, 0.08349609375, 0.0970458984375, 0.110595703125, 0.1241455078125, 0.1376953125, 0.1512451171875, 0.164794921875, 0.1783447265625, 0.19189453125, 0.2054443359375, 0.218994140625, 0.2325439453125, 0.24609375, 0.2596435546875, 0.273193359375, 0.2867431640625, 0.30029296875, 0.3138427734375, 0.327392578125, 0.3409423828125, 0.3544921875, 0.3680419921875, 0.381591796875, 0.3951416015625, 0.40869140625, 0.4222412109375, 0.435791015625, 0.4493408203125, 0.462890625, 0.4764404296875, 0.489990234375, 0.5035400390625, 0.51708984375, 0.5306396484375, 0.544189453125, 0.5577392578125, 0.5712890625]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 7.0, 5.0, 20.0, 40.0, 148.0, 432.0, 10353.0, 4181463.0, 1370.0, 298.0, 91.0, 29.0, 8.0, 4.0, 2.0, 4.0, 7.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.62890625, -5.37640380859375, -5.1239013671875, -4.87139892578125, -4.618896484375, -4.36639404296875, -4.1138916015625, -3.86138916015625, -3.60888671875, -3.35638427734375, -3.1038818359375, -2.85137939453125, -2.598876953125, -2.34637451171875, -2.0938720703125, -1.84136962890625, -1.5888671875, -1.33636474609375, -1.0838623046875, -0.83135986328125, -0.578857421875, -0.32635498046875, -0.0738525390625, 0.17864990234375, 0.43115234375, 0.68365478515625, 0.9361572265625, 1.18865966796875, 1.441162109375, 1.69366455078125, 1.9461669921875, 2.19866943359375, 2.451171875, 2.70367431640625, 2.9561767578125, 3.20867919921875, 3.461181640625, 3.71368408203125, 3.9661865234375, 4.21868896484375, 4.47119140625, 4.72369384765625, 4.9761962890625, 5.22869873046875, 5.481201171875, 5.73370361328125, 5.9862060546875, 6.23870849609375, 6.4912109375, 6.74371337890625, 6.9962158203125, 7.24871826171875, 7.501220703125, 7.75372314453125, 8.0062255859375, 8.25872802734375, 8.51123046875, 8.76373291015625, 9.0162353515625, 9.26873779296875, 9.521240234375, 9.77374267578125, 10.0262451171875, 10.27874755859375, 10.53125]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 4.0, 3.0, 7.0, 4.0, 8.0, 14.0, 12.0, 19.0, 30.0, 46.0, 68.0, 78.0, 149.0, 285.0, 612.0, 1065.0, 811.0, 360.0, 170.0, 89.0, 77.0, 39.0, 34.0, 26.0, 18.0, 13.0, 11.0, 7.0, 4.0, 4.0, 3.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2861328125, -0.2781181335449219, -0.27010345458984375, -0.2620887756347656, -0.2540740966796875, -0.24605941772460938, -0.23804473876953125, -0.23003005981445312, -0.222015380859375, -0.21400070190429688, -0.20598602294921875, -0.19797134399414062, -0.1899566650390625, -0.18194198608398438, -0.17392730712890625, -0.16591262817382812, -0.15789794921875, -0.14988327026367188, -0.14186859130859375, -0.13385391235351562, -0.1258392333984375, -0.11782455444335938, -0.10980987548828125, -0.10179519653320312, -0.093780517578125, -0.08576583862304688, -0.07775115966796875, -0.06973648071289062, -0.0617218017578125, -0.053707122802734375, -0.04569244384765625, -0.037677764892578125, -0.0296630859375, -0.021648406982421875, -0.01363372802734375, -0.005619049072265625, 0.0023956298828125, 0.010410308837890625, 0.01842498779296875, 0.026439666748046875, 0.034454345703125, 0.042469024658203125, 0.05048370361328125, 0.058498382568359375, 0.0665130615234375, 0.07452774047851562, 0.08254241943359375, 0.09055709838867188, 0.09857177734375, 0.10658645629882812, 0.11460113525390625, 0.12261581420898438, 0.1306304931640625, 0.13864517211914062, 0.14665985107421875, 0.15467453002929688, 0.162689208984375, 0.17070388793945312, 0.17871856689453125, 0.18673324584960938, 0.1947479248046875, 0.20276260375976562, 0.21077728271484375, 0.21879196166992188, 0.226806640625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 9.0, 17.0, 35.0, 44.0, 75.0, 125.0, 193.0, 187.0, 122.0, 68.0, 52.0, 26.0, 17.0, 11.0, 7.0, 2.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5024560689926147, -0.4691631495952606, -0.4358702003955841, -0.40257728099823, -0.36928433179855347, -0.33599141240119934, -0.3026984930038452, -0.2694055438041687, -0.23611262440681458, -0.20281969010829926, -0.16952675580978394, -0.1362338364124298, -0.10294090211391449, -0.06964796781539917, -0.036355048418045044, -0.003062114119529724, 0.030230820178985596, 0.06352375447750092, 0.09681668132543564, 0.13010960817337036, 0.16340254247188568, 0.196695476770401, 0.22998839616775513, 0.26328134536743164, 0.29657426476478577, 0.3298671841621399, 0.3631601333618164, 0.39645305275917053, 0.42974597215652466, 0.46303892135620117, 0.4963318407535553, 0.5296247601509094, 0.5629177093505859, 0.5962106585502625, 0.6295035481452942, 0.6627964973449707, 0.6960894465446472, 0.7293823957443237, 0.7626752853393555, 0.795968234539032, 0.8292611837387085, 0.862554132938385, 0.8958470225334167, 0.9291399717330933, 0.9624329209327698, 0.9957258701324463, 1.029018759727478, 1.0623116493225098, 1.095604658126831, 1.1288975477218628, 1.162190556526184, 1.1954834461212158, 1.2287763357162476, 1.2620693445205688, 1.2953622341156006, 1.3286551237106323, 1.361948013305664, 1.3952409029006958, 1.428533911705017, 1.4618268013000488, 1.4951196908950806, 1.5284126996994019, 1.5617055892944336, 1.5949984788894653, 1.6282914876937866]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 8.0, 4.0, 9.0, 16.0, 13.0, 13.0, 11.0, 24.0, 18.0, 21.0, 23.0, 39.0, 40.0, 48.0, 46.0, 49.0, 38.0, 44.0, 64.0, 46.0, 52.0, 38.0, 45.0, 52.0, 33.0, 28.0, 32.0, 43.0, 18.0, 13.0, 19.0, 13.0, 11.0, 9.0, 3.0, 8.0, 2.0, 3.0, 3.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3722960650920868, -0.35986608266830444, -0.3474361002445221, -0.33500614762306213, -0.3225761651992798, -0.31014618277549744, -0.2977162003517151, -0.2852862477302551, -0.2728562653064728, -0.26042628288269043, -0.24799631536006927, -0.23556633293628693, -0.22313636541366577, -0.21070638298988342, -0.19827640056610107, -0.18584643304347992, -0.17341645061969757, -0.16098646819591522, -0.14855650067329407, -0.13612651824951172, -0.12369655072689056, -0.11126656830310822, -0.09883659332990646, -0.08640661835670471, -0.07397664338350296, -0.06154666841030121, -0.04911669343709946, -0.03668671473860741, -0.024256739765405655, -0.011826764792203903, 0.000603213906288147, 0.013033188879489899, 0.02546316385269165, 0.0378931388258934, 0.050323113799095154, 0.0627530962228775, 0.07518306374549866, 0.087613046169281, 0.10004302114248276, 0.11247299611568451, 0.12490297108888626, 0.137332946062088, 0.14976292848587036, 0.16219289600849152, 0.17462287843227386, 0.18705284595489502, 0.19948282837867737, 0.21191281080245972, 0.22434277832508087, 0.23677276074886322, 0.24920272827148438, 0.2616327106952667, 0.2740626931190491, 0.28649264574050903, 0.2989226281642914, 0.31135261058807373, 0.3237825930118561, 0.3362125754356384, 0.3486425578594208, 0.36107251048088074, 0.3735024929046631, 0.38593247532844543, 0.3983624577522278, 0.41079241037368774, 0.4232223927974701]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 6.0, 4.0, 9.0, 8.0, 20.0, 23.0, 28.0, 47.0, 50.0, 75.0, 118.0, 175.0, 274.0, 399.0, 613.0, 966.0, 1692.0, 2866.0, 5055.0, 9299.0, 18621.0, 43428.0, 146776.0, 519884.0, 198565.0, 53478.0, 21740.0, 10668.0, 5629.0, 3165.0, 1802.0, 1067.0, 708.0, 461.0, 275.0, 172.0, 113.0, 84.0, 62.0, 36.0, 23.0, 23.0, 13.0, 9.0, 10.0, 5.0, 3.0, 9.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.18212890625, -0.17552947998046875, -0.1689300537109375, -0.16233062744140625, -0.155731201171875, -0.14913177490234375, -0.1425323486328125, -0.13593292236328125, -0.12933349609375, -0.12273406982421875, -0.1161346435546875, -0.10953521728515625, -0.102935791015625, -0.09633636474609375, -0.0897369384765625, -0.08313751220703125, -0.0765380859375, -0.06993865966796875, -0.0633392333984375, -0.05673980712890625, -0.050140380859375, -0.04354095458984375, -0.0369415283203125, -0.03034210205078125, -0.02374267578125, -0.01714324951171875, -0.0105438232421875, -0.00394439697265625, 0.002655029296875, 0.00925445556640625, 0.0158538818359375, 0.02245330810546875, 0.029052734375, 0.03565216064453125, 0.0422515869140625, 0.04885101318359375, 0.055450439453125, 0.06204986572265625, 0.0686492919921875, 0.07524871826171875, 0.08184814453125, 0.08844757080078125, 0.0950469970703125, 0.10164642333984375, 0.108245849609375, 0.11484527587890625, 0.1214447021484375, 0.12804412841796875, 0.1346435546875, 0.14124298095703125, 0.1478424072265625, 0.15444183349609375, 0.161041259765625, 0.16764068603515625, 0.1742401123046875, 0.18083953857421875, 0.18743896484375, 0.19403839111328125, 0.2006378173828125, 0.20723724365234375, 0.213836669921875, 0.22043609619140625, 0.2270355224609375, 0.23363494873046875, 0.240234375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 4.0, 5.0, 9.0, 6.0, 8.0, 17.0, 23.0, 23.0, 22.0, 33.0, 36.0, 47.0, 54.0, 57.0, 61.0, 60.0, 78.0, 61.0, 59.0, 52.0, 61.0, 48.0, 39.0, 35.0, 35.0, 24.0, 9.0, 11.0, 9.0, 5.0, 7.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26025390625, -0.2511138916015625, -0.241973876953125, -0.2328338623046875, -0.22369384765625, -0.2145538330078125, -0.205413818359375, -0.1962738037109375, -0.1871337890625, -0.1779937744140625, -0.168853759765625, -0.1597137451171875, -0.15057373046875, -0.1414337158203125, -0.132293701171875, -0.1231536865234375, -0.114013671875, -0.1048736572265625, -0.095733642578125, -0.0865936279296875, -0.07745361328125, -0.0683135986328125, -0.059173583984375, -0.0500335693359375, -0.0408935546875, -0.0317535400390625, -0.022613525390625, -0.0134735107421875, -0.00433349609375, 0.0048065185546875, 0.013946533203125, 0.0230865478515625, 0.0322265625, 0.0413665771484375, 0.050506591796875, 0.0596466064453125, 0.06878662109375, 0.0779266357421875, 0.087066650390625, 0.0962066650390625, 0.1053466796875, 0.1144866943359375, 0.123626708984375, 0.1327667236328125, 0.14190673828125, 0.1510467529296875, 0.160186767578125, 0.1693267822265625, 0.178466796875, 0.1876068115234375, 0.196746826171875, 0.2058868408203125, 0.21502685546875, 0.2241668701171875, 0.233306884765625, 0.2424468994140625, 0.2515869140625, 0.2607269287109375, 0.269866943359375, 0.2790069580078125, 0.28814697265625, 0.2972869873046875, 0.306427001953125, 0.3155670166015625, 0.32470703125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 2.0, 8.0, 2.0, 10.0, 23.0, 33.0, 45.0, 74.0, 154.0, 323.0, 810.0, 2030.0, 6321.0, 23856.0, 152287.0, 737888.0, 98991.0, 17819.0, 5017.0, 1637.0, 600.0, 282.0, 134.0, 63.0, 41.0, 26.0, 20.0, 12.0, 11.0, 11.0, 3.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.265625, -0.256591796875, -0.24755859375, -0.238525390625, -0.2294921875, -0.220458984375, -0.21142578125, -0.202392578125, -0.193359375, -0.184326171875, -0.17529296875, -0.166259765625, -0.1572265625, -0.148193359375, -0.13916015625, -0.130126953125, -0.12109375, -0.112060546875, -0.10302734375, -0.093994140625, -0.0849609375, -0.075927734375, -0.06689453125, -0.057861328125, -0.048828125, -0.039794921875, -0.03076171875, -0.021728515625, -0.0126953125, -0.003662109375, 0.00537109375, 0.014404296875, 0.0234375, 0.032470703125, 0.04150390625, 0.050537109375, 0.0595703125, 0.068603515625, 0.07763671875, 0.086669921875, 0.095703125, 0.104736328125, 0.11376953125, 0.122802734375, 0.1318359375, 0.140869140625, 0.14990234375, 0.158935546875, 0.16796875, 0.177001953125, 0.18603515625, 0.195068359375, 0.2041015625, 0.213134765625, 0.22216796875, 0.231201171875, 0.240234375, 0.249267578125, 0.25830078125, 0.267333984375, 0.2763671875, 0.285400390625, 0.29443359375, 0.303466796875, 0.3125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 8.0, 5.0, 8.0, 26.0, 16.0, 31.0, 30.0, 25.0, 44.0, 42.0, 49.0, 48.0, 58.0, 67.0, 70.0, 55.0, 62.0, 43.0, 43.0, 42.0, 36.0, 46.0, 36.0, 26.0, 19.0, 12.0, 12.0, 8.0, 10.0, 9.0, 3.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.50390625, -0.488800048828125, -0.47369384765625, -0.458587646484375, -0.4434814453125, -0.428375244140625, -0.41326904296875, -0.398162841796875, -0.383056640625, -0.367950439453125, -0.35284423828125, -0.337738037109375, -0.3226318359375, -0.307525634765625, -0.29241943359375, -0.277313232421875, -0.26220703125, -0.247100830078125, -0.23199462890625, -0.216888427734375, -0.2017822265625, -0.186676025390625, -0.17156982421875, -0.156463623046875, -0.141357421875, -0.126251220703125, -0.11114501953125, -0.096038818359375, -0.0809326171875, -0.065826416015625, -0.05072021484375, -0.035614013671875, -0.0205078125, -0.005401611328125, 0.00970458984375, 0.024810791015625, 0.0399169921875, 0.055023193359375, 0.07012939453125, 0.085235595703125, 0.100341796875, 0.115447998046875, 0.13055419921875, 0.145660400390625, 0.1607666015625, 0.175872802734375, 0.19097900390625, 0.206085205078125, 0.22119140625, 0.236297607421875, 0.25140380859375, 0.266510009765625, 0.2816162109375, 0.296722412109375, 0.31182861328125, 0.326934814453125, 0.342041015625, 0.357147216796875, 0.37225341796875, 0.387359619140625, 0.4024658203125, 0.417572021484375, 0.43267822265625, 0.447784423828125, 0.462890625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 6.0, 16.0, 17.0, 33.0, 31.0, 42.0, 69.0, 97.0, 158.0, 221.0, 370.0, 616.0, 1136.0, 2112.0, 4125.0, 8627.0, 21913.0, 77474.0, 462809.0, 369217.0, 64244.0, 19250.0, 7884.0, 3692.0, 1825.0, 974.0, 562.0, 347.0, 249.0, 128.0, 84.0, 51.0, 51.0, 26.0, 34.0, 16.0, 9.0, 8.0, 3.0, 6.0, 8.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.046844482421875, -0.045330047607421875, -0.04381561279296875, -0.042301177978515625, -0.0407867431640625, -0.039272308349609375, -0.03775787353515625, -0.036243438720703125, -0.03472900390625, -0.033214569091796875, -0.03170013427734375, -0.030185699462890625, -0.0286712646484375, -0.027156829833984375, -0.02564239501953125, -0.024127960205078125, -0.022613525390625, -0.021099090576171875, -0.01958465576171875, -0.018070220947265625, -0.0165557861328125, -0.015041351318359375, -0.01352691650390625, -0.012012481689453125, -0.010498046875, -0.008983612060546875, -0.00746917724609375, -0.005954742431640625, -0.0044403076171875, -0.002925872802734375, -0.00141143798828125, 0.000102996826171875, 0.001617431640625, 0.003131866455078125, 0.00464630126953125, 0.006160736083984375, 0.0076751708984375, 0.009189605712890625, 0.01070404052734375, 0.012218475341796875, 0.01373291015625, 0.015247344970703125, 0.01676177978515625, 0.018276214599609375, 0.0197906494140625, 0.021305084228515625, 0.02281951904296875, 0.024333953857421875, 0.025848388671875, 0.027362823486328125, 0.02887725830078125, 0.030391693115234375, 0.0319061279296875, 0.033420562744140625, 0.03493499755859375, 0.036449432373046875, 0.0379638671875, 0.039478302001953125, 0.04099273681640625, 0.042507171630859375, 0.0440216064453125, 0.045536041259765625, 0.04705047607421875, 0.048564910888671875, 0.050079345703125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 7.0, 9.0, 20.0, 24.0, 38.0, 70.0, 106.0, 157.0, 174.0, 140.0, 82.0, 66.0, 27.0, 14.0, 16.0, 10.0, 6.0, 8.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.029273986816406e-05, -3.904476761817932e-05, -3.779679536819458e-05, -3.654882311820984e-05, -3.53008508682251e-05, -3.4052878618240356e-05, -3.2804906368255615e-05, -3.1556934118270874e-05, -3.0308961868286133e-05, -2.906098961830139e-05, -2.781301736831665e-05, -2.656504511833191e-05, -2.5317072868347168e-05, -2.4069100618362427e-05, -2.2821128368377686e-05, -2.1573156118392944e-05, -2.0325183868408203e-05, -1.9077211618423462e-05, -1.782923936843872e-05, -1.658126711845398e-05, -1.5333294868469238e-05, -1.4085322618484497e-05, -1.2837350368499756e-05, -1.1589378118515015e-05, -1.0341405868530273e-05, -9.093433618545532e-06, -7.845461368560791e-06, -6.59748911857605e-06, -5.349516868591309e-06, -4.101544618606567e-06, -2.853572368621826e-06, -1.605600118637085e-06, -3.5762786865234375e-07, 8.903443813323975e-07, 2.1383166313171387e-06, 3.38628888130188e-06, 4.634261131286621e-06, 5.882233381271362e-06, 7.1302056312561035e-06, 8.378177881240845e-06, 9.626150131225586e-06, 1.0874122381210327e-05, 1.2122094631195068e-05, 1.337006688117981e-05, 1.461803913116455e-05, 1.5866011381149292e-05, 1.7113983631134033e-05, 1.8361955881118774e-05, 1.9609928131103516e-05, 2.0857900381088257e-05, 2.2105872631072998e-05, 2.335384488105774e-05, 2.460181713104248e-05, 2.584978938102722e-05, 2.7097761631011963e-05, 2.8345733880996704e-05, 2.9593706130981445e-05, 3.0841678380966187e-05, 3.208965063095093e-05, 3.333762288093567e-05, 3.458559513092041e-05, 3.583356738090515e-05, 3.708153963088989e-05, 3.8329511880874634e-05, 3.9577484130859375e-05]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 9.0, 7.0, 18.0, 27.0, 60.0, 127.0, 316.0, 1329.0, 8343.0, 139053.0, 865889.0, 29092.0, 3271.0, 610.0, 203.0, 85.0, 40.0, 29.0, 15.0, 11.0, 3.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1500244140625, -0.14577007293701172, -0.14151573181152344, -0.13726139068603516, -0.13300704956054688, -0.1287527084350586, -0.12449836730957031, -0.12024402618408203, -0.11598968505859375, -0.11173534393310547, -0.10748100280761719, -0.1032266616821289, -0.09897232055664062, -0.09471797943115234, -0.09046363830566406, -0.08620929718017578, -0.0819549560546875, -0.07770061492919922, -0.07344627380371094, -0.06919193267822266, -0.06493759155273438, -0.060683250427246094, -0.05642890930175781, -0.05217456817626953, -0.04792022705078125, -0.04366588592529297, -0.03941154479980469, -0.035157203674316406, -0.030902862548828125, -0.026648521423339844, -0.022394180297851562, -0.01813983917236328, -0.013885498046875, -0.009631156921386719, -0.0053768157958984375, -0.0011224746704101562, 0.003131866455078125, 0.007386207580566406, 0.011640548706054688, 0.01589488983154297, 0.02014923095703125, 0.02440357208251953, 0.028657913208007812, 0.032912254333496094, 0.037166595458984375, 0.041420936584472656, 0.04567527770996094, 0.04992961883544922, 0.0541839599609375, 0.05843830108642578, 0.06269264221191406, 0.06694698333740234, 0.07120132446289062, 0.0754556655883789, 0.07971000671386719, 0.08396434783935547, 0.08821868896484375, 0.09247303009033203, 0.09672737121582031, 0.1009817123413086, 0.10523605346679688, 0.10949039459228516, 0.11374473571777344, 0.11799907684326172, 0.12225341796875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 5.0, 1.0, 3.0, 3.0, 5.0, 5.0, 10.0, 9.0, 9.0, 18.0, 15.0, 10.0, 23.0, 40.0, 24.0, 48.0, 46.0, 55.0, 75.0, 70.0, 73.0, 72.0, 69.0, 44.0, 45.0, 40.0, 29.0, 25.0, 30.0, 16.0, 19.0, 18.0, 13.0, 5.0, 8.0, 3.0, 3.0, 5.0, 3.0, 1.0, 4.0, 0.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.01088714599609375, -0.010561227798461914, -0.010235309600830078, -0.009909391403198242, -0.009583473205566406, -0.00925755500793457, -0.008931636810302734, -0.008605718612670898, -0.008279800415039062, -0.007953882217407227, -0.007627964019775391, -0.007302045822143555, -0.006976127624511719, -0.006650209426879883, -0.006324291229248047, -0.005998373031616211, -0.005672454833984375, -0.005346536636352539, -0.005020618438720703, -0.004694700241088867, -0.004368782043457031, -0.004042863845825195, -0.0037169456481933594, -0.0033910274505615234, -0.0030651092529296875, -0.0027391910552978516, -0.0024132728576660156, -0.0020873546600341797, -0.0017614364624023438, -0.0014355182647705078, -0.0011096000671386719, -0.0007836818695068359, -0.000457763671875, -0.00013184547424316406, 0.00019407272338867188, 0.0005199909210205078, 0.0008459091186523438, 0.0011718273162841797, 0.0014977455139160156, 0.0018236637115478516, 0.0021495819091796875, 0.0024755001068115234, 0.0028014183044433594, 0.0031273365020751953, 0.0034532546997070312, 0.003779172897338867, 0.004105091094970703, 0.004431009292602539, 0.004756927490234375, 0.005082845687866211, 0.005408763885498047, 0.005734682083129883, 0.006060600280761719, 0.006386518478393555, 0.006712436676025391, 0.0070383548736572266, 0.0073642730712890625, 0.0076901912689208984, 0.008016109466552734, 0.00834202766418457, 0.008667945861816406, 0.008993864059448242, 0.009319782257080078, 0.009645700454711914, 0.00997161865234375]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 12.0, 11.0, 14.0, 13.0, 21.0, 24.0, 45.0, 55.0, 72.0, 112.0, 113.0, 129.0, 107.0, 64.0, 41.0, 47.0, 31.0, 21.0, 16.0, 9.0, 8.0, 5.0, 8.0, 2.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3130538761615753, -0.30230289697647095, -0.29155194759368896, -0.2808009684085846, -0.2700500190258026, -0.25929903984069824, -0.24854807555675507, -0.2377971112728119, -0.2270461469888687, -0.21629518270492554, -0.20554421842098236, -0.19479325413703918, -0.18404227495193481, -0.17329132556915283, -0.16254034638404846, -0.15178938210010529, -0.1410384178161621, -0.13028745353221893, -0.11953648924827576, -0.10878551751375198, -0.09803455322980881, -0.08728358894586563, -0.07653261721134186, -0.06578165292739868, -0.055030688643455505, -0.04427972435951233, -0.033528756350278854, -0.02277778834104538, -0.012026824057102203, -0.001275859773159027, 0.009475111961364746, 0.020226076245307922, 0.03097701072692871, 0.04172797501087189, 0.05247894302010536, 0.06322991102933884, 0.07398087531328201, 0.08473183959722519, 0.09548281133174896, 0.10623377561569214, 0.11698473989963531, 0.1277357041835785, 0.13848666846752167, 0.14923763275146484, 0.1599886119365692, 0.1707395613193512, 0.18149054050445557, 0.19224150478839874, 0.20299246907234192, 0.2137434333562851, 0.22449439764022827, 0.23524537682533264, 0.24599632620811462, 0.256747305393219, 0.267498254776001, 0.27824923396110535, 0.2890002131462097, 0.2997511923313141, 0.31050214171409607, 0.32125312089920044, 0.3320040702819824, 0.3427550494670868, 0.35350602865219116, 0.36425697803497314, 0.3750079274177551]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 9.0, 11.0, 10.0, 21.0, 10.0, 20.0, 20.0, 35.0, 21.0, 39.0, 52.0, 51.0, 61.0, 52.0, 47.0, 70.0, 65.0, 67.0, 47.0, 48.0, 46.0, 43.0, 31.0, 29.0, 23.0, 24.0, 9.0, 13.0, 8.0, 8.0, 4.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23378704488277435, -0.2255488783121109, -0.21731069684028625, -0.2090725302696228, -0.20083436369895935, -0.1925961971282959, -0.18435801565647125, -0.1761198490858078, -0.16788166761398315, -0.1596435010433197, -0.15140531957149506, -0.1431671530008316, -0.13492898643016815, -0.1266908049583435, -0.11845263838768005, -0.1102144718170166, -0.10197630524635315, -0.0937381312251091, -0.08549996465444565, -0.0772617906332016, -0.06902362406253815, -0.0607854500412941, -0.05254727602005005, -0.0443091057240963, -0.03607093542814255, -0.027832765132188797, -0.019594592973589897, -0.011356420814990997, -0.0031182505190372467, 0.005119919776916504, 0.013358093798160553, 0.021596264094114304, 0.029834449291229248, 0.038072619587183, 0.04631078988313675, 0.0545489639043808, 0.06278713047504425, 0.0710253044962883, 0.07926347851753235, 0.0875016450881958, 0.09573981910943985, 0.1039779931306839, 0.11221615970134735, 0.1204543337225914, 0.12869250774383545, 0.1369306743144989, 0.14516884088516235, 0.153407022356987, 0.16164518892765045, 0.1698833554983139, 0.17812153697013855, 0.186359703540802, 0.19459787011146545, 0.2028360366821289, 0.21107421815395355, 0.219312384724617, 0.22755056619644165, 0.2357887327671051, 0.24402691423892975, 0.2522650957107544, 0.26050326228141785, 0.2687414288520813, 0.27697959542274475, 0.2852177619934082, 0.29345592856407166]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 2.0, 9.0, 6.0, 13.0, 22.0, 36.0, 37.0, 58.0, 94.0, 140.0, 195.0, 277.0, 422.0, 728.0, 1172.0, 1996.0, 3694.0, 7413.0, 16022.0, 39532.0, 115221.0, 402043.0, 311053.0, 88605.0, 32041.0, 13562.0, 6249.0, 3267.0, 1805.0, 1009.0, 592.0, 428.0, 257.0, 167.0, 103.0, 73.0, 63.0, 43.0, 40.0, 23.0, 9.0, 11.0, 6.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10504150390625, -0.10164070129394531, -0.09823989868164062, -0.09483909606933594, -0.09143829345703125, -0.08803749084472656, -0.08463668823242188, -0.08123588562011719, -0.0778350830078125, -0.07443428039550781, -0.07103347778320312, -0.06763267517089844, -0.06423187255859375, -0.06083106994628906, -0.057430267333984375, -0.05402946472167969, -0.050628662109375, -0.04722785949707031, -0.043827056884765625, -0.04042625427246094, -0.03702545166015625, -0.03362464904785156, -0.030223846435546875, -0.026823043823242188, -0.0234222412109375, -0.020021438598632812, -0.016620635986328125, -0.013219833374023438, -0.00981903076171875, -0.0064182281494140625, -0.003017425537109375, 0.0003833770751953125, 0.0037841796875, 0.0071849822998046875, 0.010585784912109375, 0.013986587524414062, 0.01738739013671875, 0.020788192749023438, 0.024188995361328125, 0.027589797973632812, 0.0309906005859375, 0.03439140319824219, 0.037792205810546875, 0.04119300842285156, 0.04459381103515625, 0.04799461364746094, 0.051395416259765625, 0.05479621887207031, 0.058197021484375, 0.06159782409667969, 0.06499862670898438, 0.06839942932128906, 0.07180023193359375, 0.07520103454589844, 0.07860183715820312, 0.08200263977050781, 0.0854034423828125, 0.08880424499511719, 0.09220504760742188, 0.09560585021972656, 0.09900665283203125, 0.10240745544433594, 0.10580825805664062, 0.10920906066894531, 0.11260986328125]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 6.0, 2.0, 6.0, 7.0, 5.0, 11.0, 17.0, 18.0, 27.0, 14.0, 29.0, 31.0, 36.0, 37.0, 47.0, 47.0, 49.0, 36.0, 50.0, 63.0, 63.0, 61.0, 53.0, 52.0, 27.0, 37.0, 27.0, 27.0, 21.0, 16.0, 14.0, 14.0, 13.0, 7.0, 8.0, 10.0, 2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.62158203125, -0.603240966796875, -0.58489990234375, -0.566558837890625, -0.5482177734375, -0.529876708984375, -0.51153564453125, -0.493194580078125, -0.474853515625, -0.456512451171875, -0.43817138671875, -0.419830322265625, -0.4014892578125, -0.383148193359375, -0.36480712890625, -0.346466064453125, -0.328125, -0.309783935546875, -0.29144287109375, -0.273101806640625, -0.2547607421875, -0.236419677734375, -0.21807861328125, -0.199737548828125, -0.181396484375, -0.163055419921875, -0.14471435546875, -0.126373291015625, -0.1080322265625, -0.089691162109375, -0.07135009765625, -0.053009033203125, -0.03466796875, -0.016326904296875, 0.00201416015625, 0.020355224609375, 0.0386962890625, 0.057037353515625, 0.07537841796875, 0.093719482421875, 0.112060546875, 0.130401611328125, 0.14874267578125, 0.167083740234375, 0.1854248046875, 0.203765869140625, 0.22210693359375, 0.240447998046875, 0.2587890625, 0.277130126953125, 0.29547119140625, 0.313812255859375, 0.3321533203125, 0.350494384765625, 0.36883544921875, 0.387176513671875, 0.405517578125, 0.423858642578125, 0.44219970703125, 0.460540771484375, 0.4788818359375, 0.497222900390625, 0.51556396484375, 0.533905029296875, 0.55224609375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 2.0, 9.0, 10.0, 10.0, 6.0, 20.0, 21.0, 25.0, 31.0, 23.0, 29.0, 37.0, 26.0, 37.0, 43.0, 48.0, 67.0, 374.0, 1043886.0, 3353.0, 78.0, 45.0, 35.0, 42.0, 45.0, 35.0, 29.0, 30.0, 23.0, 16.0, 20.0, 19.0, 15.0, 7.0, 9.0, 7.0, 9.0, 8.0, 5.0, 7.0, 3.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0], "bins": [-2.23828125, -2.171844482421875, -2.10540771484375, -2.038970947265625, -1.9725341796875, -1.906097412109375, -1.83966064453125, -1.773223876953125, -1.706787109375, -1.640350341796875, -1.57391357421875, -1.507476806640625, -1.4410400390625, -1.374603271484375, -1.30816650390625, -1.241729736328125, -1.17529296875, -1.108856201171875, -1.04241943359375, -0.975982666015625, -0.9095458984375, -0.843109130859375, -0.77667236328125, -0.710235595703125, -0.643798828125, -0.577362060546875, -0.51092529296875, -0.444488525390625, -0.3780517578125, -0.311614990234375, -0.24517822265625, -0.178741455078125, -0.1123046875, -0.045867919921875, 0.02056884765625, 0.087005615234375, 0.1534423828125, 0.219879150390625, 0.28631591796875, 0.352752685546875, 0.419189453125, 0.485626220703125, 0.55206298828125, 0.618499755859375, 0.6849365234375, 0.751373291015625, 0.81781005859375, 0.884246826171875, 0.95068359375, 1.017120361328125, 1.08355712890625, 1.149993896484375, 1.2164306640625, 1.282867431640625, 1.34930419921875, 1.415740966796875, 1.482177734375, 1.548614501953125, 1.61505126953125, 1.681488037109375, 1.7479248046875, 1.814361572265625, 1.88079833984375, 1.947235107421875, 2.013671875]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 3.0, 10.0, 11.0, 9.0, 10.0, 21.0, 23.0, 30.0, 28.0, 28.0, 42.0, 28.0, 34.0, 37.0, 51.0, 43.0, 41.0, 56.0, 50.0, 32.0, 42.0, 30.0, 38.0, 42.0, 36.0, 44.0, 22.0, 21.0, 17.0, 14.0, 21.0, 10.0, 11.0, 13.0, 11.0, 4.0, 4.0, 7.0, 8.0, 4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0], "bins": [-0.54345703125, -0.5277862548828125, -0.512115478515625, -0.4964447021484375, -0.48077392578125, -0.4651031494140625, -0.449432373046875, -0.4337615966796875, -0.4180908203125, -0.4024200439453125, -0.386749267578125, -0.3710784912109375, -0.35540771484375, -0.3397369384765625, -0.324066162109375, -0.3083953857421875, -0.292724609375, -0.2770538330078125, -0.261383056640625, -0.2457122802734375, -0.23004150390625, -0.2143707275390625, -0.198699951171875, -0.1830291748046875, -0.1673583984375, -0.1516876220703125, -0.136016845703125, -0.1203460693359375, -0.10467529296875, -0.0890045166015625, -0.073333740234375, -0.0576629638671875, -0.0419921875, -0.0263214111328125, -0.010650634765625, 0.0050201416015625, 0.02069091796875, 0.0363616943359375, 0.052032470703125, 0.0677032470703125, 0.0833740234375, 0.0990447998046875, 0.114715576171875, 0.1303863525390625, 0.14605712890625, 0.1617279052734375, 0.177398681640625, 0.1930694580078125, 0.208740234375, 0.2244110107421875, 0.240081787109375, 0.2557525634765625, 0.27142333984375, 0.2870941162109375, 0.302764892578125, 0.3184356689453125, 0.3341064453125, 0.3497772216796875, 0.365447998046875, 0.3811187744140625, 0.39678955078125, 0.4124603271484375, 0.428131103515625, 0.4438018798828125, 0.45947265625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 7.0, 4.0, 3.0, 8.0, 5.0, 17.0, 16.0, 37.0, 52.0, 149.0, 320.0, 1250.0, 11520.0, 952338.0, 78973.0, 2863.0, 557.0, 179.0, 102.0, 46.0, 37.0, 20.0, 13.0, 8.0, 6.0, 5.0, 6.0, 5.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1253662109375, -0.11932182312011719, -0.11327743530273438, -0.10723304748535156, -0.10118865966796875, -0.09514427185058594, -0.08909988403320312, -0.08305549621582031, -0.0770111083984375, -0.07096672058105469, -0.06492233276367188, -0.05887794494628906, -0.05283355712890625, -0.04678916931152344, -0.040744781494140625, -0.03470039367675781, -0.028656005859375, -0.022611618041992188, -0.016567230224609375, -0.010522842407226562, -0.00447845458984375, 0.0015659332275390625, 0.007610321044921875, 0.013654708862304688, 0.0196990966796875, 0.025743484497070312, 0.031787872314453125, 0.03783226013183594, 0.04387664794921875, 0.04992103576660156, 0.055965423583984375, 0.06200981140136719, 0.06805419921875, 0.07409858703613281, 0.08014297485351562, 0.08618736267089844, 0.09223175048828125, 0.09827613830566406, 0.10432052612304688, 0.11036491394042969, 0.1164093017578125, 0.12245368957519531, 0.12849807739257812, 0.13454246520996094, 0.14058685302734375, 0.14663124084472656, 0.15267562866210938, 0.1587200164794922, 0.164764404296875, 0.1708087921142578, 0.17685317993164062, 0.18289756774902344, 0.18894195556640625, 0.19498634338378906, 0.20103073120117188, 0.2070751190185547, 0.2131195068359375, 0.2191638946533203, 0.22520828247070312, 0.23125267028808594, 0.23729705810546875, 0.24334144592285156, 0.24938583374023438, 0.2554302215576172, 0.261474609375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 9.0, 5.0, 3.0, 3.0, 7.0, 10.0, 7.0, 11.0, 26.0, 31.0, 30.0, 49.0, 66.0, 111.0, 129.0, 137.0, 104.0, 81.0, 48.0, 35.0, 30.0, 18.0, 10.0, 7.0, 8.0, 3.0, 7.0, 4.0, 1.0, 3.0, 4.0, 5.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.0311603546142578e-05, -1.0007061064243317e-05, -9.702518582344055e-06, -9.397976100444794e-06, -9.093433618545532e-06, -8.78889113664627e-06, -8.48434865474701e-06, -8.179806172847748e-06, -7.875263690948486e-06, -7.570721209049225e-06, -7.266178727149963e-06, -6.961636245250702e-06, -6.6570937633514404e-06, -6.352551281452179e-06, -6.0480087995529175e-06, -5.743466317653656e-06, -5.4389238357543945e-06, -5.134381353855133e-06, -4.829838871955872e-06, -4.52529639005661e-06, -4.220753908157349e-06, -3.916211426258087e-06, -3.6116689443588257e-06, -3.307126462459564e-06, -3.0025839805603027e-06, -2.6980414986610413e-06, -2.3934990167617798e-06, -2.0889565348625183e-06, -1.7844140529632568e-06, -1.4798715710639954e-06, -1.1753290891647339e-06, -8.707866072654724e-07, -5.662441253662109e-07, -2.6170164346694946e-07, 4.284083843231201e-08, 3.473833203315735e-07, 6.51925802230835e-07, 9.564682841300964e-07, 1.261010766029358e-06, 1.5655532479286194e-06, 1.8700957298278809e-06, 2.1746382117271423e-06, 2.479180693626404e-06, 2.7837231755256653e-06, 3.0882656574249268e-06, 3.3928081393241882e-06, 3.6973506212234497e-06, 4.001893103122711e-06, 4.306435585021973e-06, 4.610978066921234e-06, 4.915520548820496e-06, 5.220063030719757e-06, 5.5246055126190186e-06, 5.82914799451828e-06, 6.1336904764175415e-06, 6.438232958316803e-06, 6.7427754402160645e-06, 7.047317922115326e-06, 7.351860404014587e-06, 7.656402885913849e-06, 7.96094536781311e-06, 8.265487849712372e-06, 8.570030331611633e-06, 8.874572813510895e-06, 9.179115295410156e-06]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 7.0, 7.0, 6.0, 18.0, 10.0, 24.0, 45.0, 67.0, 107.0, 203.0, 442.0, 921.0, 2390.0, 7765.0, 40146.0, 751812.0, 215915.0, 20373.0, 4933.0, 1802.0, 714.0, 370.0, 207.0, 107.0, 58.0, 36.0, 23.0, 12.0, 10.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.1103515625, -0.10735416412353516, -0.10435676574707031, -0.10135936737060547, -0.09836196899414062, -0.09536457061767578, -0.09236717224121094, -0.0893697738647461, -0.08637237548828125, -0.0833749771118164, -0.08037757873535156, -0.07738018035888672, -0.07438278198242188, -0.07138538360595703, -0.06838798522949219, -0.06539058685302734, -0.0623931884765625, -0.059395790100097656, -0.05639839172363281, -0.05340099334716797, -0.050403594970703125, -0.04740619659423828, -0.04440879821777344, -0.041411399841308594, -0.03841400146484375, -0.035416603088378906, -0.03241920471191406, -0.02942180633544922, -0.026424407958984375, -0.02342700958251953, -0.020429611206054688, -0.017432212829589844, -0.014434814453125, -0.011437416076660156, -0.008440017700195312, -0.005442619323730469, -0.002445220947265625, 0.0005521774291992188, 0.0035495758056640625, 0.006546974182128906, 0.00954437255859375, 0.012541770935058594, 0.015539169311523438, 0.01853656768798828, 0.021533966064453125, 0.02453136444091797, 0.027528762817382812, 0.030526161193847656, 0.0335235595703125, 0.036520957946777344, 0.03951835632324219, 0.04251575469970703, 0.045513153076171875, 0.04851055145263672, 0.05150794982910156, 0.054505348205566406, 0.05750274658203125, 0.060500144958496094, 0.06349754333496094, 0.06649494171142578, 0.06949234008789062, 0.07248973846435547, 0.07548713684082031, 0.07848453521728516, 0.08148193359375]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 7.0, 4.0, 7.0, 5.0, 4.0, 13.0, 19.0, 24.0, 18.0, 32.0, 64.0, 99.0, 104.0, 209.0, 114.0, 92.0, 58.0, 34.0, 27.0, 23.0, 14.0, 5.0, 10.0, 6.0, 5.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.021820068359375, -0.020803451538085938, -0.019786834716796875, -0.018770217895507812, -0.01775360107421875, -0.016736984252929688, -0.015720367431640625, -0.014703750610351562, -0.0136871337890625, -0.012670516967773438, -0.011653900146484375, -0.010637283325195312, -0.00962066650390625, -0.008604049682617188, -0.007587432861328125, -0.0065708160400390625, -0.00555419921875, -0.0045375823974609375, -0.003520965576171875, -0.0025043487548828125, -0.00148773193359375, -0.0004711151123046875, 0.000545501708984375, 0.0015621185302734375, 0.0025787353515625, 0.0035953521728515625, 0.004611968994140625, 0.0056285858154296875, 0.00664520263671875, 0.0076618194580078125, 0.008678436279296875, 0.009695053100585938, 0.010711669921875, 0.011728286743164062, 0.012744903564453125, 0.013761520385742188, 0.01477813720703125, 0.015794754028320312, 0.016811370849609375, 0.017827987670898438, 0.0188446044921875, 0.019861221313476562, 0.020877838134765625, 0.021894454956054688, 0.02291107177734375, 0.023927688598632812, 0.024944305419921875, 0.025960922241210938, 0.0269775390625, 0.027994155883789062, 0.029010772705078125, 0.030027389526367188, 0.03104400634765625, 0.03206062316894531, 0.033077239990234375, 0.03409385681152344, 0.0351104736328125, 0.03612709045410156, 0.037143707275390625, 0.03816032409667969, 0.03917694091796875, 0.04019355773925781, 0.041210174560546875, 0.04222679138183594, 0.043243408203125]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 9.0, 30.0, 63.0, 198.0, 349.0, 213.0, 82.0, 30.0, 18.0, 4.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.687655448913574, -2.624556064605713, -2.5614569187164307, -2.4983575344085693, -2.435258150100708, -2.372159004211426, -2.3090596199035645, -2.245960235595703, -2.182861089706421, -2.1197617053985596, -2.0566625595092773, -1.993563175201416, -1.9304639101028442, -1.8673646450042725, -1.8042652606964111, -1.7411659955978394, -1.678066611289978, -1.6149673461914062, -1.551867961883545, -1.4887686967849731, -1.4256694316864014, -1.36257004737854, -1.2994707822799683, -1.2363715171813965, -1.1732721328735352, -1.1101728677749634, -1.047073483467102, -0.9839742183685303, -0.9208749532699585, -0.8577756285667419, -0.7946763038635254, -0.7315770387649536, -0.6684778928756714, -0.6053785681724548, -0.5422793030738831, -0.4791799783706665, -0.41608068346977234, -0.3529813885688782, -0.2898820638656616, -0.22678276896476746, -0.1636834740638733, -0.10058417171239853, -0.03748486936092377, 0.025614440441131592, 0.08871373534202576, 0.15181303024291992, 0.21491235494613647, 0.27801164984703064, 0.3411109447479248, 0.40421023964881897, 0.46730953454971313, 0.5304088592529297, 0.5935081243515015, 0.656607449054718, 0.7197067737579346, 0.7828060388565063, 0.8459053635597229, 0.9090046882629395, 0.9721039533615112, 1.035203218460083, 1.0983026027679443, 1.1614018678665161, 1.224501132965088, 1.2876005172729492, 1.350699782371521]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 6.0, 4.0, 5.0, 11.0, 11.0, 12.0, 9.0, 20.0, 23.0, 27.0, 24.0, 26.0, 40.0, 38.0, 37.0, 37.0, 35.0, 53.0, 42.0, 48.0, 43.0, 48.0, 43.0, 48.0, 37.0, 32.0, 37.0, 26.0, 35.0, 20.0, 32.0, 24.0, 15.0, 16.0, 15.0, 8.0, 3.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8283340334892273, -0.8035085797309875, -0.7786831855773926, -0.7538577318191528, -0.7290323376655579, -0.7042068839073181, -0.6793814897537231, -0.6545560359954834, -0.6297305822372437, -0.6049051284790039, -0.5800797343254089, -0.5552542805671692, -0.5304288864135742, -0.5056034326553345, -0.4807780086994171, -0.45595258474349976, -0.4311271905899048, -0.4063017666339874, -0.38147634267807007, -0.3566508889198303, -0.33182549476623535, -0.3070000410079956, -0.28217461705207825, -0.2573491930961609, -0.23252376914024353, -0.20769834518432617, -0.1828729212284088, -0.15804748237133026, -0.1332220584154129, -0.10839663445949554, -0.08357119560241699, -0.058745771646499634, -0.033920347690582275, -0.009094920009374619, 0.01573050767183304, 0.040555939078330994, 0.06538136303424835, 0.09020678699016571, 0.11503222584724426, 0.13985764980316162, 0.16468307375907898, 0.18950849771499634, 0.2143339216709137, 0.23915936052799225, 0.2639847993850708, 0.28881019353866577, 0.3136356472969055, 0.3384610712528229, 0.36328649520874023, 0.3881119191646576, 0.41293734312057495, 0.4377627968788147, 0.46258819103240967, 0.4874136447906494, 0.5122390985488892, 0.5370644927024841, 0.5618898868560791, 0.5867153406143188, 0.6115407347679138, 0.6363661885261536, 0.6611915826797485, 0.6860170364379883, 0.710842490196228, 0.735667884349823, 0.7604933381080627]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 5.0, 5.0, 4.0, 9.0, 10.0, 15.0, 20.0, 21.0, 38.0, 38.0, 65.0, 106.0, 173.0, 271.0, 447.0, 826.0, 1448.0, 3037.0, 6493.0, 19750.0, 170285.0, 3270290.0, 668688.0, 34601.0, 9210.0, 3880.0, 1998.0, 1010.0, 605.0, 323.0, 226.0, 140.0, 82.0, 64.0, 35.0, 25.0, 14.0, 9.0, 6.0, 8.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7021484375, -0.67999267578125, -0.6578369140625, -0.63568115234375, -0.613525390625, -0.59136962890625, -0.5692138671875, -0.54705810546875, -0.52490234375, -0.50274658203125, -0.4805908203125, -0.45843505859375, -0.436279296875, -0.41412353515625, -0.3919677734375, -0.36981201171875, -0.34765625, -0.32550048828125, -0.3033447265625, -0.28118896484375, -0.259033203125, -0.23687744140625, -0.2147216796875, -0.19256591796875, -0.17041015625, -0.14825439453125, -0.1260986328125, -0.10394287109375, -0.081787109375, -0.05963134765625, -0.0374755859375, -0.01531982421875, 0.0068359375, 0.02899169921875, 0.0511474609375, 0.07330322265625, 0.095458984375, 0.11761474609375, 0.1397705078125, 0.16192626953125, 0.18408203125, 0.20623779296875, 0.2283935546875, 0.25054931640625, 0.272705078125, 0.29486083984375, 0.3170166015625, 0.33917236328125, 0.361328125, 0.38348388671875, 0.4056396484375, 0.42779541015625, 0.449951171875, 0.47210693359375, 0.4942626953125, 0.51641845703125, 0.53857421875, 0.56072998046875, 0.5828857421875, 0.60504150390625, 0.627197265625, 0.64935302734375, 0.6715087890625, 0.69366455078125, 0.7158203125]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 5.0, 5.0, 11.0, 6.0, 8.0, 13.0, 12.0, 14.0, 19.0, 17.0, 26.0, 31.0, 43.0, 42.0, 62.0, 56.0, 57.0, 65.0, 47.0, 67.0, 52.0, 51.0, 39.0, 33.0, 44.0, 42.0, 25.0, 27.0, 27.0, 14.0, 12.0, 7.0, 7.0, 6.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.302978515625, -0.2938880920410156, -0.28479766845703125, -0.2757072448730469, -0.2666168212890625, -0.2575263977050781, -0.24843597412109375, -0.23934555053710938, -0.230255126953125, -0.22116470336914062, -0.21207427978515625, -0.20298385620117188, -0.1938934326171875, -0.18480300903320312, -0.17571258544921875, -0.16662216186523438, -0.15753173828125, -0.14844131469726562, -0.13935089111328125, -0.13026046752929688, -0.1211700439453125, -0.11207962036132812, -0.10298919677734375, -0.09389877319335938, -0.084808349609375, -0.07571792602539062, -0.06662750244140625, -0.057537078857421875, -0.0484466552734375, -0.039356231689453125, -0.03026580810546875, -0.021175384521484375, -0.0120849609375, -0.002994537353515625, 0.00609588623046875, 0.015186309814453125, 0.0242767333984375, 0.033367156982421875, 0.04245758056640625, 0.051548004150390625, 0.060638427734375, 0.06972885131835938, 0.07881927490234375, 0.08790969848632812, 0.0970001220703125, 0.10609054565429688, 0.11518096923828125, 0.12427139282226562, 0.13336181640625, 0.14245223999023438, 0.15154266357421875, 0.16063308715820312, 0.1697235107421875, 0.17881393432617188, 0.18790435791015625, 0.19699478149414062, 0.206085205078125, 0.21517562866210938, 0.22426605224609375, 0.23335647583007812, 0.2424468994140625, 0.2515373229980469, 0.26062774658203125, 0.2697181701660156, 0.27880859375]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 4.0, 11.0, 9.0, 8.0, 6.0, 11.0, 19.0, 25.0, 29.0, 56.0, 101.0, 187.0, 657.0, 3553.0, 69914.0, 4088250.0, 28278.0, 2256.0, 488.0, 167.0, 75.0, 49.0, 39.0, 29.0, 11.0, 5.0, 9.0, 10.0, 5.0, 2.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4072265625, -1.3576507568359375, -1.308074951171875, -1.2584991455078125, -1.20892333984375, -1.1593475341796875, -1.109771728515625, -1.0601959228515625, -1.0106201171875, -0.9610443115234375, -0.911468505859375, -0.8618927001953125, -0.81231689453125, -0.7627410888671875, -0.713165283203125, -0.6635894775390625, -0.614013671875, -0.5644378662109375, -0.514862060546875, -0.4652862548828125, -0.41571044921875, -0.3661346435546875, -0.316558837890625, -0.2669830322265625, -0.2174072265625, -0.1678314208984375, -0.118255615234375, -0.0686798095703125, -0.01910400390625, 0.0304718017578125, 0.080047607421875, 0.1296234130859375, 0.17919921875, 0.2287750244140625, 0.278350830078125, 0.3279266357421875, 0.37750244140625, 0.4270782470703125, 0.476654052734375, 0.5262298583984375, 0.5758056640625, 0.6253814697265625, 0.674957275390625, 0.7245330810546875, 0.77410888671875, 0.8236846923828125, 0.873260498046875, 0.9228363037109375, 0.972412109375, 1.0219879150390625, 1.071563720703125, 1.1211395263671875, 1.17071533203125, 1.2202911376953125, 1.269866943359375, 1.3194427490234375, 1.3690185546875, 1.4185943603515625, 1.468170166015625, 1.5177459716796875, 1.56732177734375, 1.6168975830078125, 1.666473388671875, 1.7160491943359375, 1.765625]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 3.0, 6.0, 9.0, 7.0, 8.0, 14.0, 22.0, 31.0, 52.0, 49.0, 89.0, 165.0, 328.0, 624.0, 1000.0, 753.0, 386.0, 207.0, 92.0, 54.0, 49.0, 24.0, 16.0, 15.0, 12.0, 8.0, 5.0, 8.0, 10.0, 8.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.1834716796875, -0.17847251892089844, -0.17347335815429688, -0.1684741973876953, -0.16347503662109375, -0.1584758758544922, -0.15347671508789062, -0.14847755432128906, -0.1434783935546875, -0.13847923278808594, -0.13348007202148438, -0.1284809112548828, -0.12348175048828125, -0.11848258972167969, -0.11348342895507812, -0.10848426818847656, -0.103485107421875, -0.09848594665527344, -0.09348678588867188, -0.08848762512207031, -0.08348846435546875, -0.07848930358886719, -0.07349014282226562, -0.06849098205566406, -0.0634918212890625, -0.05849266052246094, -0.053493499755859375, -0.04849433898925781, -0.04349517822265625, -0.03849601745605469, -0.033496856689453125, -0.028497695922851562, -0.02349853515625, -0.018499374389648438, -0.013500213623046875, -0.008501052856445312, -0.00350189208984375, 0.0014972686767578125, 0.006496429443359375, 0.011495590209960938, 0.0164947509765625, 0.021493911743164062, 0.026493072509765625, 0.03149223327636719, 0.03649139404296875, 0.04149055480957031, 0.046489715576171875, 0.05148887634277344, 0.056488037109375, 0.06148719787597656, 0.06648635864257812, 0.07148551940917969, 0.07648468017578125, 0.08148384094238281, 0.08648300170898438, 0.09148216247558594, 0.0964813232421875, 0.10148048400878906, 0.10647964477539062, 0.11147880554199219, 0.11647796630859375, 0.12147712707519531, 0.12647628784179688, 0.13147544860839844, 0.136474609375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 5.0, 8.0, 7.0, 6.0, 17.0, 15.0, 32.0, 51.0, 67.0, 78.0, 109.0, 156.0, 116.0, 102.0, 67.0, 58.0, 42.0, 22.0, 21.0, 9.0, 6.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37770017981529236, -0.3595159947872162, -0.3413317799568176, -0.32314759492874146, -0.3049634099006653, -0.2867791950702667, -0.26859501004219055, -0.250410795211792, -0.23222661018371582, -0.21404241025447845, -0.1958582103252411, -0.17767402529716492, -0.15948982536792755, -0.14130562543869019, -0.12312143296003342, -0.10493724048137665, -0.08675304055213928, -0.06856884062290192, -0.05038464814424515, -0.03220045194029808, -0.014016255736351013, 0.0041679441928863525, 0.02235213667154312, 0.04053632915019989, 0.058720529079437256, 0.07690472900867462, 0.09508892148733139, 0.11327311396598816, 0.13145731389522552, 0.1496415138244629, 0.16782569885253906, 0.18600989878177643, 0.20419412851333618, 0.22237832844257355, 0.2405625283718109, 0.2587467133998871, 0.27693092823028564, 0.2951151132583618, 0.313299298286438, 0.33148348331451416, 0.3496676981449127, 0.3678518831729889, 0.38603609800338745, 0.4042202830314636, 0.4224044680595398, 0.44058868288993835, 0.4587728679180145, 0.4769570827484131, 0.49514126777648926, 0.5133254528045654, 0.5315096378326416, 0.5496938824653625, 0.5678780674934387, 0.5860622525215149, 0.6042464375495911, 0.6224306225776672, 0.6406148672103882, 0.6587990522384644, 0.6769832372665405, 0.6951674818992615, 0.7133516669273376, 0.7315358519554138, 0.74972003698349, 0.7679042220115662, 0.7860884070396423]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 8.0, 4.0, 4.0, 11.0, 13.0, 11.0, 9.0, 20.0, 21.0, 22.0, 38.0, 37.0, 43.0, 35.0, 32.0, 37.0, 50.0, 46.0, 44.0, 37.0, 44.0, 39.0, 34.0, 45.0, 42.0, 53.0, 30.0, 32.0, 27.0, 28.0, 20.0, 20.0, 9.0, 12.0, 14.0, 11.0, 7.0, 2.0, 3.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2518153488636017, -0.24294771254062653, -0.23408006131649017, -0.22521242499351501, -0.21634477376937866, -0.2074771374464035, -0.19860950112342834, -0.189741849899292, -0.18087421357631683, -0.17200657725334167, -0.16313892602920532, -0.15427128970623016, -0.145403653383255, -0.13653600215911865, -0.1276683658361435, -0.11880072206258774, -0.10993307828903198, -0.10106543451547623, -0.09219779074192047, -0.08333015441894531, -0.07446251064538956, -0.0655948668718338, -0.056727226823568344, -0.04785958677530289, -0.03899194300174713, -0.030124301090836525, -0.02125665917992592, -0.012389017269015312, -0.003521375358104706, 0.00534626841545105, 0.014213908463716507, 0.023081548511981964, 0.03194919228553772, 0.040816836059093475, 0.04968447610735893, 0.05855211615562439, 0.06741975992918015, 0.0762874037027359, 0.08515504002571106, 0.09402268379926682, 0.10289032757282257, 0.11175797134637833, 0.12062561511993408, 0.12949325144290924, 0.1383608877658844, 0.14722853899002075, 0.1560961753129959, 0.16496381163597107, 0.17383146286010742, 0.18269909918308258, 0.19156675040721893, 0.2004343867301941, 0.20930203795433044, 0.2181696742773056, 0.22703731060028076, 0.23590496182441711, 0.24477259814739227, 0.25364023447036743, 0.2625078856945038, 0.27137553691864014, 0.2802431583404541, 0.28911080956459045, 0.2979784607887268, 0.30684608221054077, 0.3157137334346771]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 11.0, 6.0, 17.0, 15.0, 37.0, 59.0, 109.0, 189.0, 389.0, 869.0, 2096.0, 6622.0, 27468.0, 383015.0, 583091.0, 32642.0, 7634.0, 2438.0, 976.0, 390.0, 180.0, 113.0, 71.0, 43.0, 27.0, 12.0, 12.0, 8.0, 11.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2381591796875, -0.22684669494628906, -0.21553421020507812, -0.2042217254638672, -0.19290924072265625, -0.1815967559814453, -0.17028427124023438, -0.15897178649902344, -0.1476593017578125, -0.13634681701660156, -0.12503433227539062, -0.11372184753417969, -0.10240936279296875, -0.09109687805175781, -0.07978439331054688, -0.06847190856933594, -0.057159423828125, -0.04584693908691406, -0.034534454345703125, -0.023221969604492188, -0.01190948486328125, -0.0005970001220703125, 0.010715484619140625, 0.022027969360351562, 0.0333404541015625, 0.04465293884277344, 0.055965423583984375, 0.06727790832519531, 0.07859039306640625, 0.08990287780761719, 0.10121536254882812, 0.11252784729003906, 0.12384033203125, 0.13515281677246094, 0.14646530151367188, 0.1577777862548828, 0.16909027099609375, 0.1804027557373047, 0.19171524047851562, 0.20302772521972656, 0.2143402099609375, 0.22565269470214844, 0.23696517944335938, 0.2482776641845703, 0.25959014892578125, 0.2709026336669922, 0.2822151184082031, 0.29352760314941406, 0.304840087890625, 0.31615257263183594, 0.3274650573730469, 0.3387775421142578, 0.35009002685546875, 0.3614025115966797, 0.3727149963378906, 0.38402748107910156, 0.3953399658203125, 0.40665245056152344, 0.4179649353027344, 0.4292774200439453, 0.44058990478515625, 0.4519023895263672, 0.4632148742675781, 0.47452735900878906, 0.48583984375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 2.0, 7.0, 5.0, 16.0, 14.0, 13.0, 39.0, 47.0, 61.0, 54.0, 71.0, 75.0, 78.0, 82.0, 69.0, 79.0, 78.0, 54.0, 39.0, 36.0, 32.0, 18.0, 16.0, 8.0, 6.0, 6.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1494140625, -0.14076614379882812, -0.13211822509765625, -0.12347030639648438, -0.1148223876953125, -0.10617446899414062, -0.09752655029296875, -0.08887863159179688, -0.080230712890625, -0.07158279418945312, -0.06293487548828125, -0.054286956787109375, -0.0456390380859375, -0.036991119384765625, -0.02834320068359375, -0.019695281982421875, -0.01104736328125, -0.002399444580078125, 0.00624847412109375, 0.014896392822265625, 0.0235443115234375, 0.032192230224609375, 0.04084014892578125, 0.049488067626953125, 0.058135986328125, 0.06678390502929688, 0.07543182373046875, 0.08407974243164062, 0.0927276611328125, 0.10137557983398438, 0.11002349853515625, 0.11867141723632812, 0.1273193359375, 0.13596725463867188, 0.14461517333984375, 0.15326309204101562, 0.1619110107421875, 0.17055892944335938, 0.17920684814453125, 0.18785476684570312, 0.196502685546875, 0.20515060424804688, 0.21379852294921875, 0.22244644165039062, 0.2310943603515625, 0.23974227905273438, 0.24839019775390625, 0.2570381164550781, 0.26568603515625, 0.2743339538574219, 0.28298187255859375, 0.2916297912597656, 0.3002777099609375, 0.3089256286621094, 0.31757354736328125, 0.3262214660644531, 0.334869384765625, 0.3435173034667969, 0.35216522216796875, 0.3608131408691406, 0.3694610595703125, 0.3781089782714844, 0.38675689697265625, 0.3954048156738281, 0.404052734375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 3.0, 7.0, 4.0, 4.0, 7.0, 15.0, 15.0, 17.0, 25.0, 53.0, 90.0, 140.0, 305.0, 643.0, 1651.0, 4650.0, 15976.0, 79999.0, 630864.0, 263139.0, 36709.0, 9221.0, 2919.0, 1129.0, 395.0, 230.0, 122.0, 61.0, 51.0, 30.0, 11.0, 11.0, 9.0, 8.0, 6.0, 6.0, 8.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1776123046875, -0.17235374450683594, -0.16709518432617188, -0.1618366241455078, -0.15657806396484375, -0.1513195037841797, -0.14606094360351562, -0.14080238342285156, -0.1355438232421875, -0.13028526306152344, -0.12502670288085938, -0.11976814270019531, -0.11450958251953125, -0.10925102233886719, -0.10399246215820312, -0.09873390197753906, -0.093475341796875, -0.08821678161621094, -0.08295822143554688, -0.07769966125488281, -0.07244110107421875, -0.06718254089355469, -0.061923980712890625, -0.05666542053222656, -0.0514068603515625, -0.04614830017089844, -0.040889739990234375, -0.03563117980957031, -0.03037261962890625, -0.025114059448242188, -0.019855499267578125, -0.014596939086914062, -0.00933837890625, -0.0040798187255859375, 0.001178741455078125, 0.0064373016357421875, 0.01169586181640625, 0.016954421997070312, 0.022212982177734375, 0.027471542358398438, 0.0327301025390625, 0.03798866271972656, 0.043247222900390625, 0.04850578308105469, 0.05376434326171875, 0.05902290344238281, 0.06428146362304688, 0.06954002380371094, 0.074798583984375, 0.08005714416503906, 0.08531570434570312, 0.09057426452636719, 0.09583282470703125, 0.10109138488769531, 0.10634994506835938, 0.11160850524902344, 0.1168670654296875, 0.12212562561035156, 0.12738418579101562, 0.1326427459716797, 0.13790130615234375, 0.1431598663330078, 0.14841842651367188, 0.15367698669433594, 0.158935546875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 5.0, 11.0, 6.0, 6.0, 6.0, 20.0, 16.0, 7.0, 19.0, 14.0, 28.0, 28.0, 36.0, 40.0, 40.0, 28.0, 47.0, 38.0, 43.0, 42.0, 48.0, 48.0, 57.0, 27.0, 48.0, 35.0, 38.0, 42.0, 37.0, 18.0, 25.0, 19.0, 17.0, 15.0, 13.0, 5.0, 8.0, 3.0, 5.0, 5.0, 3.0, 5.0, 4.0, 4.0, 0.0, 1.0, 2.0, 4.0], "bins": [-0.331787109375, -0.322662353515625, -0.31353759765625, -0.304412841796875, -0.2952880859375, -0.286163330078125, -0.27703857421875, -0.267913818359375, -0.2587890625, -0.249664306640625, -0.24053955078125, -0.231414794921875, -0.2222900390625, -0.213165283203125, -0.20404052734375, -0.194915771484375, -0.185791015625, -0.176666259765625, -0.16754150390625, -0.158416748046875, -0.1492919921875, -0.140167236328125, -0.13104248046875, -0.121917724609375, -0.11279296875, -0.103668212890625, -0.09454345703125, -0.085418701171875, -0.0762939453125, -0.067169189453125, -0.05804443359375, -0.048919677734375, -0.039794921875, -0.030670166015625, -0.02154541015625, -0.012420654296875, -0.0032958984375, 0.005828857421875, 0.01495361328125, 0.024078369140625, 0.033203125, 0.042327880859375, 0.05145263671875, 0.060577392578125, 0.0697021484375, 0.078826904296875, 0.08795166015625, 0.097076416015625, 0.106201171875, 0.115325927734375, 0.12445068359375, 0.133575439453125, 0.1427001953125, 0.151824951171875, 0.16094970703125, 0.170074462890625, 0.17919921875, 0.188323974609375, 0.19744873046875, 0.206573486328125, 0.2156982421875, 0.224822998046875, 0.23394775390625, 0.243072509765625, 0.252197265625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 8.0, 10.0, 12.0, 13.0, 37.0, 40.0, 49.0, 103.0, 141.0, 219.0, 388.0, 616.0, 1215.0, 2223.0, 4602.0, 10938.0, 34632.0, 172833.0, 633183.0, 139494.0, 29456.0, 9636.0, 4001.0, 1979.0, 1151.0, 582.0, 364.0, 191.0, 141.0, 91.0, 63.0, 55.0, 30.0, 14.0, 9.0, 11.0, 8.0, 4.0, 5.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0294036865234375, -0.02843785285949707, -0.02747201919555664, -0.02650618553161621, -0.02554035186767578, -0.02457451820373535, -0.023608684539794922, -0.022642850875854492, -0.021677017211914062, -0.020711183547973633, -0.019745349884033203, -0.018779516220092773, -0.017813682556152344, -0.016847848892211914, -0.015882015228271484, -0.014916181564331055, -0.013950347900390625, -0.012984514236450195, -0.012018680572509766, -0.011052846908569336, -0.010087013244628906, -0.009121179580688477, -0.008155345916748047, -0.007189512252807617, -0.0062236785888671875, -0.005257844924926758, -0.004292011260986328, -0.0033261775970458984, -0.0023603439331054688, -0.001394510269165039, -0.0004286766052246094, 0.0005371570587158203, 0.00150299072265625, 0.0024688243865966797, 0.0034346580505371094, 0.004400491714477539, 0.005366325378417969, 0.0063321590423583984, 0.007297992706298828, 0.008263826370239258, 0.009229660034179688, 0.010195493698120117, 0.011161327362060547, 0.012127161026000977, 0.013092994689941406, 0.014058828353881836, 0.015024662017822266, 0.015990495681762695, 0.016956329345703125, 0.017922163009643555, 0.018887996673583984, 0.019853830337524414, 0.020819664001464844, 0.021785497665405273, 0.022751331329345703, 0.023717164993286133, 0.024682998657226562, 0.025648832321166992, 0.026614665985107422, 0.02758049964904785, 0.02854633331298828, 0.02951216697692871, 0.03047800064086914, 0.03144383430480957, 0.03240966796875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 0.0, 4.0, 6.0, 5.0, 4.0, 8.0, 5.0, 10.0, 19.0, 24.0, 36.0, 50.0, 80.0, 96.0, 122.0, 138.0, 119.0, 75.0, 49.0, 47.0, 31.0, 18.0, 11.0, 14.0, 4.0, 7.0, 3.0, 5.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.0265579223632812e-05, -1.968909054994583e-05, -1.911260187625885e-05, -1.853611320257187e-05, -1.7959624528884888e-05, -1.7383135855197906e-05, -1.6806647181510925e-05, -1.6230158507823944e-05, -1.5653669834136963e-05, -1.5077181160449982e-05, -1.4500692486763e-05, -1.392420381307602e-05, -1.3347715139389038e-05, -1.2771226465702057e-05, -1.2194737792015076e-05, -1.1618249118328094e-05, -1.1041760444641113e-05, -1.0465271770954132e-05, -9.888783097267151e-06, -9.31229442358017e-06, -8.735805749893188e-06, -8.159317076206207e-06, -7.582828402519226e-06, -7.006339728832245e-06, -6.429851055145264e-06, -5.8533623814582825e-06, -5.276873707771301e-06, -4.70038503408432e-06, -4.123896360397339e-06, -3.5474076867103577e-06, -2.9709190130233765e-06, -2.3944303393363953e-06, -1.817941665649414e-06, -1.2414529919624329e-06, -6.649643182754517e-07, -8.847564458847046e-08, 4.880130290985107e-07, 1.064501702785492e-06, 1.6409903764724731e-06, 2.2174790501594543e-06, 2.7939677238464355e-06, 3.3704563975334167e-06, 3.946945071220398e-06, 4.523433744907379e-06, 5.09992241859436e-06, 5.6764110922813416e-06, 6.252899765968323e-06, 6.829388439655304e-06, 7.405877113342285e-06, 7.982365787029266e-06, 8.558854460716248e-06, 9.135343134403229e-06, 9.71183180809021e-06, 1.0288320481777191e-05, 1.0864809155464172e-05, 1.1441297829151154e-05, 1.2017786502838135e-05, 1.2594275176525116e-05, 1.3170763850212097e-05, 1.3747252523899078e-05, 1.432374119758606e-05, 1.490022987127304e-05, 1.5476718544960022e-05, 1.6053207218647003e-05, 1.6629695892333984e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 9.0, 13.0, 10.0, 14.0, 24.0, 32.0, 52.0, 100.0, 181.0, 458.0, 1176.0, 4146.0, 19579.0, 153131.0, 746594.0, 103078.0, 14776.0, 3433.0, 1021.0, 370.0, 148.0, 75.0, 36.0, 34.0, 18.0, 15.0, 9.0, 4.0, 8.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042816162109375, -0.041408538818359375, -0.04000091552734375, -0.038593292236328125, -0.0371856689453125, -0.035778045654296875, -0.03437042236328125, -0.032962799072265625, -0.03155517578125, -0.030147552490234375, -0.02873992919921875, -0.027332305908203125, -0.0259246826171875, -0.024517059326171875, -0.02310943603515625, -0.021701812744140625, -0.020294189453125, -0.018886566162109375, -0.01747894287109375, -0.016071319580078125, -0.0146636962890625, -0.013256072998046875, -0.01184844970703125, -0.010440826416015625, -0.009033203125, -0.007625579833984375, -0.00621795654296875, -0.004810333251953125, -0.0034027099609375, -0.001995086669921875, -0.00058746337890625, 0.000820159912109375, 0.002227783203125, 0.003635406494140625, 0.00504302978515625, 0.006450653076171875, 0.0078582763671875, 0.009265899658203125, 0.01067352294921875, 0.012081146240234375, 0.01348876953125, 0.014896392822265625, 0.01630401611328125, 0.017711639404296875, 0.0191192626953125, 0.020526885986328125, 0.02193450927734375, 0.023342132568359375, 0.024749755859375, 0.026157379150390625, 0.02756500244140625, 0.028972625732421875, 0.0303802490234375, 0.031787872314453125, 0.03319549560546875, 0.034603118896484375, 0.0360107421875, 0.037418365478515625, 0.03882598876953125, 0.040233612060546875, 0.0416412353515625, 0.043048858642578125, 0.04445648193359375, 0.045864105224609375, 0.047271728515625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 3.0, 5.0, 9.0, 10.0, 14.0, 14.0, 17.0, 27.0, 36.0, 41.0, 45.0, 48.0, 63.0, 74.0, 94.0, 118.0, 67.0, 60.0, 36.0, 35.0, 39.0, 31.0, 20.0, 28.0, 17.0, 12.0, 5.0, 6.0, 9.0, 7.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006473541259765625, -0.006262838840484619, -0.006052136421203613, -0.005841434001922607, -0.0056307315826416016, -0.005420029163360596, -0.00520932674407959, -0.004998624324798584, -0.004787921905517578, -0.004577219486236572, -0.004366517066955566, -0.0041558146476745605, -0.003945112228393555, -0.003734409809112549, -0.003523707389831543, -0.003313004970550537, -0.0031023025512695312, -0.0028916001319885254, -0.0026808977127075195, -0.0024701952934265137, -0.002259492874145508, -0.002048790454864502, -0.001838088035583496, -0.0016273856163024902, -0.0014166831970214844, -0.0012059807777404785, -0.0009952783584594727, -0.0007845759391784668, -0.0005738735198974609, -0.0003631711006164551, -0.00015246868133544922, 5.823373794555664e-05, 0.0002689361572265625, 0.00047963857650756836, 0.0006903409957885742, 0.0009010434150695801, 0.001111745834350586, 0.0013224482536315918, 0.0015331506729125977, 0.0017438530921936035, 0.0019545555114746094, 0.0021652579307556152, 0.002375960350036621, 0.002586662769317627, 0.002797365188598633, 0.0030080676078796387, 0.0032187700271606445, 0.0034294724464416504, 0.0036401748657226562, 0.003850877285003662, 0.004061579704284668, 0.004272282123565674, 0.00448298454284668, 0.0046936869621276855, 0.004904389381408691, 0.005115091800689697, 0.005325794219970703, 0.005536496639251709, 0.005747199058532715, 0.005957901477813721, 0.0061686038970947266, 0.006379306316375732, 0.006590008735656738, 0.006800711154937744, 0.00701141357421875]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 11.0, 10.0, 32.0, 34.0, 52.0, 62.0, 90.0, 101.0, 148.0, 119.0, 94.0, 71.0, 55.0, 34.0, 23.0, 19.0, 7.0, 10.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28356653451919556, -0.2743428945541382, -0.2651192545890808, -0.25589561462402344, -0.24667198956012726, -0.23744834959506989, -0.2282247245311737, -0.21900108456611633, -0.20977744460105896, -0.2005538046360016, -0.1913301646709442, -0.18210653960704803, -0.17288289964199066, -0.1636592596769333, -0.1544356346130371, -0.14521199464797974, -0.13598835468292236, -0.126764714717865, -0.11754108220338821, -0.10831744968891144, -0.09909380972385406, -0.08987016975879669, -0.08064653724431992, -0.07142290472984314, -0.06219926476478577, -0.05297562852501869, -0.04375199228525162, -0.03452835604548454, -0.025304719805717468, -0.016081083565950394, -0.006857447326183319, 0.002366185188293457, 0.011589854955673218, 0.020813491195440292, 0.030037127435207367, 0.03926076367497444, 0.048484399914741516, 0.05770803615450859, 0.06693167239427567, 0.07615530490875244, 0.08537894487380981, 0.09460258483886719, 0.10382621735334396, 0.11304984986782074, 0.12227348983287811, 0.13149712979793549, 0.14072075486183167, 0.14994439482688904, 0.1591680347919464, 0.16839167475700378, 0.17761531472206116, 0.18683893978595734, 0.1960625797510147, 0.20528621971607208, 0.21450984477996826, 0.22373348474502563, 0.232957124710083, 0.24218076467514038, 0.25140440464019775, 0.2606280446052551, 0.2698516845703125, 0.2790752947330475, 0.28829893469810486, 0.29752257466316223, 0.3067462146282196]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 4.0, 10.0, 13.0, 18.0, 22.0, 30.0, 45.0, 69.0, 76.0, 68.0, 81.0, 80.0, 77.0, 71.0, 85.0, 74.0, 59.0, 35.0, 32.0, 23.0, 14.0, 11.0, 8.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13032345473766327, -0.12155041843652725, -0.11277738213539124, -0.10400435328483582, -0.0952313095331192, -0.08645828068256378, -0.07768524438142776, -0.06891220808029175, -0.06013917177915573, -0.051366135478019714, -0.0425930991768837, -0.03382006660103798, -0.025047030299901962, -0.016273993998765945, -0.007500961422920227, 0.0012720748782157898, 0.010045111179351807, 0.018818147480487823, 0.02759118191897869, 0.03636421635746956, 0.045137252658605576, 0.05391028895974159, 0.06268332153558731, 0.07145635783672333, 0.08022939413785934, 0.08900243043899536, 0.09777546674013138, 0.1065485030412674, 0.11532153189182281, 0.12409457564353943, 0.13286760449409485, 0.14164063334465027, 0.1504136621952057, 0.1591866910457611, 0.16795973479747772, 0.17673276364803314, 0.18550580739974976, 0.19427883625030518, 0.2030518651008606, 0.2118249088525772, 0.22059795260429382, 0.22937098145484924, 0.23814402520656586, 0.24691705405712128, 0.2556900978088379, 0.2644631266593933, 0.27323615550994873, 0.28200918436050415, 0.29078221321105957, 0.299555242061615, 0.3083282709121704, 0.3171013295650482, 0.32587435841560364, 0.33464738726615906, 0.3434204161167145, 0.3521934747695923, 0.3609665036201477, 0.3697395324707031, 0.37851256132125854, 0.38728561997413635, 0.3960586488246918, 0.4048316776752472, 0.4136047065258026, 0.4223777651786804, 0.43115079402923584]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 10.0, 19.0, 25.0, 47.0, 57.0, 102.0, 190.0, 284.0, 506.0, 929.0, 1525.0, 3015.0, 5802.0, 12667.0, 32302.0, 122543.0, 657589.0, 147304.0, 36200.0, 13835.0, 6325.0, 3309.0, 1687.0, 927.0, 541.0, 308.0, 200.0, 116.0, 60.0, 52.0, 24.0, 20.0, 5.0, 7.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.335205078125, -0.3252143859863281, -0.31522369384765625, -0.3052330017089844, -0.2952423095703125, -0.2852516174316406, -0.27526092529296875, -0.2652702331542969, -0.255279541015625, -0.24528884887695312, -0.23529815673828125, -0.22530746459960938, -0.2153167724609375, -0.20532608032226562, -0.19533538818359375, -0.18534469604492188, -0.17535400390625, -0.16536331176757812, -0.15537261962890625, -0.14538192749023438, -0.1353912353515625, -0.12540054321289062, -0.11540985107421875, -0.10541915893554688, -0.095428466796875, -0.08543777465820312, -0.07544708251953125, -0.06545639038085938, -0.0554656982421875, -0.045475006103515625, -0.03548431396484375, -0.025493621826171875, -0.0155029296875, -0.005512237548828125, 0.00447845458984375, 0.014469146728515625, 0.0244598388671875, 0.034450531005859375, 0.04444122314453125, 0.054431915283203125, 0.064422607421875, 0.07441329956054688, 0.08440399169921875, 0.09439468383789062, 0.1043853759765625, 0.11437606811523438, 0.12436676025390625, 0.13435745239257812, 0.14434814453125, 0.15433883666992188, 0.16432952880859375, 0.17432022094726562, 0.1843109130859375, 0.19430160522460938, 0.20429229736328125, 0.21428298950195312, 0.224273681640625, 0.23426437377929688, 0.24425506591796875, 0.2542457580566406, 0.2642364501953125, 0.2742271423339844, 0.28421783447265625, 0.2942085266113281, 0.30419921875]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 8.0, 9.0, 20.0, 11.0, 31.0, 36.0, 55.0, 64.0, 62.0, 77.0, 93.0, 74.0, 76.0, 84.0, 63.0, 73.0, 52.0, 35.0, 26.0, 20.0, 9.0, 9.0, 7.0, 6.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28125, -0.2651519775390625, -0.249053955078125, -0.2329559326171875, -0.21685791015625, -0.2007598876953125, -0.184661865234375, -0.1685638427734375, -0.1524658203125, -0.1363677978515625, -0.120269775390625, -0.1041717529296875, -0.08807373046875, -0.0719757080078125, -0.055877685546875, -0.0397796630859375, -0.023681640625, -0.0075836181640625, 0.008514404296875, 0.0246124267578125, 0.04071044921875, 0.0568084716796875, 0.072906494140625, 0.0890045166015625, 0.1051025390625, 0.1212005615234375, 0.137298583984375, 0.1533966064453125, 0.16949462890625, 0.1855926513671875, 0.201690673828125, 0.2177886962890625, 0.23388671875, 0.2499847412109375, 0.266082763671875, 0.2821807861328125, 0.29827880859375, 0.3143768310546875, 0.330474853515625, 0.3465728759765625, 0.3626708984375, 0.3787689208984375, 0.394866943359375, 0.4109649658203125, 0.42706298828125, 0.4431610107421875, 0.459259033203125, 0.4753570556640625, 0.491455078125, 0.5075531005859375, 0.523651123046875, 0.5397491455078125, 0.55584716796875, 0.5719451904296875, 0.588043212890625, 0.6041412353515625, 0.6202392578125, 0.6363372802734375, 0.652435302734375, 0.6685333251953125, 0.68463134765625, 0.7007293701171875, 0.716827392578125, 0.7329254150390625, 0.7490234375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 6.0, 3.0, 5.0, 8.0, 14.0, 11.0, 14.0, 13.0, 25.0, 26.0, 42.0, 40.0, 58.0, 75.0, 74.0, 188.0, 409.0, 1666.0, 20922.0, 948494.0, 71593.0, 3587.0, 546.0, 220.0, 140.0, 79.0, 71.0, 51.0, 35.0, 27.0, 26.0, 23.0, 21.0, 10.0, 9.0, 10.0, 5.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.0751953125, -1.044189453125, -1.01318359375, -0.982177734375, -0.951171875, -0.920166015625, -0.88916015625, -0.858154296875, -0.8271484375, -0.796142578125, -0.76513671875, -0.734130859375, -0.703125, -0.672119140625, -0.64111328125, -0.610107421875, -0.5791015625, -0.548095703125, -0.51708984375, -0.486083984375, -0.455078125, -0.424072265625, -0.39306640625, -0.362060546875, -0.3310546875, -0.300048828125, -0.26904296875, -0.238037109375, -0.20703125, -0.176025390625, -0.14501953125, -0.114013671875, -0.0830078125, -0.052001953125, -0.02099609375, 0.010009765625, 0.041015625, 0.072021484375, 0.10302734375, 0.134033203125, 0.1650390625, 0.196044921875, 0.22705078125, 0.258056640625, 0.2890625, 0.320068359375, 0.35107421875, 0.382080078125, 0.4130859375, 0.444091796875, 0.47509765625, 0.506103515625, 0.537109375, 0.568115234375, 0.59912109375, 0.630126953125, 0.6611328125, 0.692138671875, 0.72314453125, 0.754150390625, 0.78515625, 0.816162109375, 0.84716796875, 0.878173828125, 0.9091796875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 8.0, 11.0, 6.0, 6.0, 7.0, 14.0, 14.0, 20.0, 17.0, 27.0, 33.0, 38.0, 44.0, 37.0, 50.0, 45.0, 56.0, 46.0, 59.0, 44.0, 47.0, 49.0, 49.0, 41.0, 47.0, 30.0, 34.0, 23.0, 20.0, 23.0, 11.0, 12.0, 10.0, 9.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33447265625, -0.3241767883300781, -0.31388092041015625, -0.3035850524902344, -0.2932891845703125, -0.2829933166503906, -0.27269744873046875, -0.2624015808105469, -0.252105712890625, -0.24180984497070312, -0.23151397705078125, -0.22121810913085938, -0.2109222412109375, -0.20062637329101562, -0.19033050537109375, -0.18003463745117188, -0.16973876953125, -0.15944290161132812, -0.14914703369140625, -0.13885116577148438, -0.1285552978515625, -0.11825942993164062, -0.10796356201171875, -0.09766769409179688, -0.087371826171875, -0.07707595825195312, -0.06678009033203125, -0.056484222412109375, -0.0461883544921875, -0.035892486572265625, -0.02559661865234375, -0.015300750732421875, -0.0050048828125, 0.005290985107421875, 0.01558685302734375, 0.025882720947265625, 0.0361785888671875, 0.046474456787109375, 0.05677032470703125, 0.06706619262695312, 0.077362060546875, 0.08765792846679688, 0.09795379638671875, 0.10824966430664062, 0.1185455322265625, 0.12884140014648438, 0.13913726806640625, 0.14943313598632812, 0.15972900390625, 0.17002487182617188, 0.18032073974609375, 0.19061660766601562, 0.2009124755859375, 0.21120834350585938, 0.22150421142578125, 0.23180007934570312, 0.242095947265625, 0.2523918151855469, 0.26268768310546875, 0.2729835510253906, 0.2832794189453125, 0.2935752868652344, 0.30387115478515625, 0.3141670227050781, 0.324462890625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 5.0, 6.0, 6.0, 2.0, 7.0, 9.0, 9.0, 7.0, 18.0, 19.0, 52.0, 97.0, 250.0, 886.0, 3959.0, 39459.0, 954423.0, 43568.0, 4198.0, 995.0, 292.0, 117.0, 55.0, 43.0, 22.0, 14.0, 10.0, 8.0, 8.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.18310546875, -0.17729568481445312, -0.17148590087890625, -0.16567611694335938, -0.1598663330078125, -0.15405654907226562, -0.14824676513671875, -0.14243698120117188, -0.136627197265625, -0.13081741333007812, -0.12500762939453125, -0.11919784545898438, -0.1133880615234375, -0.10757827758789062, -0.10176849365234375, -0.09595870971679688, -0.09014892578125, -0.08433914184570312, -0.07852935791015625, -0.07271957397460938, -0.0669097900390625, -0.061100006103515625, -0.05529022216796875, -0.049480438232421875, -0.043670654296875, -0.037860870361328125, -0.03205108642578125, -0.026241302490234375, -0.0204315185546875, -0.014621734619140625, -0.00881195068359375, -0.003002166748046875, 0.0028076171875, 0.008617401123046875, 0.01442718505859375, 0.020236968994140625, 0.0260467529296875, 0.031856536865234375, 0.03766632080078125, 0.043476104736328125, 0.049285888671875, 0.055095672607421875, 0.06090545654296875, 0.06671524047851562, 0.0725250244140625, 0.07833480834960938, 0.08414459228515625, 0.08995437622070312, 0.09576416015625, 0.10157394409179688, 0.10738372802734375, 0.11319351196289062, 0.1190032958984375, 0.12481307983398438, 0.13062286376953125, 0.13643264770507812, 0.142242431640625, 0.14805221557617188, 0.15386199951171875, 0.15967178344726562, 0.1654815673828125, 0.17129135131835938, 0.17710113525390625, 0.18291091918945312, 0.188720703125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 2.0, 4.0, 4.0, 4.0, 14.0, 10.0, 16.0, 33.0, 36.0, 83.0, 153.0, 212.0, 160.0, 83.0, 53.0, 39.0, 25.0, 15.0, 8.0, 11.0, 8.0, 2.0, 7.0, 3.0, 8.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7940998077392578e-05, -1.7449259757995605e-05, -1.6957521438598633e-05, -1.646578311920166e-05, -1.5974044799804688e-05, -1.5482306480407715e-05, -1.4990568161010742e-05, -1.449882984161377e-05, -1.4007091522216797e-05, -1.3515353202819824e-05, -1.3023614883422852e-05, -1.2531876564025879e-05, -1.2040138244628906e-05, -1.1548399925231934e-05, -1.1056661605834961e-05, -1.0564923286437988e-05, -1.0073184967041016e-05, -9.581446647644043e-06, -9.08970832824707e-06, -8.597970008850098e-06, -8.106231689453125e-06, -7.614493370056152e-06, -7.12275505065918e-06, -6.631016731262207e-06, -6.139278411865234e-06, -5.647540092468262e-06, -5.155801773071289e-06, -4.664063453674316e-06, -4.172325134277344e-06, -3.680586814880371e-06, -3.1888484954833984e-06, -2.6971101760864258e-06, -2.205371856689453e-06, -1.7136335372924805e-06, -1.2218952178955078e-06, -7.301568984985352e-07, -2.384185791015625e-07, 2.5331974029541016e-07, 7.450580596923828e-07, 1.2367963790893555e-06, 1.7285346984863281e-06, 2.2202730178833008e-06, 2.7120113372802734e-06, 3.203749656677246e-06, 3.6954879760742188e-06, 4.187226295471191e-06, 4.678964614868164e-06, 5.170702934265137e-06, 5.662441253662109e-06, 6.154179573059082e-06, 6.645917892456055e-06, 7.137656211853027e-06, 7.62939453125e-06, 8.121132850646973e-06, 8.612871170043945e-06, 9.104609489440918e-06, 9.59634780883789e-06, 1.0088086128234863e-05, 1.0579824447631836e-05, 1.1071562767028809e-05, 1.1563301086425781e-05, 1.2055039405822754e-05, 1.2546777725219727e-05, 1.30385160446167e-05, 1.3530254364013672e-05]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 10.0, 10.0, 14.0, 15.0, 24.0, 37.0, 62.0, 100.0, 211.0, 465.0, 1269.0, 3856.0, 17912.0, 304661.0, 686248.0, 26189.0, 4837.0, 1509.0, 557.0, 234.0, 109.0, 67.0, 52.0, 31.0, 21.0, 10.0, 8.0, 5.0, 6.0, 0.0, 4.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.150390625, -0.1461048126220703, -0.14181900024414062, -0.13753318786621094, -0.13324737548828125, -0.12896156311035156, -0.12467575073242188, -0.12038993835449219, -0.1161041259765625, -0.11181831359863281, -0.10753250122070312, -0.10324668884277344, -0.09896087646484375, -0.09467506408691406, -0.09038925170898438, -0.08610343933105469, -0.081817626953125, -0.07753181457519531, -0.07324600219726562, -0.06896018981933594, -0.06467437744140625, -0.06038856506347656, -0.056102752685546875, -0.05181694030761719, -0.0475311279296875, -0.04324531555175781, -0.038959503173828125, -0.03467369079589844, -0.03038787841796875, -0.026102066040039062, -0.021816253662109375, -0.017530441284179688, -0.01324462890625, -0.008958816528320312, -0.004673004150390625, -0.0003871917724609375, 0.00389862060546875, 0.008184432983398438, 0.012470245361328125, 0.016756057739257812, 0.0210418701171875, 0.025327682495117188, 0.029613494873046875, 0.03389930725097656, 0.03818511962890625, 0.04247093200683594, 0.046756744384765625, 0.05104255676269531, 0.055328369140625, 0.05961418151855469, 0.06389999389648438, 0.06818580627441406, 0.07247161865234375, 0.07675743103027344, 0.08104324340820312, 0.08532905578613281, 0.0896148681640625, 0.09390068054199219, 0.09818649291992188, 0.10247230529785156, 0.10675811767578125, 0.11104393005371094, 0.11532974243164062, 0.11961555480957031, 0.1239013671875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 4.0, 8.0, 12.0, 14.0, 13.0, 18.0, 32.0, 39.0, 54.0, 79.0, 117.0, 153.0, 127.0, 76.0, 80.0, 48.0, 37.0, 29.0, 18.0, 12.0, 6.0, 3.0, 5.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.03936767578125, -0.038074493408203125, -0.03678131103515625, -0.035488128662109375, -0.0341949462890625, -0.032901763916015625, -0.03160858154296875, -0.030315399169921875, -0.029022216796875, -0.027729034423828125, -0.02643585205078125, -0.025142669677734375, -0.0238494873046875, -0.022556304931640625, -0.02126312255859375, -0.019969940185546875, -0.0186767578125, -0.017383575439453125, -0.01609039306640625, -0.014797210693359375, -0.0135040283203125, -0.012210845947265625, -0.01091766357421875, -0.009624481201171875, -0.008331298828125, -0.007038116455078125, -0.00574493408203125, -0.004451751708984375, -0.0031585693359375, -0.001865386962890625, -0.00057220458984375, 0.000720977783203125, 0.00201416015625, 0.003307342529296875, 0.00460052490234375, 0.005893707275390625, 0.0071868896484375, 0.008480072021484375, 0.00977325439453125, 0.011066436767578125, 0.012359619140625, 0.013652801513671875, 0.01494598388671875, 0.016239166259765625, 0.0175323486328125, 0.018825531005859375, 0.02011871337890625, 0.021411895751953125, 0.022705078125, 0.023998260498046875, 0.02529144287109375, 0.026584625244140625, 0.0278778076171875, 0.029170989990234375, 0.03046417236328125, 0.031757354736328125, 0.033050537109375, 0.034343719482421875, 0.03563690185546875, 0.036930084228515625, 0.0382232666015625, 0.039516448974609375, 0.04080963134765625, 0.042102813720703125, 0.04339599609375]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 8.0, 9.0, 23.0, 37.0, 47.0, 140.0, 180.0, 204.0, 153.0, 91.0, 51.0, 22.0, 18.0, 7.0, 9.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5272629857063293, -0.4985676407814026, -0.46987229585647583, -0.44117698073387146, -0.4124816358089447, -0.38378629088401794, -0.3550909757614136, -0.3263956308364868, -0.29770028591156006, -0.2690049409866333, -0.24030961096286774, -0.21161428093910217, -0.18291893601417542, -0.15422359108924866, -0.1255282610654831, -0.09683293104171753, -0.06813758611679077, -0.03944224864244461, -0.01074691116809845, 0.01794842630624771, 0.04664376378059387, 0.07533910870552063, 0.1040344387292862, 0.13272976875305176, 0.16142511367797852, 0.19012045860290527, 0.21881578862667084, 0.2475111186504364, 0.27620646357536316, 0.3049018085002899, 0.3335971236228943, 0.36229246854782104, 0.390987753868103, 0.4196830987930298, 0.44837844371795654, 0.4770737588405609, 0.5057691335678101, 0.5344644784927368, 0.5631597638130188, 0.5918551087379456, 0.6205504536628723, 0.6492457985877991, 0.6779411435127258, 0.7066364884376526, 0.7353317737579346, 0.7640271186828613, 0.7927224636077881, 0.8214178085327148, 0.8501131534576416, 0.8788084983825684, 0.9075038433074951, 0.9361991882324219, 0.9648945331573486, 0.9935898780822754, 1.0222852230072021, 1.050980567932129, 1.0796759128570557, 1.1083712577819824, 1.1370666027069092, 1.165761947631836, 1.1944572925567627, 1.2231526374816895, 1.2518479824066162, 1.280543327331543, 1.3092385530471802]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 7.0, 7.0, 7.0, 9.0, 18.0, 12.0, 22.0, 12.0, 24.0, 30.0, 24.0, 33.0, 35.0, 22.0, 40.0, 38.0, 51.0, 42.0, 53.0, 44.0, 42.0, 54.0, 43.0, 41.0, 37.0, 36.0, 35.0, 32.0, 25.0, 26.0, 16.0, 22.0, 12.0, 13.0, 9.0, 7.0, 10.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37177786231040955, -0.35603827238082886, -0.3402986526489258, -0.3245590627193451, -0.3088194727897644, -0.29307985305786133, -0.27734026312828064, -0.26160067319869995, -0.24586106836795807, -0.2301214635372162, -0.2143818736076355, -0.19864226877689362, -0.18290266394615173, -0.16716307401657104, -0.15142346918582916, -0.13568386435508728, -0.11994427442550659, -0.1042046770453453, -0.08846507966518402, -0.07272547483444214, -0.05698587745428085, -0.04124628007411957, -0.025506675243377686, -0.0097670778632164, 0.005972519516944885, 0.02171211875975132, 0.037451718002557755, 0.05319131910800934, 0.06893091648817062, 0.08467051386833191, 0.10041011869907379, 0.11614971607923508, 0.13188934326171875, 0.14762894809246063, 0.16336853802204132, 0.1791081428527832, 0.1948477327823639, 0.21058733761310577, 0.22632694244384766, 0.24206653237342834, 0.25780612230300903, 0.2735457122325897, 0.2892853319644928, 0.3050249218940735, 0.3207645118236542, 0.33650410175323486, 0.35224372148513794, 0.36798331141471863, 0.3837229311466217, 0.3994625210762024, 0.41520214080810547, 0.43094173073768616, 0.44668132066726685, 0.4624209403991699, 0.4781605303287506, 0.4939001202583313, 0.5096397399902344, 0.5253793597221375, 0.5411189198493958, 0.5568585395812988, 0.5725981593132019, 0.5883377194404602, 0.6040773391723633, 0.6198169589042664, 0.6355565190315247]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 5.0, 5.0, 10.0, 8.0, 8.0, 17.0, 23.0, 31.0, 29.0, 42.0, 69.0, 72.0, 118.0, 177.0, 283.0, 408.0, 656.0, 1187.0, 2088.0, 4385.0, 10444.0, 42519.0, 825234.0, 3049629.0, 222437.0, 20239.0, 7002.0, 3046.0, 1606.0, 884.0, 554.0, 309.0, 223.0, 160.0, 96.0, 57.0, 68.0, 42.0, 29.0, 22.0, 11.0, 15.0, 7.0, 4.0, 5.0, 10.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.423583984375, -0.40959930419921875, -0.3956146240234375, -0.38162994384765625, -0.367645263671875, -0.35366058349609375, -0.3396759033203125, -0.32569122314453125, -0.31170654296875, -0.29772186279296875, -0.2837371826171875, -0.26975250244140625, -0.255767822265625, -0.24178314208984375, -0.2277984619140625, -0.21381378173828125, -0.1998291015625, -0.18584442138671875, -0.1718597412109375, -0.15787506103515625, -0.143890380859375, -0.12990570068359375, -0.1159210205078125, -0.10193634033203125, -0.08795166015625, -0.07396697998046875, -0.0599822998046875, -0.04599761962890625, -0.032012939453125, -0.01802825927734375, -0.0040435791015625, 0.00994110107421875, 0.02392578125, 0.03791046142578125, 0.0518951416015625, 0.06587982177734375, 0.079864501953125, 0.09384918212890625, 0.1078338623046875, 0.12181854248046875, 0.13580322265625, 0.14978790283203125, 0.1637725830078125, 0.17775726318359375, 0.191741943359375, 0.20572662353515625, 0.2197113037109375, 0.23369598388671875, 0.2476806640625, 0.26166534423828125, 0.2756500244140625, 0.28963470458984375, 0.303619384765625, 0.31760406494140625, 0.3315887451171875, 0.34557342529296875, 0.35955810546875, 0.37354278564453125, 0.3875274658203125, 0.40151214599609375, 0.415496826171875, 0.42948150634765625, 0.4434661865234375, 0.45745086669921875, 0.471435546875]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 6.0, 5.0, 10.0, 1.0, 8.0, 6.0, 7.0, 13.0, 8.0, 13.0, 17.0, 16.0, 21.0, 14.0, 32.0, 27.0, 33.0, 30.0, 28.0, 34.0, 38.0, 30.0, 46.0, 33.0, 47.0, 43.0, 43.0, 46.0, 35.0, 32.0, 25.0, 29.0, 28.0, 34.0, 22.0, 15.0, 15.0, 25.0, 20.0, 15.0, 10.0, 7.0, 10.0, 5.0, 2.0, 5.0, 6.0, 2.0, 8.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.184814453125, -0.17955780029296875, -0.1743011474609375, -0.16904449462890625, -0.163787841796875, -0.15853118896484375, -0.1532745361328125, -0.14801788330078125, -0.14276123046875, -0.13750457763671875, -0.1322479248046875, -0.12699127197265625, -0.121734619140625, -0.11647796630859375, -0.1112213134765625, -0.10596466064453125, -0.1007080078125, -0.09545135498046875, -0.0901947021484375, -0.08493804931640625, -0.079681396484375, -0.07442474365234375, -0.0691680908203125, -0.06391143798828125, -0.05865478515625, -0.05339813232421875, -0.0481414794921875, -0.04288482666015625, -0.037628173828125, -0.03237152099609375, -0.0271148681640625, -0.02185821533203125, -0.0166015625, -0.01134490966796875, -0.0060882568359375, -0.00083160400390625, 0.004425048828125, 0.00968170166015625, 0.0149383544921875, 0.02019500732421875, 0.02545166015625, 0.03070831298828125, 0.0359649658203125, 0.04122161865234375, 0.046478271484375, 0.05173492431640625, 0.0569915771484375, 0.06224822998046875, 0.0675048828125, 0.07276153564453125, 0.0780181884765625, 0.08327484130859375, 0.088531494140625, 0.09378814697265625, 0.0990447998046875, 0.10430145263671875, 0.10955810546875, 0.11481475830078125, 0.1200714111328125, 0.12532806396484375, 0.130584716796875, 0.13584136962890625, 0.1410980224609375, 0.14635467529296875, 0.151611328125]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 3.0, 3.0, 6.0, 5.0, 10.0, 7.0, 11.0, 11.0, 15.0, 15.0, 37.0, 39.0, 46.0, 77.0, 122.0, 206.0, 748.0, 5431.0, 1522983.0, 2657565.0, 5659.0, 726.0, 191.0, 91.0, 65.0, 68.0, 31.0, 29.0, 13.0, 15.0, 18.0, 5.0, 9.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.62890625, -1.58489990234375, -1.5408935546875, -1.49688720703125, -1.452880859375, -1.40887451171875, -1.3648681640625, -1.32086181640625, -1.27685546875, -1.23284912109375, -1.1888427734375, -1.14483642578125, -1.100830078125, -1.05682373046875, -1.0128173828125, -0.96881103515625, -0.9248046875, -0.88079833984375, -0.8367919921875, -0.79278564453125, -0.748779296875, -0.70477294921875, -0.6607666015625, -0.61676025390625, -0.57275390625, -0.52874755859375, -0.4847412109375, -0.44073486328125, -0.396728515625, -0.35272216796875, -0.3087158203125, -0.26470947265625, -0.220703125, -0.17669677734375, -0.1326904296875, -0.08868408203125, -0.044677734375, -0.00067138671875, 0.0433349609375, 0.08734130859375, 0.13134765625, 0.17535400390625, 0.2193603515625, 0.26336669921875, 0.307373046875, 0.35137939453125, 0.3953857421875, 0.43939208984375, 0.4833984375, 0.52740478515625, 0.5714111328125, 0.61541748046875, 0.659423828125, 0.70343017578125, 0.7474365234375, 0.79144287109375, 0.83544921875, 0.87945556640625, 0.9234619140625, 0.96746826171875, 1.011474609375, 1.05548095703125, 1.0994873046875, 1.14349365234375, 1.1875]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 2.0, 4.0, 5.0, 11.0, 22.0, 27.0, 31.0, 40.0, 64.0, 126.0, 296.0, 724.0, 1213.0, 808.0, 332.0, 137.0, 70.0, 45.0, 31.0, 23.0, 10.0, 9.0, 16.0, 10.0, 6.0, 4.0, 2.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10369873046875, -0.0993051528930664, -0.09491157531738281, -0.09051799774169922, -0.08612442016601562, -0.08173084259033203, -0.07733726501464844, -0.07294368743896484, -0.06855010986328125, -0.06415653228759766, -0.05976295471191406, -0.05536937713623047, -0.050975799560546875, -0.04658222198486328, -0.04218864440917969, -0.037795066833496094, -0.0334014892578125, -0.029007911682128906, -0.024614334106445312, -0.02022075653076172, -0.015827178955078125, -0.011433601379394531, -0.0070400238037109375, -0.0026464462280273438, 0.00174713134765625, 0.006140708923339844, 0.010534286499023438, 0.014927864074707031, 0.019321441650390625, 0.02371501922607422, 0.028108596801757812, 0.032502174377441406, 0.036895751953125, 0.041289329528808594, 0.04568290710449219, 0.05007648468017578, 0.054470062255859375, 0.05886363983154297, 0.06325721740722656, 0.06765079498291016, 0.07204437255859375, 0.07643795013427734, 0.08083152770996094, 0.08522510528564453, 0.08961868286132812, 0.09401226043701172, 0.09840583801269531, 0.1027994155883789, 0.1071929931640625, 0.1115865707397461, 0.11598014831542969, 0.12037372589111328, 0.12476730346679688, 0.12916088104248047, 0.13355445861816406, 0.13794803619384766, 0.14234161376953125, 0.14673519134521484, 0.15112876892089844, 0.15552234649658203, 0.15991592407226562, 0.16430950164794922, 0.1687030792236328, 0.1730966567993164, 0.177490234375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 9.0, 6.0, 10.0, 12.0, 31.0, 39.0, 52.0, 82.0, 104.0, 139.0, 110.0, 116.0, 70.0, 59.0, 37.0, 32.0, 27.0, 23.0, 12.0, 9.0, 7.0, 4.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2836915850639343, -0.2709067463874817, -0.25812193751335144, -0.24533711373806, -0.23255228996276855, -0.21976745128631592, -0.20698264241218567, -0.19419780373573303, -0.18141299486160278, -0.16862817108631134, -0.1558433473110199, -0.14305852353572845, -0.130273699760437, -0.11748886853456497, -0.10470404475927353, -0.09191922098398209, -0.07913438975811005, -0.0663495659828186, -0.05356474220752716, -0.04077991470694542, -0.027995090931653976, -0.015210263431072235, -0.0024254396557807922, 0.01035938411951065, 0.023144207894802094, 0.035929031670093536, 0.04871385544538498, 0.06149868294596672, 0.07428351044654846, 0.0870683342218399, 0.09985315799713135, 0.11263798177242279, 0.12542280554771423, 0.13820762932300568, 0.15099245309829712, 0.16377727687358856, 0.17656210064888, 0.18934693932533264, 0.2021317481994629, 0.21491658687591553, 0.22770139575004578, 0.24048621952533722, 0.25327104330062866, 0.2660558819770813, 0.27884069085121155, 0.2916255295276642, 0.30441033840179443, 0.31719517707824707, 0.3299800157546997, 0.34276485443115234, 0.3555496633052826, 0.36833450198173523, 0.3811193108558655, 0.3939041495323181, 0.40668895840644836, 0.419473797082901, 0.43225860595703125, 0.4450434446334839, 0.45782825350761414, 0.4706130921840668, 0.483397901058197, 0.49618273973464966, 0.5089675784111023, 0.5217523574829102, 0.5345371961593628]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 5.0, 10.0, 3.0, 5.0, 13.0, 6.0, 13.0, 18.0, 24.0, 15.0, 29.0, 31.0, 34.0, 33.0, 30.0, 36.0, 44.0, 44.0, 41.0, 48.0, 42.0, 53.0, 41.0, 39.0, 39.0, 42.0, 43.0, 36.0, 36.0, 27.0, 22.0, 18.0, 16.0, 16.0, 7.0, 9.0, 8.0, 8.0, 3.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2305736392736435, -0.22390788793563843, -0.21724213659763336, -0.2105763852596283, -0.20391061902046204, -0.19724488258361816, -0.1905791163444519, -0.18391336500644684, -0.17724761366844177, -0.1705818623304367, -0.16391611099243164, -0.15725035965442657, -0.1505846083164215, -0.14391884207725525, -0.13725309073925018, -0.13058733940124512, -0.12392158806324005, -0.11725583672523499, -0.11059008538722992, -0.10392432659864426, -0.09725857526063919, -0.09059282392263412, -0.08392706513404846, -0.0772613137960434, -0.07059556245803833, -0.06392981112003326, -0.0572640560567379, -0.050598300993442535, -0.04393254965543747, -0.037266798317432404, -0.03060104325413704, -0.023935288190841675, -0.017269551753997803, -0.010603798553347588, -0.0039380453526973724, 0.0027277078479528427, 0.009393461048603058, 0.016059212386608124, 0.022724967449903488, 0.029390722513198853, 0.03605647385120392, 0.042722225189208984, 0.04938798025250435, 0.05605373531579971, 0.06271948665380478, 0.06938523799180984, 0.07605099678039551, 0.08271674811840057, 0.08938249945640564, 0.0960482507944107, 0.10271400213241577, 0.10937976092100143, 0.1160455122590065, 0.12271126359701157, 0.12937702238559723, 0.1360427737236023, 0.14270852506160736, 0.14937427639961243, 0.1560400277376175, 0.16270577907562256, 0.16937154531478882, 0.1760372817516327, 0.18270304799079895, 0.18936879932880402, 0.19603455066680908]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 7.0, 5.0, 12.0, 19.0, 25.0, 36.0, 59.0, 69.0, 133.0, 181.0, 259.0, 441.0, 831.0, 1404.0, 2723.0, 5952.0, 14071.0, 41521.0, 170920.0, 560404.0, 179648.0, 42631.0, 14581.0, 6222.0, 2941.0, 1449.0, 789.0, 484.0, 252.0, 183.0, 84.0, 70.0, 40.0, 36.0, 20.0, 14.0, 13.0, 9.0, 2.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.091552734375, -0.0891122817993164, -0.08667182922363281, -0.08423137664794922, -0.08179092407226562, -0.07935047149658203, -0.07691001892089844, -0.07446956634521484, -0.07202911376953125, -0.06958866119384766, -0.06714820861816406, -0.06470775604248047, -0.062267303466796875, -0.05982685089111328, -0.05738639831542969, -0.054945945739746094, -0.0525054931640625, -0.050065040588378906, -0.04762458801269531, -0.04518413543701172, -0.042743682861328125, -0.04030323028564453, -0.03786277770996094, -0.035422325134277344, -0.03298187255859375, -0.030541419982910156, -0.028100967407226562, -0.02566051483154297, -0.023220062255859375, -0.02077960968017578, -0.018339157104492188, -0.015898704528808594, -0.013458251953125, -0.011017799377441406, -0.008577346801757812, -0.006136894226074219, -0.003696441650390625, -0.0012559890747070312, 0.0011844635009765625, 0.0036249160766601562, 0.00606536865234375, 0.008505821228027344, 0.010946273803710938, 0.013386726379394531, 0.015827178955078125, 0.01826763153076172, 0.020708084106445312, 0.023148536682128906, 0.0255889892578125, 0.028029441833496094, 0.030469894409179688, 0.03291034698486328, 0.035350799560546875, 0.03779125213623047, 0.04023170471191406, 0.042672157287597656, 0.04511260986328125, 0.047553062438964844, 0.04999351501464844, 0.05243396759033203, 0.054874420166015625, 0.05731487274169922, 0.05975532531738281, 0.062195777893066406, 0.06463623046875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 3.0, 5.0, 7.0, 13.0, 14.0, 16.0, 18.0, 37.0, 35.0, 36.0, 37.0, 56.0, 42.0, 69.0, 57.0, 64.0, 66.0, 76.0, 50.0, 38.0, 60.0, 50.0, 32.0, 25.0, 31.0, 19.0, 11.0, 4.0, 6.0, 8.0, 4.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.184814453125, -0.178985595703125, -0.17315673828125, -0.167327880859375, -0.1614990234375, -0.155670166015625, -0.14984130859375, -0.144012451171875, -0.13818359375, -0.132354736328125, -0.12652587890625, -0.120697021484375, -0.1148681640625, -0.109039306640625, -0.10321044921875, -0.097381591796875, -0.091552734375, -0.085723876953125, -0.07989501953125, -0.074066162109375, -0.0682373046875, -0.062408447265625, -0.05657958984375, -0.050750732421875, -0.044921875, -0.039093017578125, -0.03326416015625, -0.027435302734375, -0.0216064453125, -0.015777587890625, -0.00994873046875, -0.004119873046875, 0.001708984375, 0.007537841796875, 0.01336669921875, 0.019195556640625, 0.0250244140625, 0.030853271484375, 0.03668212890625, 0.042510986328125, 0.04833984375, 0.054168701171875, 0.05999755859375, 0.065826416015625, 0.0716552734375, 0.077484130859375, 0.08331298828125, 0.089141845703125, 0.094970703125, 0.100799560546875, 0.10662841796875, 0.112457275390625, 0.1182861328125, 0.124114990234375, 0.12994384765625, 0.135772705078125, 0.1416015625, 0.147430419921875, 0.15325927734375, 0.159088134765625, 0.1649169921875, 0.170745849609375, 0.17657470703125, 0.182403564453125, 0.188232421875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 3.0, 5.0, 4.0, 4.0, 5.0, 14.0, 20.0, 29.0, 54.0, 79.0, 163.0, 381.0, 1024.0, 3487.0, 15701.0, 115726.0, 735406.0, 151688.0, 18646.0, 4093.0, 1178.0, 443.0, 170.0, 71.0, 50.0, 36.0, 24.0, 13.0, 7.0, 5.0, 6.0, 7.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12310791015625, -0.11943912506103516, -0.11577033996582031, -0.11210155487060547, -0.10843276977539062, -0.10476398468017578, -0.10109519958496094, -0.0974264144897461, -0.09375762939453125, -0.0900888442993164, -0.08642005920410156, -0.08275127410888672, -0.07908248901367188, -0.07541370391845703, -0.07174491882324219, -0.06807613372802734, -0.0644073486328125, -0.060738563537597656, -0.05706977844238281, -0.05340099334716797, -0.049732208251953125, -0.04606342315673828, -0.04239463806152344, -0.038725852966308594, -0.03505706787109375, -0.031388282775878906, -0.027719497680664062, -0.02405071258544922, -0.020381927490234375, -0.01671314239501953, -0.013044357299804688, -0.009375572204589844, -0.005706787109375, -0.0020380020141601562, 0.0016307830810546875, 0.005299568176269531, 0.008968353271484375, 0.012637138366699219, 0.016305923461914062, 0.019974708557128906, 0.02364349365234375, 0.027312278747558594, 0.030981063842773438, 0.03464984893798828, 0.038318634033203125, 0.04198741912841797, 0.04565620422363281, 0.049324989318847656, 0.0529937744140625, 0.056662559509277344, 0.06033134460449219, 0.06400012969970703, 0.06766891479492188, 0.07133769989013672, 0.07500648498535156, 0.0786752700805664, 0.08234405517578125, 0.0860128402709961, 0.08968162536621094, 0.09335041046142578, 0.09701919555664062, 0.10068798065185547, 0.10435676574707031, 0.10802555084228516, 0.1116943359375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 9.0, 8.0, 11.0, 8.0, 13.0, 14.0, 24.0, 17.0, 27.0, 26.0, 35.0, 35.0, 42.0, 38.0, 45.0, 36.0, 49.0, 52.0, 49.0, 41.0, 44.0, 47.0, 36.0, 42.0, 35.0, 30.0, 35.0, 21.0, 20.0, 16.0, 14.0, 18.0, 11.0, 12.0, 6.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.269775390625, -0.2617378234863281, -0.25370025634765625, -0.24566268920898438, -0.2376251220703125, -0.22958755493164062, -0.22154998779296875, -0.21351242065429688, -0.205474853515625, -0.19743728637695312, -0.18939971923828125, -0.18136215209960938, -0.1733245849609375, -0.16528701782226562, -0.15724945068359375, -0.14921188354492188, -0.14117431640625, -0.13313674926757812, -0.12509918212890625, -0.11706161499023438, -0.1090240478515625, -0.10098648071289062, -0.09294891357421875, -0.08491134643554688, -0.076873779296875, -0.06883621215820312, -0.06079864501953125, -0.052761077880859375, -0.0447235107421875, -0.036685943603515625, -0.02864837646484375, -0.020610809326171875, -0.0125732421875, -0.004535675048828125, 0.00350189208984375, 0.011539459228515625, 0.0195770263671875, 0.027614593505859375, 0.03565216064453125, 0.043689727783203125, 0.051727294921875, 0.059764862060546875, 0.06780242919921875, 0.07583999633789062, 0.0838775634765625, 0.09191513061523438, 0.09995269775390625, 0.10799026489257812, 0.11602783203125, 0.12406539916992188, 0.13210296630859375, 0.14014053344726562, 0.1481781005859375, 0.15621566772460938, 0.16425323486328125, 0.17229080200195312, 0.180328369140625, 0.18836593627929688, 0.19640350341796875, 0.20444107055664062, 0.2124786376953125, 0.22051620483398438, 0.22855377197265625, 0.23659133911132812, 0.24462890625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 0.0, 6.0, 4.0, 4.0, 7.0, 5.0, 19.0, 11.0, 25.0, 23.0, 53.0, 100.0, 190.0, 387.0, 924.0, 2851.0, 10806.0, 67567.0, 760950.0, 178755.0, 19040.0, 4429.0, 1358.0, 530.0, 227.0, 124.0, 74.0, 30.0, 27.0, 11.0, 3.0, 9.0, 5.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0287628173828125, -0.02749466896057129, -0.026226520538330078, -0.024958372116088867, -0.023690223693847656, -0.022422075271606445, -0.021153926849365234, -0.019885778427124023, -0.018617630004882812, -0.0173494815826416, -0.01608133316040039, -0.01481318473815918, -0.013545036315917969, -0.012276887893676758, -0.011008739471435547, -0.009740591049194336, -0.008472442626953125, -0.007204294204711914, -0.005936145782470703, -0.004667997360229492, -0.0033998489379882812, -0.0021317005157470703, -0.0008635520935058594, 0.00040459632873535156, 0.0016727447509765625, 0.0029408931732177734, 0.004209041595458984, 0.005477190017700195, 0.006745338439941406, 0.008013486862182617, 0.009281635284423828, 0.010549783706665039, 0.01181793212890625, 0.013086080551147461, 0.014354228973388672, 0.015622377395629883, 0.016890525817871094, 0.018158674240112305, 0.019426822662353516, 0.020694971084594727, 0.021963119506835938, 0.02323126792907715, 0.02449941635131836, 0.02576756477355957, 0.02703571319580078, 0.028303861618041992, 0.029572010040283203, 0.030840158462524414, 0.032108306884765625, 0.033376455307006836, 0.03464460372924805, 0.03591275215148926, 0.03718090057373047, 0.03844904899597168, 0.03971719741821289, 0.0409853458404541, 0.04225349426269531, 0.04352164268493652, 0.044789791107177734, 0.046057939529418945, 0.047326087951660156, 0.04859423637390137, 0.04986238479614258, 0.05113053321838379, 0.052398681640625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 7.0, 12.0, 9.0, 15.0, 16.0, 27.0, 37.0, 69.0, 74.0, 101.0, 112.0, 151.0, 101.0, 77.0, 55.0, 28.0, 23.0, 22.0, 18.0, 16.0, 9.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3232231140136719e-05, -1.2774020433425903e-05, -1.2315809726715088e-05, -1.1857599020004272e-05, -1.1399388313293457e-05, -1.0941177606582642e-05, -1.0482966899871826e-05, -1.002475619316101e-05, -9.566545486450195e-06, -9.10833477973938e-06, -8.650124073028564e-06, -8.191913366317749e-06, -7.733702659606934e-06, -7.275491952896118e-06, -6.817281246185303e-06, -6.359070539474487e-06, -5.900859832763672e-06, -5.4426491260528564e-06, -4.984438419342041e-06, -4.526227712631226e-06, -4.06801700592041e-06, -3.6098062992095947e-06, -3.1515955924987793e-06, -2.693384885787964e-06, -2.2351741790771484e-06, -1.776963472366333e-06, -1.3187527656555176e-06, -8.605420589447021e-07, -4.023313522338867e-07, 5.587935447692871e-08, 5.140900611877441e-07, 9.723007678985596e-07, 1.430511474609375e-06, 1.8887221813201904e-06, 2.346932888031006e-06, 2.8051435947418213e-06, 3.2633543014526367e-06, 3.721565008163452e-06, 4.179775714874268e-06, 4.637986421585083e-06, 5.0961971282958984e-06, 5.554407835006714e-06, 6.012618541717529e-06, 6.470829248428345e-06, 6.92903995513916e-06, 7.387250661849976e-06, 7.845461368560791e-06, 8.303672075271606e-06, 8.761882781982422e-06, 9.220093488693237e-06, 9.678304195404053e-06, 1.0136514902114868e-05, 1.0594725608825684e-05, 1.1052936315536499e-05, 1.1511147022247314e-05, 1.196935772895813e-05, 1.2427568435668945e-05, 1.288577914237976e-05, 1.3343989849090576e-05, 1.3802200555801392e-05, 1.4260411262512207e-05, 1.4718621969223022e-05, 1.5176832675933838e-05, 1.5635043382644653e-05, 1.609325408935547e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 2.0, 5.0, 4.0, 3.0, 6.0, 8.0, 18.0, 15.0, 21.0, 30.0, 25.0, 45.0, 87.0, 161.0, 279.0, 549.0, 1352.0, 3207.0, 8798.0, 31547.0, 218522.0, 659542.0, 95574.0, 18530.0, 5979.0, 2251.0, 931.0, 426.0, 251.0, 131.0, 80.0, 53.0, 30.0, 23.0, 12.0, 11.0, 6.0, 9.0, 8.0, 8.0, 5.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03094482421875, -0.029987096786499023, -0.029029369354248047, -0.02807164192199707, -0.027113914489746094, -0.026156187057495117, -0.02519845962524414, -0.024240732192993164, -0.023283004760742188, -0.02232527732849121, -0.021367549896240234, -0.020409822463989258, -0.01945209503173828, -0.018494367599487305, -0.017536640167236328, -0.01657891273498535, -0.015621185302734375, -0.014663457870483398, -0.013705730438232422, -0.012748003005981445, -0.011790275573730469, -0.010832548141479492, -0.009874820709228516, -0.008917093276977539, -0.007959365844726562, -0.007001638412475586, -0.006043910980224609, -0.005086183547973633, -0.004128456115722656, -0.0031707286834716797, -0.002213001251220703, -0.0012552738189697266, -0.00029754638671875, 0.0006601810455322266, 0.0016179084777832031, 0.0025756359100341797, 0.0035333633422851562, 0.004491090774536133, 0.005448818206787109, 0.006406545639038086, 0.0073642730712890625, 0.008322000503540039, 0.009279727935791016, 0.010237455368041992, 0.011195182800292969, 0.012152910232543945, 0.013110637664794922, 0.014068365097045898, 0.015026092529296875, 0.01598381996154785, 0.016941547393798828, 0.017899274826049805, 0.01885700225830078, 0.019814729690551758, 0.020772457122802734, 0.02173018455505371, 0.022687911987304688, 0.023645639419555664, 0.02460336685180664, 0.025561094284057617, 0.026518821716308594, 0.02747654914855957, 0.028434276580810547, 0.029392004013061523, 0.0303497314453125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 7.0, 6.0, 8.0, 7.0, 15.0, 16.0, 17.0, 30.0, 39.0, 49.0, 43.0, 58.0, 95.0, 64.0, 93.0, 65.0, 89.0, 60.0, 54.0, 41.0, 24.0, 27.0, 22.0, 14.0, 10.0, 2.0, 5.0, 7.0, 4.0, 4.0, 7.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004848480224609375, -0.0046749114990234375, -0.0045013427734375, -0.0043277740478515625, -0.004154205322265625, -0.0039806365966796875, -0.00380706787109375, -0.0036334991455078125, -0.003459930419921875, -0.0032863616943359375, -0.00311279296875, -0.0029392242431640625, -0.002765655517578125, -0.0025920867919921875, -0.00241851806640625, -0.0022449493408203125, -0.002071380615234375, -0.0018978118896484375, -0.0017242431640625, -0.0015506744384765625, -0.001377105712890625, -0.0012035369873046875, -0.00102996826171875, -0.0008563995361328125, -0.000682830810546875, -0.0005092620849609375, -0.000335693359375, -0.0001621246337890625, 1.1444091796875e-05, 0.0001850128173828125, 0.00035858154296875, 0.0005321502685546875, 0.000705718994140625, 0.0008792877197265625, 0.0010528564453125, 0.0012264251708984375, 0.001399993896484375, 0.0015735626220703125, 0.00174713134765625, 0.0019207000732421875, 0.002094268798828125, 0.0022678375244140625, 0.00244140625, 0.0026149749755859375, 0.002788543701171875, 0.0029621124267578125, 0.00313568115234375, 0.0033092498779296875, 0.003482818603515625, 0.0036563873291015625, 0.0038299560546875, 0.0040035247802734375, 0.004177093505859375, 0.0043506622314453125, 0.00452423095703125, 0.0046977996826171875, 0.004871368408203125, 0.0050449371337890625, 0.005218505859375, 0.0053920745849609375, 0.005565643310546875, 0.0057392120361328125, 0.00591278076171875, 0.0060863494873046875, 0.006259918212890625]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 7.0, 11.0, 16.0, 45.0, 58.0, 144.0, 171.0, 209.0, 129.0, 73.0, 55.0, 35.0, 18.0, 8.0, 8.0, 4.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42667779326438904, -0.4148869514465332, -0.40309613943099976, -0.3913052976131439, -0.3795144557952881, -0.36772364377975464, -0.3559328019618988, -0.34414196014404297, -0.3323511481285095, -0.3205603063106537, -0.30876949429512024, -0.2969786524772644, -0.28518784046173096, -0.2733969986438751, -0.2616061568260193, -0.24981532990932465, -0.23802450299263, -0.22623367607593536, -0.21444284915924072, -0.2026520073413849, -0.19086118042469025, -0.1790703535079956, -0.16727951169013977, -0.15548868477344513, -0.1436978578567505, -0.13190703094005585, -0.12011619657278061, -0.10832536220550537, -0.09653453528881073, -0.08474370837211609, -0.07295287400484085, -0.06116203963756561, -0.04937121272087097, -0.03758038207888603, -0.025789551436901093, -0.013998720794916153, -0.0022078901529312134, 0.009582940489053726, 0.021373771131038666, 0.033164605498313904, 0.044955432415008545, 0.056746263056993484, 0.06853709369897842, 0.08032792806625366, 0.0921187549829483, 0.10390958189964294, 0.11570041626691818, 0.12749125063419342, 0.13928207755088806, 0.1510729044675827, 0.16286373138427734, 0.17465457320213318, 0.18644540011882782, 0.19823622703552246, 0.2100270688533783, 0.22181789577007294, 0.23360872268676758, 0.24539954960346222, 0.25719037652015686, 0.2689812183380127, 0.28077203035354614, 0.292562872171402, 0.3043537139892578, 0.31614452600479126, 0.3279353678226471]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 4.0, 9.0, 2.0, 5.0, 8.0, 14.0, 11.0, 20.0, 19.0, 30.0, 34.0, 51.0, 42.0, 47.0, 55.0, 53.0, 55.0, 71.0, 59.0, 52.0, 60.0, 56.0, 46.0, 51.0, 35.0, 27.0, 26.0, 15.0, 14.0, 4.0, 7.0, 7.0, 7.0, 8.0, 4.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15987694263458252, -0.15445472300052643, -0.14903250336647034, -0.14361026883125305, -0.13818804919719696, -0.13276582956314087, -0.12734359502792358, -0.12192137539386749, -0.1164991557598114, -0.11107693612575531, -0.10565470904111862, -0.10023248195648193, -0.09481026232242584, -0.08938804268836975, -0.08396581560373306, -0.07854358851909637, -0.07312136888504028, -0.06769914925098419, -0.062276922166347504, -0.056854698807001114, -0.051432475447654724, -0.046010252088308334, -0.040588028728961945, -0.035165805369615555, -0.029743582010269165, -0.024321358650922775, -0.018899135291576385, -0.013476911932229996, -0.008054688572883606, -0.002632465213537216, 0.0027897581458091736, 0.008211981505155563, 0.01363418996334076, 0.01905641332268715, 0.02447863668203354, 0.02990086004137993, 0.03532308340072632, 0.04074530676007271, 0.0461675301194191, 0.05158975347876549, 0.05701197683811188, 0.06243420019745827, 0.06785642355680466, 0.07327865064144135, 0.07870087027549744, 0.08412308990955353, 0.08954531699419022, 0.0949675440788269, 0.100389763712883, 0.10581198334693909, 0.11123421043157578, 0.11665643751621246, 0.12207865715026855, 0.12750087678432465, 0.13292309641838074, 0.13834533095359802, 0.1437675505876541, 0.1491897702217102, 0.1546120047569275, 0.16003422439098358, 0.16545644402503967, 0.17087866365909576, 0.17630088329315186, 0.18172311782836914, 0.18714533746242523]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 7.0, 2.0, 8.0, 3.0, 9.0, 16.0, 19.0, 47.0, 56.0, 98.0, 120.0, 180.0, 252.0, 368.0, 561.0, 863.0, 1337.0, 2078.0, 3264.0, 5380.0, 9599.0, 18808.0, 43497.0, 138106.0, 501233.0, 212344.0, 58422.0, 23396.0, 11487.0, 6459.0, 3699.0, 2334.0, 1545.0, 970.0, 631.0, 425.0, 300.0, 194.0, 131.0, 101.0, 56.0, 53.0, 28.0, 26.0, 20.0, 9.0, 2.0, 7.0, 3.0, 6.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.1549072265625, -0.15030288696289062, -0.14569854736328125, -0.14109420776367188, -0.1364898681640625, -0.13188552856445312, -0.12728118896484375, -0.12267684936523438, -0.118072509765625, -0.11346817016601562, -0.10886383056640625, -0.10425949096679688, -0.0996551513671875, -0.09505081176757812, -0.09044647216796875, -0.08584213256835938, -0.08123779296875, -0.07663345336914062, -0.07202911376953125, -0.06742477416992188, -0.0628204345703125, -0.058216094970703125, -0.05361175537109375, -0.049007415771484375, -0.044403076171875, -0.039798736572265625, -0.03519439697265625, -0.030590057373046875, -0.0259857177734375, -0.021381378173828125, -0.01677703857421875, -0.012172698974609375, -0.007568359375, -0.002964019775390625, 0.00164031982421875, 0.006244659423828125, 0.0108489990234375, 0.015453338623046875, 0.02005767822265625, 0.024662017822265625, 0.029266357421875, 0.033870697021484375, 0.03847503662109375, 0.043079376220703125, 0.0476837158203125, 0.052288055419921875, 0.05689239501953125, 0.061496734619140625, 0.06610107421875, 0.07070541381835938, 0.07530975341796875, 0.07991409301757812, 0.0845184326171875, 0.08912277221679688, 0.09372711181640625, 0.09833145141601562, 0.102935791015625, 0.10754013061523438, 0.11214447021484375, 0.11674880981445312, 0.1213531494140625, 0.12595748901367188, 0.13056182861328125, 0.13516616821289062, 0.1397705078125]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 8.0, 13.0, 30.0, 40.0, 55.0, 67.0, 85.0, 103.0, 117.0, 115.0, 94.0, 86.0, 78.0, 40.0, 42.0, 12.0, 13.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.381591796875, -0.3613548278808594, -0.34111785888671875, -0.3208808898925781, -0.3006439208984375, -0.2804069519042969, -0.26016998291015625, -0.23993301391601562, -0.219696044921875, -0.19945907592773438, -0.17922210693359375, -0.15898513793945312, -0.1387481689453125, -0.11851119995117188, -0.09827423095703125, -0.07803726196289062, -0.05780029296875, -0.037563323974609375, -0.01732635498046875, 0.002910614013671875, 0.0231475830078125, 0.043384552001953125, 0.06362152099609375, 0.08385848999023438, 0.104095458984375, 0.12433242797851562, 0.14456939697265625, 0.16480636596679688, 0.1850433349609375, 0.20528030395507812, 0.22551727294921875, 0.24575424194335938, 0.2659912109375, 0.2862281799316406, 0.30646514892578125, 0.3267021179199219, 0.3469390869140625, 0.3671760559082031, 0.38741302490234375, 0.4076499938964844, 0.427886962890625, 0.4481239318847656, 0.46836090087890625, 0.4885978698730469, 0.5088348388671875, 0.5290718078613281, 0.5493087768554688, 0.5695457458496094, 0.58978271484375, 0.6100196838378906, 0.6302566528320312, 0.6504936218261719, 0.6707305908203125, 0.6909675598144531, 0.7112045288085938, 0.7314414978027344, 0.751678466796875, 0.7719154357910156, 0.7921524047851562, 0.8123893737792969, 0.8326263427734375, 0.8528633117675781, 0.8731002807617188, 0.8933372497558594, 0.91357421875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 7.0, 7.0, 17.0, 11.0, 19.0, 18.0, 26.0, 38.0, 46.0, 64.0, 85.0, 95.0, 131.0, 207.0, 379.0, 973.0, 4717.0, 42419.0, 906391.0, 83161.0, 7188.0, 1283.0, 423.0, 236.0, 129.0, 109.0, 85.0, 63.0, 40.0, 44.0, 28.0, 27.0, 19.0, 11.0, 14.0, 8.0, 12.0, 5.0, 4.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.458251953125, -0.4441986083984375, -0.430145263671875, -0.4160919189453125, -0.40203857421875, -0.3879852294921875, -0.373931884765625, -0.3598785400390625, -0.3458251953125, -0.3317718505859375, -0.317718505859375, -0.3036651611328125, -0.28961181640625, -0.2755584716796875, -0.261505126953125, -0.2474517822265625, -0.2333984375, -0.2193450927734375, -0.205291748046875, -0.1912384033203125, -0.17718505859375, -0.1631317138671875, -0.149078369140625, -0.1350250244140625, -0.1209716796875, -0.1069183349609375, -0.092864990234375, -0.0788116455078125, -0.06475830078125, -0.0507049560546875, -0.036651611328125, -0.0225982666015625, -0.008544921875, 0.0055084228515625, 0.019561767578125, 0.0336151123046875, 0.04766845703125, 0.0617218017578125, 0.075775146484375, 0.0898284912109375, 0.1038818359375, 0.1179351806640625, 0.131988525390625, 0.1460418701171875, 0.16009521484375, 0.1741485595703125, 0.188201904296875, 0.2022552490234375, 0.21630859375, 0.2303619384765625, 0.244415283203125, 0.2584686279296875, 0.27252197265625, 0.2865753173828125, 0.300628662109375, 0.3146820068359375, 0.3287353515625, 0.3427886962890625, 0.356842041015625, 0.3708953857421875, 0.38494873046875, 0.3990020751953125, 0.413055419921875, 0.4271087646484375, 0.441162109375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 4.0, 5.0, 10.0, 5.0, 12.0, 14.0, 16.0, 17.0, 26.0, 27.0, 33.0, 24.0, 42.0, 32.0, 43.0, 51.0, 48.0, 45.0, 51.0, 59.0, 51.0, 41.0, 50.0, 32.0, 41.0, 35.0, 29.0, 31.0, 18.0, 19.0, 18.0, 18.0, 13.0, 6.0, 10.0, 5.0, 6.0, 4.0, 5.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.27978515625, -0.2710380554199219, -0.26229095458984375, -0.2535438537597656, -0.2447967529296875, -0.23604965209960938, -0.22730255126953125, -0.21855545043945312, -0.209808349609375, -0.20106124877929688, -0.19231414794921875, -0.18356704711914062, -0.1748199462890625, -0.16607284545898438, -0.15732574462890625, -0.14857864379882812, -0.13983154296875, -0.13108444213867188, -0.12233734130859375, -0.11359024047851562, -0.1048431396484375, -0.09609603881835938, -0.08734893798828125, -0.07860183715820312, -0.069854736328125, -0.061107635498046875, -0.05236053466796875, -0.043613433837890625, -0.0348663330078125, -0.026119232177734375, -0.01737213134765625, -0.008625030517578125, 0.0001220703125, 0.008869171142578125, 0.01761627197265625, 0.026363372802734375, 0.0351104736328125, 0.043857574462890625, 0.05260467529296875, 0.061351776123046875, 0.070098876953125, 0.07884597778320312, 0.08759307861328125, 0.09634017944335938, 0.1050872802734375, 0.11383438110351562, 0.12258148193359375, 0.13132858276367188, 0.14007568359375, 0.14882278442382812, 0.15756988525390625, 0.16631698608398438, 0.1750640869140625, 0.18381118774414062, 0.19255828857421875, 0.20130538940429688, 0.210052490234375, 0.21879959106445312, 0.22754669189453125, 0.23629379272460938, 0.2450408935546875, 0.2537879943847656, 0.26253509521484375, 0.2712821960449219, 0.280029296875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 6.0, 15.0, 13.0, 16.0, 19.0, 42.0, 56.0, 110.0, 229.0, 523.0, 1566.0, 5718.0, 40438.0, 872883.0, 112799.0, 10338.0, 2406.0, 743.0, 265.0, 155.0, 85.0, 39.0, 33.0, 18.0, 9.0, 4.0, 5.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.1707763671875, -0.16598892211914062, -0.16120147705078125, -0.15641403198242188, -0.1516265869140625, -0.14683914184570312, -0.14205169677734375, -0.13726425170898438, -0.132476806640625, -0.12768936157226562, -0.12290191650390625, -0.11811447143554688, -0.1133270263671875, -0.10853958129882812, -0.10375213623046875, -0.09896469116210938, -0.09417724609375, -0.08938980102539062, -0.08460235595703125, -0.07981491088867188, -0.0750274658203125, -0.07024002075195312, -0.06545257568359375, -0.060665130615234375, -0.055877685546875, -0.051090240478515625, -0.04630279541015625, -0.041515350341796875, -0.0367279052734375, -0.031940460205078125, -0.02715301513671875, -0.022365570068359375, -0.017578125, -0.012790679931640625, -0.00800323486328125, -0.003215789794921875, 0.0015716552734375, 0.006359100341796875, 0.01114654541015625, 0.015933990478515625, 0.020721435546875, 0.025508880615234375, 0.03029632568359375, 0.035083770751953125, 0.0398712158203125, 0.044658660888671875, 0.04944610595703125, 0.054233551025390625, 0.05902099609375, 0.06380844116210938, 0.06859588623046875, 0.07338333129882812, 0.0781707763671875, 0.08295822143554688, 0.08774566650390625, 0.09253311157226562, 0.097320556640625, 0.10210800170898438, 0.10689544677734375, 0.11168289184570312, 0.1164703369140625, 0.12125778198242188, 0.12604522705078125, 0.13083267211914062, 0.1356201171875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 2.0, 3.0, 14.0, 10.0, 19.0, 31.0, 28.0, 48.0, 74.0, 88.0, 167.0, 170.0, 97.0, 64.0, 59.0, 25.0, 23.0, 25.0, 11.0, 10.0, 5.0, 7.0, 5.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5616416931152344e-05, -1.5128403902053833e-05, -1.4640390872955322e-05, -1.4152377843856812e-05, -1.36643648147583e-05, -1.317635178565979e-05, -1.268833875656128e-05, -1.2200325727462769e-05, -1.1712312698364258e-05, -1.1224299669265747e-05, -1.0736286640167236e-05, -1.0248273611068726e-05, -9.760260581970215e-06, -9.272247552871704e-06, -8.784234523773193e-06, -8.296221494674683e-06, -7.808208465576172e-06, -7.320195436477661e-06, -6.83218240737915e-06, -6.34416937828064e-06, -5.856156349182129e-06, -5.368143320083618e-06, -4.880130290985107e-06, -4.392117261886597e-06, -3.904104232788086e-06, -3.416091203689575e-06, -2.9280781745910645e-06, -2.4400651454925537e-06, -1.952052116394043e-06, -1.4640390872955322e-06, -9.760260581970215e-07, -4.880130290985107e-07, 0.0, 4.880130290985107e-07, 9.760260581970215e-07, 1.4640390872955322e-06, 1.952052116394043e-06, 2.4400651454925537e-06, 2.9280781745910645e-06, 3.416091203689575e-06, 3.904104232788086e-06, 4.392117261886597e-06, 4.880130290985107e-06, 5.368143320083618e-06, 5.856156349182129e-06, 6.34416937828064e-06, 6.83218240737915e-06, 7.320195436477661e-06, 7.808208465576172e-06, 8.296221494674683e-06, 8.784234523773193e-06, 9.272247552871704e-06, 9.760260581970215e-06, 1.0248273611068726e-05, 1.0736286640167236e-05, 1.1224299669265747e-05, 1.1712312698364258e-05, 1.2200325727462769e-05, 1.268833875656128e-05, 1.317635178565979e-05, 1.36643648147583e-05, 1.4152377843856812e-05, 1.4640390872955322e-05, 1.5128403902053833e-05, 1.5616416931152344e-05]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 6.0, 2.0, 8.0, 4.0, 7.0, 10.0, 17.0, 23.0, 30.0, 25.0, 54.0, 90.0, 150.0, 351.0, 1019.0, 3974.0, 26115.0, 905590.0, 100095.0, 8219.0, 1714.0, 549.0, 203.0, 88.0, 60.0, 38.0, 27.0, 17.0, 14.0, 14.0, 8.0, 5.0, 8.0, 8.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1922607421875, -0.18556594848632812, -0.17887115478515625, -0.17217636108398438, -0.1654815673828125, -0.15878677368164062, -0.15209197998046875, -0.14539718627929688, -0.138702392578125, -0.13200759887695312, -0.12531280517578125, -0.11861801147460938, -0.1119232177734375, -0.10522842407226562, -0.09853363037109375, -0.09183883666992188, -0.08514404296875, -0.07844924926757812, -0.07175445556640625, -0.06505966186523438, -0.0583648681640625, -0.051670074462890625, -0.04497528076171875, -0.038280487060546875, -0.031585693359375, -0.024890899658203125, -0.01819610595703125, -0.011501312255859375, -0.0048065185546875, 0.001888275146484375, 0.00858306884765625, 0.015277862548828125, 0.02197265625, 0.028667449951171875, 0.03536224365234375, 0.042057037353515625, 0.0487518310546875, 0.055446624755859375, 0.06214141845703125, 0.06883621215820312, 0.075531005859375, 0.08222579956054688, 0.08892059326171875, 0.09561538696289062, 0.1023101806640625, 0.10900497436523438, 0.11569976806640625, 0.12239456176757812, 0.12908935546875, 0.13578414916992188, 0.14247894287109375, 0.14917373657226562, 0.1558685302734375, 0.16256332397460938, 0.16925811767578125, 0.17595291137695312, 0.182647705078125, 0.18934249877929688, 0.19603729248046875, 0.20273208618164062, 0.2094268798828125, 0.21612167358398438, 0.22281646728515625, 0.22951126098632812, 0.2362060546875]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 2.0, 2.0, 4.0, 3.0, 5.0, 7.0, 6.0, 9.0, 9.0, 14.0, 12.0, 34.0, 48.0, 80.0, 123.0, 166.0, 156.0, 98.0, 60.0, 38.0, 28.0, 21.0, 17.0, 14.0, 7.0, 8.0, 7.0, 4.0, 6.0, 4.0, 0.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048309326171875, -0.046781063079833984, -0.04525279998779297, -0.04372453689575195, -0.04219627380371094, -0.04066801071166992, -0.039139747619628906, -0.03761148452758789, -0.036083221435546875, -0.03455495834350586, -0.033026695251464844, -0.03149843215942383, -0.029970169067382812, -0.028441905975341797, -0.02691364288330078, -0.025385379791259766, -0.02385711669921875, -0.022328853607177734, -0.02080059051513672, -0.019272327423095703, -0.017744064331054688, -0.016215801239013672, -0.014687538146972656, -0.01315927505493164, -0.011631011962890625, -0.01010274887084961, -0.008574485778808594, -0.007046222686767578, -0.0055179595947265625, -0.003989696502685547, -0.0024614334106445312, -0.0009331703186035156, 0.0005950927734375, 0.0021233558654785156, 0.0036516189575195312, 0.005179882049560547, 0.0067081451416015625, 0.008236408233642578, 0.009764671325683594, 0.01129293441772461, 0.012821197509765625, 0.01434946060180664, 0.015877723693847656, 0.017405986785888672, 0.018934249877929688, 0.020462512969970703, 0.02199077606201172, 0.023519039154052734, 0.02504730224609375, 0.026575565338134766, 0.02810382843017578, 0.029632091522216797, 0.031160354614257812, 0.03268861770629883, 0.034216880798339844, 0.03574514389038086, 0.037273406982421875, 0.03880167007446289, 0.040329933166503906, 0.04185819625854492, 0.04338645935058594, 0.04491472244262695, 0.04644298553466797, 0.047971248626708984, 0.04949951171875]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 6.0, 8.0, 18.0, 53.0, 95.0, 233.0, 290.0, 167.0, 77.0, 31.0, 15.0, 9.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5648092031478882, -1.530989170074463, -1.497169017791748, -1.4633489847183228, -1.429528832435608, -1.3957087993621826, -1.3618886470794678, -1.3280686140060425, -1.2942485809326172, -1.260428547859192, -1.226608395576477, -1.1927883625030518, -1.158968210220337, -1.1251481771469116, -1.0913281440734863, -1.0575079917907715, -1.0236878395080566, -0.9898677468299866, -0.9560476541519165, -0.9222276210784912, -0.8884075284004211, -0.8545874357223511, -0.820767343044281, -0.7869472503662109, -0.7531272172927856, -0.7193071246147156, -0.6854870319366455, -0.6516669988632202, -0.6178469061851501, -0.5840268135070801, -0.55020672082901, -0.5163866281509399, -0.48256659507751465, -0.4487465023994446, -0.4149264395236969, -0.38110634684562683, -0.34728628396987915, -0.3134661912918091, -0.279646098613739, -0.24582602083683014, -0.21200594305992126, -0.1781858652830124, -0.14436578750610352, -0.11054569482803345, -0.07672561705112457, -0.0429055392742157, -0.00908544659614563, 0.024734631180763245, 0.05855470895767212, 0.092374786734581, 0.12619486451148987, 0.16001495718955994, 0.1938350349664688, 0.22765511274337769, 0.26147520542144775, 0.2952952980995178, 0.3291153609752655, 0.36293545365333557, 0.39675551652908325, 0.4305756092071533, 0.4643957018852234, 0.49821576476097107, 0.5320358276367188, 0.5658559203147888, 0.5996760129928589]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 6.0, 8.0, 13.0, 24.0, 22.0, 43.0, 54.0, 44.0, 44.0, 74.0, 67.0, 67.0, 70.0, 63.0, 74.0, 58.0, 55.0, 51.0, 37.0, 29.0, 25.0, 18.0, 22.0, 11.0, 8.0, 6.0, 6.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.49517568945884705, -0.47226420044898987, -0.4493526816368103, -0.4264411926269531, -0.40352967381477356, -0.3806181848049164, -0.3577066659927368, -0.33479517698287964, -0.31188368797302246, -0.2889721989631653, -0.2660606801509857, -0.24314919114112854, -0.22023767232894897, -0.1973261833190918, -0.17441467940807343, -0.15150317549705505, -0.1285916566848755, -0.10568015277385712, -0.08276864886283875, -0.05985715240240097, -0.0369456484913826, -0.014034144580364227, 0.008877351880073547, 0.03178885579109192, 0.05470035970211029, 0.07761186361312866, 0.10052336752414703, 0.12343486398458481, 0.14634636044502258, 0.16925787925720215, 0.19216936826705933, 0.2150808721780777, 0.23799240589141846, 0.26090389490127563, 0.2838154137134552, 0.3067269027233124, 0.32963842153549194, 0.3525499105453491, 0.3754613995552063, 0.39837291836738586, 0.42128443717956543, 0.4441959261894226, 0.4671074450016022, 0.49001893401145935, 0.5129304528236389, 0.5358419418334961, 0.5587534308433533, 0.5816649198532104, 0.6045764684677124, 0.6274879574775696, 0.6503994464874268, 0.6733109951019287, 0.6962224841117859, 0.7191339731216431, 0.7420454621315002, 0.7649569511413574, 0.7878684401512146, 0.8107799291610718, 0.833691418170929, 0.8566029667854309, 0.8795144557952881, 0.9024259448051453, 0.9253374338150024, 0.9482489824295044, 0.9711604714393616]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 11.0, 7.0, 10.0, 14.0, 23.0, 25.0, 37.0, 45.0, 88.0, 129.0, 172.0, 248.0, 367.0, 560.0, 911.0, 1515.0, 2492.0, 4735.0, 9707.0, 30600.0, 250841.0, 2427804.0, 1311144.0, 115765.0, 20135.0, 7778.0, 3837.0, 1991.0, 1164.0, 712.0, 478.0, 314.0, 185.0, 128.0, 91.0, 59.0, 45.0, 27.0, 25.0, 16.0, 7.0, 10.0, 6.0, 11.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.2822265625, -0.2736320495605469, -0.26503753662109375, -0.2564430236816406, -0.2478485107421875, -0.23925399780273438, -0.23065948486328125, -0.22206497192382812, -0.213470458984375, -0.20487594604492188, -0.19628143310546875, -0.18768692016601562, -0.1790924072265625, -0.17049789428710938, -0.16190338134765625, -0.15330886840820312, -0.14471435546875, -0.13611984252929688, -0.12752532958984375, -0.11893081665039062, -0.1103363037109375, -0.10174179077148438, -0.09314727783203125, -0.08455276489257812, -0.075958251953125, -0.06736373901367188, -0.05876922607421875, -0.050174713134765625, -0.0415802001953125, -0.032985687255859375, -0.02439117431640625, -0.015796661376953125, -0.0072021484375, 0.001392364501953125, 0.00998687744140625, 0.018581390380859375, 0.0271759033203125, 0.035770416259765625, 0.04436492919921875, 0.052959442138671875, 0.061553955078125, 0.07014846801757812, 0.07874298095703125, 0.08733749389648438, 0.0959320068359375, 0.10452651977539062, 0.11312103271484375, 0.12171554565429688, 0.13031005859375, 0.13890457153320312, 0.14749908447265625, 0.15609359741210938, 0.1646881103515625, 0.17328262329101562, 0.18187713623046875, 0.19047164916992188, 0.199066162109375, 0.20766067504882812, 0.21625518798828125, 0.22484970092773438, 0.2334442138671875, 0.24203872680664062, 0.25063323974609375, 0.2592277526855469, 0.267822265625]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 6.0, 4.0, 5.0, 15.0, 8.0, 22.0, 14.0, 18.0, 36.0, 44.0, 49.0, 45.0, 44.0, 53.0, 56.0, 47.0, 62.0, 65.0, 47.0, 49.0, 51.0, 35.0, 39.0, 40.0, 26.0, 26.0, 23.0, 18.0, 15.0, 11.0, 10.0, 6.0, 9.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.2568359375, -0.2503662109375, -0.243896484375, -0.2374267578125, -0.23095703125, -0.2244873046875, -0.218017578125, -0.2115478515625, -0.205078125, -0.1986083984375, -0.192138671875, -0.1856689453125, -0.17919921875, -0.1727294921875, -0.166259765625, -0.1597900390625, -0.1533203125, -0.1468505859375, -0.140380859375, -0.1339111328125, -0.12744140625, -0.1209716796875, -0.114501953125, -0.1080322265625, -0.1015625, -0.0950927734375, -0.088623046875, -0.0821533203125, -0.07568359375, -0.0692138671875, -0.062744140625, -0.0562744140625, -0.0498046875, -0.0433349609375, -0.036865234375, -0.0303955078125, -0.02392578125, -0.0174560546875, -0.010986328125, -0.0045166015625, 0.001953125, 0.0084228515625, 0.014892578125, 0.0213623046875, 0.02783203125, 0.0343017578125, 0.040771484375, 0.0472412109375, 0.0537109375, 0.0601806640625, 0.066650390625, 0.0731201171875, 0.07958984375, 0.0860595703125, 0.092529296875, 0.0989990234375, 0.10546875, 0.1119384765625, 0.118408203125, 0.1248779296875, 0.13134765625, 0.1378173828125, 0.144287109375, 0.1507568359375, 0.1572265625]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 5.0, 3.0, 12.0, 13.0, 13.0, 16.0, 23.0, 28.0, 46.0, 62.0, 127.0, 305.0, 961.0, 5287.0, 94076.0, 4050887.0, 37992.0, 3259.0, 674.0, 225.0, 85.0, 62.0, 35.0, 20.0, 15.0, 7.0, 11.0, 9.0, 7.0, 6.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74169921875, -0.7187957763671875, -0.695892333984375, -0.6729888916015625, -0.65008544921875, -0.6271820068359375, -0.604278564453125, -0.5813751220703125, -0.5584716796875, -0.5355682373046875, -0.512664794921875, -0.4897613525390625, -0.46685791015625, -0.4439544677734375, -0.421051025390625, -0.3981475830078125, -0.375244140625, -0.3523406982421875, -0.329437255859375, -0.3065338134765625, -0.28363037109375, -0.2607269287109375, -0.237823486328125, -0.2149200439453125, -0.1920166015625, -0.1691131591796875, -0.146209716796875, -0.1233062744140625, -0.10040283203125, -0.0774993896484375, -0.054595947265625, -0.0316925048828125, -0.0087890625, 0.0141143798828125, 0.037017822265625, 0.0599212646484375, 0.08282470703125, 0.1057281494140625, 0.128631591796875, 0.1515350341796875, 0.1744384765625, 0.1973419189453125, 0.220245361328125, 0.2431488037109375, 0.26605224609375, 0.2889556884765625, 0.311859130859375, 0.3347625732421875, 0.357666015625, 0.3805694580078125, 0.403472900390625, 0.4263763427734375, 0.44927978515625, 0.4721832275390625, 0.495086669921875, 0.5179901123046875, 0.5408935546875, 0.5637969970703125, 0.586700439453125, 0.6096038818359375, 0.63250732421875, 0.6554107666015625, 0.678314208984375, 0.7012176513671875, 0.72412109375]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 5.0, 6.0, 8.0, 7.0, 14.0, 11.0, 17.0, 25.0, 47.0, 61.0, 99.0, 186.0, 338.0, 566.0, 898.0, 687.0, 468.0, 209.0, 142.0, 70.0, 42.0, 32.0, 33.0, 20.0, 12.0, 19.0, 11.0, 12.0, 5.0, 1.0, 9.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08184814453125, -0.07934188842773438, -0.07683563232421875, -0.07432937622070312, -0.0718231201171875, -0.06931686401367188, -0.06681060791015625, -0.06430435180664062, -0.061798095703125, -0.059291839599609375, -0.05678558349609375, -0.054279327392578125, -0.0517730712890625, -0.049266815185546875, -0.04676055908203125, -0.044254302978515625, -0.041748046875, -0.039241790771484375, -0.03673553466796875, -0.034229278564453125, -0.0317230224609375, -0.029216766357421875, -0.02671051025390625, -0.024204254150390625, -0.021697998046875, -0.019191741943359375, -0.01668548583984375, -0.014179229736328125, -0.0116729736328125, -0.009166717529296875, -0.00666046142578125, -0.004154205322265625, -0.00164794921875, 0.000858306884765625, 0.00336456298828125, 0.005870819091796875, 0.0083770751953125, 0.010883331298828125, 0.01338958740234375, 0.015895843505859375, 0.018402099609375, 0.020908355712890625, 0.02341461181640625, 0.025920867919921875, 0.0284271240234375, 0.030933380126953125, 0.03343963623046875, 0.035945892333984375, 0.0384521484375, 0.040958404541015625, 0.04346466064453125, 0.045970916748046875, 0.0484771728515625, 0.050983428955078125, 0.05348968505859375, 0.055995941162109375, 0.058502197265625, 0.061008453369140625, 0.06351470947265625, 0.06602096557617188, 0.0685272216796875, 0.07103347778320312, 0.07353973388671875, 0.07604598999023438, 0.07855224609375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 8.0, 5.0, 8.0, 16.0, 16.0, 15.0, 28.0, 50.0, 93.0, 134.0, 174.0, 158.0, 97.0, 75.0, 49.0, 28.0, 18.0, 9.0, 9.0, 9.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45745858550071716, -0.4438287913799286, -0.43019899725914, -0.41656923294067383, -0.40293943881988525, -0.3893096446990967, -0.3756798505783081, -0.36205005645751953, -0.34842029213905334, -0.33479049801826477, -0.3211607038974762, -0.30753093957901, -0.29390114545822144, -0.28027135133743286, -0.2666415572166443, -0.2530117630958557, -0.23938198387622833, -0.22575218975543976, -0.21212241053581238, -0.1984926164150238, -0.18486283719539642, -0.17123304307460785, -0.15760326385498047, -0.1439734697341919, -0.13034367561340332, -0.11671388894319534, -0.10308410227298737, -0.08945430815219879, -0.07582452893257141, -0.06219473481178284, -0.04856494814157486, -0.03493516147136688, -0.021305382251739502, -0.00767559465020895, 0.005954192951321602, 0.01958398148417473, 0.033213768154382706, 0.04684355854988098, 0.06047334522008896, 0.07410313189029694, 0.08773291856050491, 0.10136270523071289, 0.11499249190092087, 0.12862227857112885, 0.14225207269191742, 0.1558818519115448, 0.16951164603233337, 0.18314144015312195, 0.19677121937274933, 0.2104010134935379, 0.22403079271316528, 0.23766058683395386, 0.25129038095474243, 0.264920175075531, 0.2785499393939972, 0.29217973351478577, 0.30580952763557434, 0.3194393217563629, 0.3330691158771515, 0.3466988801956177, 0.36032867431640625, 0.3739584684371948, 0.3875882625579834, 0.401218056678772, 0.41484782099723816]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 9.0, 13.0, 9.0, 20.0, 16.0, 20.0, 18.0, 23.0, 33.0, 46.0, 35.0, 46.0, 59.0, 57.0, 39.0, 37.0, 47.0, 40.0, 44.0, 49.0, 54.0, 42.0, 35.0, 36.0, 29.0, 32.0, 26.0, 18.0, 18.0, 16.0, 9.0, 10.0, 4.0, 5.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.21785898506641388, -0.21156637370586395, -0.20527376234531403, -0.1989811509847641, -0.19268853962421417, -0.18639592826366425, -0.18010330200195312, -0.1738106906414032, -0.16751807928085327, -0.16122546792030334, -0.15493285655975342, -0.1486402451992035, -0.14234763383865356, -0.13605502247810364, -0.1297624111175537, -0.12346979230642319, -0.11717718839645386, -0.11088457703590393, -0.104591965675354, -0.09829935431480408, -0.09200674295425415, -0.08571413159370422, -0.0794215127825737, -0.07312890142202377, -0.06683629006147385, -0.06054367870092392, -0.05425106734037399, -0.04795845225453377, -0.04166584089398384, -0.035373229533433914, -0.02908061444759369, -0.022788003087043762, -0.01649537682533264, -0.01020276453346014, -0.003910152241587639, 0.002382460981607437, 0.008675072342157364, 0.01496768370270729, 0.021260298788547516, 0.027552910149097443, 0.03384552150964737, 0.040138132870197296, 0.04643074423074722, 0.05272335931658745, 0.059015970677137375, 0.0653085857629776, 0.07160119712352753, 0.07789380848407745, 0.08418641984462738, 0.09047903120517731, 0.09677164256572723, 0.10306425392627716, 0.10935686528682709, 0.11564947664737701, 0.12194209545850754, 0.12823471426963806, 0.134527325630188, 0.14081993699073792, 0.14711254835128784, 0.15340515971183777, 0.1596977710723877, 0.16599038243293762, 0.17228299379348755, 0.17857560515403748, 0.1848682165145874]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 6.0, 1.0, 3.0, 4.0, 4.0, 4.0, 5.0, 3.0, 7.0, 9.0, 28.0, 21.0, 38.0, 57.0, 64.0, 111.0, 196.0, 266.0, 501.0, 868.0, 1529.0, 2752.0, 5301.0, 12075.0, 41414.0, 328998.0, 560613.0, 64244.0, 15599.0, 6316.0, 3206.0, 1718.0, 1012.0, 612.0, 328.0, 211.0, 139.0, 92.0, 74.0, 35.0, 25.0, 19.0, 7.0, 8.0, 5.0, 4.0, 8.0, 7.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.08587646484375, -0.08328437805175781, -0.08069229125976562, -0.07810020446777344, -0.07550811767578125, -0.07291603088378906, -0.07032394409179688, -0.06773185729980469, -0.0651397705078125, -0.06254768371582031, -0.059955596923828125, -0.05736351013183594, -0.05477142333984375, -0.05217933654785156, -0.049587249755859375, -0.04699516296386719, -0.044403076171875, -0.04181098937988281, -0.039218902587890625, -0.03662681579589844, -0.03403472900390625, -0.03144264221191406, -0.028850555419921875, -0.026258468627929688, -0.0236663818359375, -0.021074295043945312, -0.018482208251953125, -0.015890121459960938, -0.01329803466796875, -0.010705947875976562, -0.008113861083984375, -0.0055217742919921875, -0.0029296875, -0.0003376007080078125, 0.002254486083984375, 0.0048465728759765625, 0.00743865966796875, 0.010030746459960938, 0.012622833251953125, 0.015214920043945312, 0.0178070068359375, 0.020399093627929688, 0.022991180419921875, 0.025583267211914062, 0.02817535400390625, 0.030767440795898438, 0.033359527587890625, 0.03595161437988281, 0.038543701171875, 0.04113578796386719, 0.043727874755859375, 0.04631996154785156, 0.04891204833984375, 0.05150413513183594, 0.054096221923828125, 0.05668830871582031, 0.0592803955078125, 0.06187248229980469, 0.06446456909179688, 0.06705665588378906, 0.06964874267578125, 0.07224082946777344, 0.07483291625976562, 0.07742500305175781, 0.08001708984375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 6.0, 4.0, 8.0, 11.0, 21.0, 17.0, 24.0, 30.0, 37.0, 44.0, 54.0, 58.0, 69.0, 62.0, 64.0, 66.0, 61.0, 64.0, 60.0, 62.0, 42.0, 38.0, 25.0, 28.0, 19.0, 12.0, 9.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1717529296875, -0.16596031188964844, -0.16016769409179688, -0.1543750762939453, -0.14858245849609375, -0.1427898406982422, -0.13699722290039062, -0.13120460510253906, -0.1254119873046875, -0.11961936950683594, -0.11382675170898438, -0.10803413391113281, -0.10224151611328125, -0.09644889831542969, -0.09065628051757812, -0.08486366271972656, -0.079071044921875, -0.07327842712402344, -0.06748580932617188, -0.06169319152832031, -0.05590057373046875, -0.05010795593261719, -0.044315338134765625, -0.03852272033691406, -0.0327301025390625, -0.026937484741210938, -0.021144866943359375, -0.015352249145507812, -0.00955963134765625, -0.0037670135498046875, 0.002025604248046875, 0.007818222045898438, 0.01361083984375, 0.019403457641601562, 0.025196075439453125, 0.030988693237304688, 0.03678131103515625, 0.04257392883300781, 0.048366546630859375, 0.05415916442871094, 0.0599517822265625, 0.06574440002441406, 0.07153701782226562, 0.07732963562011719, 0.08312225341796875, 0.08891487121582031, 0.09470748901367188, 0.10050010681152344, 0.106292724609375, 0.11208534240722656, 0.11787796020507812, 0.12367057800292969, 0.12946319580078125, 0.1352558135986328, 0.14104843139648438, 0.14684104919433594, 0.1526336669921875, 0.15842628479003906, 0.16421890258789062, 0.1700115203857422, 0.17580413818359375, 0.1815967559814453, 0.18738937377929688, 0.19318199157714844, 0.198974609375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 2.0, 5.0, 7.0, 15.0, 10.0, 26.0, 40.0, 56.0, 107.0, 233.0, 532.0, 1370.0, 4996.0, 25992.0, 579441.0, 408577.0, 20509.0, 4315.0, 1354.0, 478.0, 219.0, 94.0, 44.0, 32.0, 29.0, 16.0, 13.0, 4.0, 4.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.127685546875, -0.123809814453125, -0.11993408203125, -0.116058349609375, -0.1121826171875, -0.108306884765625, -0.10443115234375, -0.100555419921875, -0.0966796875, -0.092803955078125, -0.08892822265625, -0.085052490234375, -0.0811767578125, -0.077301025390625, -0.07342529296875, -0.069549560546875, -0.065673828125, -0.061798095703125, -0.05792236328125, -0.054046630859375, -0.0501708984375, -0.046295166015625, -0.04241943359375, -0.038543701171875, -0.03466796875, -0.030792236328125, -0.02691650390625, -0.023040771484375, -0.0191650390625, -0.015289306640625, -0.01141357421875, -0.007537841796875, -0.003662109375, 0.000213623046875, 0.00408935546875, 0.007965087890625, 0.0118408203125, 0.015716552734375, 0.01959228515625, 0.023468017578125, 0.02734375, 0.031219482421875, 0.03509521484375, 0.038970947265625, 0.0428466796875, 0.046722412109375, 0.05059814453125, 0.054473876953125, 0.058349609375, 0.062225341796875, 0.06610107421875, 0.069976806640625, 0.0738525390625, 0.077728271484375, 0.08160400390625, 0.085479736328125, 0.08935546875, 0.093231201171875, 0.09710693359375, 0.100982666015625, 0.1048583984375, 0.108734130859375, 0.11260986328125, 0.116485595703125, 0.120361328125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 3.0, 9.0, 5.0, 10.0, 14.0, 11.0, 17.0, 17.0, 20.0, 25.0, 31.0, 24.0, 32.0, 34.0, 30.0, 45.0, 40.0, 54.0, 43.0, 52.0, 36.0, 41.0, 40.0, 38.0, 40.0, 34.0, 32.0, 32.0, 29.0, 20.0, 24.0, 21.0, 18.0, 17.0, 11.0, 16.0, 8.0, 8.0, 4.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.274658203125, -0.26700592041015625, -0.2593536376953125, -0.25170135498046875, -0.244049072265625, -0.23639678955078125, -0.2287445068359375, -0.22109222412109375, -0.21343994140625, -0.20578765869140625, -0.1981353759765625, -0.19048309326171875, -0.182830810546875, -0.17517852783203125, -0.1675262451171875, -0.15987396240234375, -0.1522216796875, -0.14456939697265625, -0.1369171142578125, -0.12926483154296875, -0.121612548828125, -0.11396026611328125, -0.1063079833984375, -0.09865570068359375, -0.09100341796875, -0.08335113525390625, -0.0756988525390625, -0.06804656982421875, -0.060394287109375, -0.05274200439453125, -0.0450897216796875, -0.03743743896484375, -0.02978515625, -0.02213287353515625, -0.0144805908203125, -0.00682830810546875, 0.000823974609375, 0.00847625732421875, 0.0161285400390625, 0.02378082275390625, 0.03143310546875, 0.03908538818359375, 0.0467376708984375, 0.05438995361328125, 0.062042236328125, 0.06969451904296875, 0.0773468017578125, 0.08499908447265625, 0.0926513671875, 0.10030364990234375, 0.1079559326171875, 0.11560821533203125, 0.123260498046875, 0.13091278076171875, 0.1385650634765625, 0.14621734619140625, 0.15386962890625, 0.16152191162109375, 0.1691741943359375, 0.17682647705078125, 0.184478759765625, 0.19213104248046875, 0.1997833251953125, 0.20743560791015625, 0.215087890625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 6.0, 12.0, 15.0, 16.0, 26.0, 36.0, 54.0, 128.0, 256.0, 606.0, 1897.0, 8058.0, 63085.0, 756528.0, 195760.0, 17067.0, 3280.0, 983.0, 327.0, 178.0, 76.0, 61.0, 34.0, 22.0, 6.0, 15.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0298309326171875, -0.028826475143432617, -0.027822017669677734, -0.02681756019592285, -0.02581310272216797, -0.024808645248413086, -0.023804187774658203, -0.02279973030090332, -0.021795272827148438, -0.020790815353393555, -0.019786357879638672, -0.01878190040588379, -0.017777442932128906, -0.016772985458374023, -0.01576852798461914, -0.014764070510864258, -0.013759613037109375, -0.012755155563354492, -0.01175069808959961, -0.010746240615844727, -0.009741783142089844, -0.008737325668334961, -0.007732868194580078, -0.006728410720825195, -0.0057239532470703125, -0.00471949577331543, -0.003715038299560547, -0.002710580825805664, -0.0017061233520507812, -0.0007016658782958984, 0.0003027915954589844, 0.0013072490692138672, 0.00231170654296875, 0.003316164016723633, 0.004320621490478516, 0.0053250789642333984, 0.006329536437988281, 0.007333993911743164, 0.008338451385498047, 0.00934290885925293, 0.010347366333007812, 0.011351823806762695, 0.012356281280517578, 0.013360738754272461, 0.014365196228027344, 0.015369653701782227, 0.01637411117553711, 0.017378568649291992, 0.018383026123046875, 0.019387483596801758, 0.02039194107055664, 0.021396398544311523, 0.022400856018066406, 0.02340531349182129, 0.024409770965576172, 0.025414228439331055, 0.026418685913085938, 0.02742314338684082, 0.028427600860595703, 0.029432058334350586, 0.03043651580810547, 0.03144097328186035, 0.032445430755615234, 0.03344988822937012, 0.034454345703125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 6.0, 6.0, 11.0, 13.0, 34.0, 48.0, 68.0, 96.0, 154.0, 133.0, 117.0, 87.0, 87.0, 58.0, 29.0, 21.0, 14.0, 10.0, 9.0, 2.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8835067749023438e-05, -1.840386539697647e-05, -1.7972663044929504e-05, -1.7541460692882538e-05, -1.711025834083557e-05, -1.6679055988788605e-05, -1.6247853636741638e-05, -1.581665128469467e-05, -1.5385448932647705e-05, -1.4954246580600739e-05, -1.4523044228553772e-05, -1.4091841876506805e-05, -1.3660639524459839e-05, -1.3229437172412872e-05, -1.2798234820365906e-05, -1.236703246831894e-05, -1.1935830116271973e-05, -1.1504627764225006e-05, -1.107342541217804e-05, -1.0642223060131073e-05, -1.0211020708084106e-05, -9.77981835603714e-06, -9.348616003990173e-06, -8.917413651943207e-06, -8.48621129989624e-06, -8.055008947849274e-06, -7.623806595802307e-06, -7.1926042437553406e-06, -6.761401891708374e-06, -6.3301995396614075e-06, -5.898997187614441e-06, -5.467794835567474e-06, -5.036592483520508e-06, -4.605390131473541e-06, -4.174187779426575e-06, -3.742985427379608e-06, -3.3117830753326416e-06, -2.880580723285675e-06, -2.4493783712387085e-06, -2.018176019191742e-06, -1.5869736671447754e-06, -1.1557713150978088e-06, -7.245689630508423e-07, -2.9336661100387573e-07, 1.3783574104309082e-07, 5.690380930900574e-07, 1.000240445137024e-06, 1.4314427971839905e-06, 1.862645149230957e-06, 2.2938475012779236e-06, 2.72504985332489e-06, 3.1562522053718567e-06, 3.5874545574188232e-06, 4.01865690946579e-06, 4.449859261512756e-06, 4.881061613559723e-06, 5.3122639656066895e-06, 5.743466317653656e-06, 6.1746686697006226e-06, 6.605871021747589e-06, 7.037073373794556e-06, 7.468275725841522e-06, 7.899478077888489e-06, 8.330680429935455e-06, 8.761882781982422e-06]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 5.0, 6.0, 20.0, 25.0, 43.0, 77.0, 130.0, 265.0, 830.0, 3275.0, 22470.0, 565842.0, 433139.0, 18371.0, 2686.0, 713.0, 285.0, 142.0, 90.0, 55.0, 29.0, 23.0, 16.0, 8.0, 5.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.05169677734375, -0.050464630126953125, -0.04923248291015625, -0.048000335693359375, -0.0467681884765625, -0.045536041259765625, -0.04430389404296875, -0.043071746826171875, -0.041839599609375, -0.040607452392578125, -0.03937530517578125, -0.038143157958984375, -0.0369110107421875, -0.035678863525390625, -0.03444671630859375, -0.033214569091796875, -0.031982421875, -0.030750274658203125, -0.02951812744140625, -0.028285980224609375, -0.0270538330078125, -0.025821685791015625, -0.02458953857421875, -0.023357391357421875, -0.022125244140625, -0.020893096923828125, -0.01966094970703125, -0.018428802490234375, -0.0171966552734375, -0.015964508056640625, -0.01473236083984375, -0.013500213623046875, -0.01226806640625, -0.011035919189453125, -0.00980377197265625, -0.008571624755859375, -0.0073394775390625, -0.006107330322265625, -0.00487518310546875, -0.003643035888671875, -0.002410888671875, -0.001178741455078125, 5.340576171875e-05, 0.001285552978515625, 0.0025177001953125, 0.003749847412109375, 0.00498199462890625, 0.006214141845703125, 0.0074462890625, 0.008678436279296875, 0.00991058349609375, 0.011142730712890625, 0.0123748779296875, 0.013607025146484375, 0.01483917236328125, 0.016071319580078125, 0.017303466796875, 0.018535614013671875, 0.01976776123046875, 0.020999908447265625, 0.0222320556640625, 0.023464202880859375, 0.02469635009765625, 0.025928497314453125, 0.02716064453125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 4.0, 15.0, 12.0, 23.0, 30.0, 46.0, 63.0, 109.0, 151.0, 143.0, 122.0, 97.0, 66.0, 36.0, 27.0, 26.0, 16.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.005329132080078125, -0.005089461803436279, -0.004849791526794434, -0.004610121250152588, -0.004370450973510742, -0.0041307806968688965, -0.0038911104202270508, -0.003651440143585205, -0.0034117698669433594, -0.0031720995903015137, -0.002932429313659668, -0.0026927590370178223, -0.0024530887603759766, -0.002213418483734131, -0.001973748207092285, -0.0017340779304504395, -0.0014944076538085938, -0.001254737377166748, -0.0010150671005249023, -0.0007753968238830566, -0.0005357265472412109, -0.00029605627059936523, -5.638599395751953e-05, 0.00018328428268432617, 0.0004229545593261719, 0.0006626248359680176, 0.0009022951126098633, 0.001141965389251709, 0.0013816356658935547, 0.0016213059425354004, 0.001860976219177246, 0.002100646495819092, 0.0023403167724609375, 0.002579987049102783, 0.002819657325744629, 0.0030593276023864746, 0.0032989978790283203, 0.003538668155670166, 0.0037783384323120117, 0.004018008708953857, 0.004257678985595703, 0.004497349262237549, 0.0047370195388793945, 0.00497668981552124, 0.005216360092163086, 0.005456030368804932, 0.005695700645446777, 0.005935370922088623, 0.006175041198730469, 0.0064147114753723145, 0.00665438175201416, 0.006894052028656006, 0.0071337223052978516, 0.007373392581939697, 0.007613062858581543, 0.007852733135223389, 0.008092403411865234, 0.00833207368850708, 0.008571743965148926, 0.008811414241790771, 0.009051084518432617, 0.009290754795074463, 0.009530425071716309, 0.009770095348358154, 0.010009765625]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 6.0, 11.0, 18.0, 27.0, 58.0, 147.0, 282.0, 248.0, 123.0, 40.0, 29.0, 9.0, 8.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61208176612854, -0.5970747470855713, -0.5820677280426025, -0.5670607686042786, -0.5520537495613098, -0.5370467305183411, -0.5220397114753723, -0.5070327520370483, -0.4920257329940796, -0.47701871395111084, -0.4620117247104645, -0.4470047056674957, -0.43199771642684937, -0.4169906973838806, -0.40198370814323425, -0.3869766891002655, -0.37196969985961914, -0.3569626808166504, -0.34195569157600403, -0.3269486725330353, -0.3119416832923889, -0.29693466424942017, -0.2819276750087738, -0.26692065596580505, -0.2519136369228363, -0.23690663278102875, -0.2218996286392212, -0.20689262449741364, -0.19188562035560608, -0.17687860131263733, -0.16187161207199097, -0.14686459302902222, -0.13185760378837585, -0.1168505996465683, -0.10184359550476074, -0.08683659136295319, -0.07182958722114563, -0.05682257562875748, -0.04181557148694992, -0.026808567345142365, -0.011801563203334808, 0.0032054418697953224, 0.018212446942925453, 0.03321945294737816, 0.048226457089185715, 0.06323346495628357, 0.07824046909809113, 0.09324747323989868, 0.10825447738170624, 0.1232614815235138, 0.13826848566532135, 0.1532754898071289, 0.16828249394893646, 0.18328949809074402, 0.19829651713371277, 0.21330350637435913, 0.22831052541732788, 0.24331752955913544, 0.258324533700943, 0.27333155274391174, 0.2883385419845581, 0.30334556102752686, 0.3183525502681732, 0.33335956931114197, 0.34836655855178833]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 5.0, 6.0, 11.0, 11.0, 18.0, 18.0, 14.0, 29.0, 24.0, 43.0, 40.0, 43.0, 59.0, 63.0, 39.0, 58.0, 44.0, 45.0, 67.0, 52.0, 41.0, 43.0, 35.0, 38.0, 38.0, 29.0, 22.0, 15.0, 13.0, 16.0, 8.0, 1.0, 4.0, 7.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.16176283359527588, -0.15728718042373657, -0.15281152725219727, -0.14833585917949677, -0.14386020600795746, -0.13938455283641815, -0.13490888476371765, -0.13043323159217834, -0.12595757842063904, -0.12148192524909973, -0.11700626462697983, -0.11253060400485992, -0.10805495083332062, -0.10357929766178131, -0.09910363703966141, -0.0946279764175415, -0.0901523232460022, -0.08567667007446289, -0.08120100945234299, -0.07672534883022308, -0.07224969565868378, -0.06777404248714447, -0.06329838186502457, -0.05882272496819496, -0.054347068071365356, -0.04987141117453575, -0.045395754277706146, -0.04092009738087654, -0.036444440484046936, -0.03196878358721733, -0.027493126690387726, -0.02301746979355812, -0.018541812896728516, -0.01406615599989891, -0.009590499103069305, -0.0051148422062397, -0.0006391853094100952, 0.00383647158741951, 0.008312128484249115, 0.01278778538107872, 0.017263442277908325, 0.02173909917473793, 0.026214756071567535, 0.03069041296839714, 0.035166069865226746, 0.03964172676205635, 0.044117383658885956, 0.04859304055571556, 0.053068697452545166, 0.05754435434937477, 0.062020011246204376, 0.06649567186832428, 0.07097132503986359, 0.0754469782114029, 0.0799226388335228, 0.0843982994556427, 0.088873952627182, 0.09334960579872131, 0.09782526642084122, 0.10230092704296112, 0.10677658021450043, 0.11125223338603973, 0.11572789400815964, 0.12020355463027954, 0.12467920780181885]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 5.0, 12.0, 20.0, 49.0, 133.0, 355.0, 1129.0, 4424.0, 28807.0, 852978.0, 147007.0, 10483.0, 2203.0, 629.0, 178.0, 63.0, 28.0, 11.0, 5.0, 6.0, 5.0, 1.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34619140625, -0.33371734619140625, -0.3212432861328125, -0.30876922607421875, -0.296295166015625, -0.28382110595703125, -0.2713470458984375, -0.25887298583984375, -0.24639892578125, -0.23392486572265625, -0.2214508056640625, -0.20897674560546875, -0.196502685546875, -0.18402862548828125, -0.1715545654296875, -0.15908050537109375, -0.1466064453125, -0.13413238525390625, -0.1216583251953125, -0.10918426513671875, -0.096710205078125, -0.08423614501953125, -0.0717620849609375, -0.05928802490234375, -0.04681396484375, -0.03433990478515625, -0.0218658447265625, -0.00939178466796875, 0.003082275390625, 0.01555633544921875, 0.0280303955078125, 0.04050445556640625, 0.052978515625, 0.06545257568359375, 0.0779266357421875, 0.09040069580078125, 0.102874755859375, 0.11534881591796875, 0.1278228759765625, 0.14029693603515625, 0.15277099609375, 0.16524505615234375, 0.1777191162109375, 0.19019317626953125, 0.202667236328125, 0.21514129638671875, 0.2276153564453125, 0.24008941650390625, 0.2525634765625, 0.26503753662109375, 0.2775115966796875, 0.28998565673828125, 0.302459716796875, 0.31493377685546875, 0.3274078369140625, 0.33988189697265625, 0.35235595703125, 0.36483001708984375, 0.3773040771484375, 0.38977813720703125, 0.402252197265625, 0.41472625732421875, 0.4272003173828125, 0.43967437744140625, 0.4521484375]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 6.0, 7.0, 10.0, 12.0, 16.0, 13.0, 25.0, 28.0, 42.0, 49.0, 50.0, 52.0, 49.0, 51.0, 48.0, 67.0, 50.0, 58.0, 56.0, 51.0, 39.0, 39.0, 35.0, 33.0, 25.0, 26.0, 16.0, 12.0, 8.0, 10.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.34716796875, -0.3376007080078125, -0.328033447265625, -0.3184661865234375, -0.30889892578125, -0.2993316650390625, -0.289764404296875, -0.2801971435546875, -0.2706298828125, -0.2610626220703125, -0.251495361328125, -0.2419281005859375, -0.23236083984375, -0.2227935791015625, -0.213226318359375, -0.2036590576171875, -0.194091796875, -0.1845245361328125, -0.174957275390625, -0.1653900146484375, -0.15582275390625, -0.1462554931640625, -0.136688232421875, -0.1271209716796875, -0.1175537109375, -0.1079864501953125, -0.098419189453125, -0.0888519287109375, -0.07928466796875, -0.0697174072265625, -0.060150146484375, -0.0505828857421875, -0.041015625, -0.0314483642578125, -0.021881103515625, -0.0123138427734375, -0.00274658203125, 0.0068206787109375, 0.016387939453125, 0.0259552001953125, 0.0355224609375, 0.0450897216796875, 0.054656982421875, 0.0642242431640625, 0.07379150390625, 0.0833587646484375, 0.092926025390625, 0.1024932861328125, 0.112060546875, 0.1216278076171875, 0.131195068359375, 0.1407623291015625, 0.15032958984375, 0.1598968505859375, 0.169464111328125, 0.1790313720703125, 0.1885986328125, 0.1981658935546875, 0.207733154296875, 0.2173004150390625, 0.22686767578125, 0.2364349365234375, 0.246002197265625, 0.2555694580078125, 0.26513671875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 10.0, 7.0, 13.0, 15.0, 23.0, 35.0, 41.0, 71.0, 141.0, 252.0, 664.0, 2605.0, 19770.0, 857151.0, 157851.0, 7577.0, 1364.0, 440.0, 212.0, 103.0, 73.0, 34.0, 29.0, 17.0, 12.0, 10.0, 10.0, 5.0, 7.0, 3.0, 5.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.380615234375, -0.36864471435546875, -0.3566741943359375, -0.34470367431640625, -0.332733154296875, -0.32076263427734375, -0.3087921142578125, -0.29682159423828125, -0.28485107421875, -0.27288055419921875, -0.2609100341796875, -0.24893951416015625, -0.236968994140625, -0.22499847412109375, -0.2130279541015625, -0.20105743408203125, -0.1890869140625, -0.17711639404296875, -0.1651458740234375, -0.15317535400390625, -0.141204833984375, -0.12923431396484375, -0.1172637939453125, -0.10529327392578125, -0.09332275390625, -0.08135223388671875, -0.0693817138671875, -0.05741119384765625, -0.045440673828125, -0.03347015380859375, -0.0214996337890625, -0.00952911376953125, 0.00244140625, 0.01441192626953125, 0.0263824462890625, 0.03835296630859375, 0.050323486328125, 0.06229400634765625, 0.0742645263671875, 0.08623504638671875, 0.09820556640625, 0.11017608642578125, 0.1221466064453125, 0.13411712646484375, 0.146087646484375, 0.15805816650390625, 0.1700286865234375, 0.18199920654296875, 0.1939697265625, 0.20594024658203125, 0.2179107666015625, 0.22988128662109375, 0.241851806640625, 0.25382232666015625, 0.2657928466796875, 0.27776336669921875, 0.28973388671875, 0.30170440673828125, 0.3136749267578125, 0.32564544677734375, 0.337615966796875, 0.34958648681640625, 0.3615570068359375, 0.37352752685546875, 0.385498046875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 5.0, 6.0, 7.0, 13.0, 6.0, 15.0, 12.0, 17.0, 18.0, 16.0, 24.0, 21.0, 19.0, 34.0, 28.0, 45.0, 40.0, 47.0, 41.0, 52.0, 44.0, 37.0, 43.0, 52.0, 54.0, 32.0, 30.0, 43.0, 23.0, 30.0, 26.0, 22.0, 22.0, 17.0, 17.0, 8.0, 12.0, 8.0, 4.0, 3.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.283203125, -0.2745780944824219, -0.26595306396484375, -0.2573280334472656, -0.2487030029296875, -0.24007797241210938, -0.23145294189453125, -0.22282791137695312, -0.214202880859375, -0.20557785034179688, -0.19695281982421875, -0.18832778930664062, -0.1797027587890625, -0.17107772827148438, -0.16245269775390625, -0.15382766723632812, -0.14520263671875, -0.13657760620117188, -0.12795257568359375, -0.11932754516601562, -0.1107025146484375, -0.10207748413085938, -0.09345245361328125, -0.08482742309570312, -0.076202392578125, -0.06757736206054688, -0.05895233154296875, -0.050327301025390625, -0.0417022705078125, -0.033077239990234375, -0.02445220947265625, -0.015827178955078125, -0.0072021484375, 0.001422882080078125, 0.01004791259765625, 0.018672943115234375, 0.0272979736328125, 0.035923004150390625, 0.04454803466796875, 0.053173065185546875, 0.061798095703125, 0.07042312622070312, 0.07904815673828125, 0.08767318725585938, 0.0962982177734375, 0.10492324829101562, 0.11354827880859375, 0.12217330932617188, 0.13079833984375, 0.13942337036132812, 0.14804840087890625, 0.15667343139648438, 0.1652984619140625, 0.17392349243164062, 0.18254852294921875, 0.19117355346679688, 0.199798583984375, 0.20842361450195312, 0.21704864501953125, 0.22567367553710938, 0.2342987060546875, 0.24292373657226562, 0.25154876708984375, 0.2601737976074219, 0.268798828125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 5.0, 0.0, 6.0, 5.0, 8.0, 17.0, 24.0, 44.0, 70.0, 156.0, 389.0, 1668.0, 13327.0, 864536.0, 161288.0, 5514.0, 910.0, 277.0, 121.0, 56.0, 43.0, 20.0, 25.0, 13.0, 7.0, 7.0, 3.0, 5.0, 4.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1549072265625, -0.1503276824951172, -0.14574813842773438, -0.14116859436035156, -0.13658905029296875, -0.13200950622558594, -0.12742996215820312, -0.12285041809082031, -0.1182708740234375, -0.11369132995605469, -0.10911178588867188, -0.10453224182128906, -0.09995269775390625, -0.09537315368652344, -0.09079360961914062, -0.08621406555175781, -0.081634521484375, -0.07705497741699219, -0.07247543334960938, -0.06789588928222656, -0.06331634521484375, -0.05873680114746094, -0.054157257080078125, -0.04957771301269531, -0.0449981689453125, -0.04041862487792969, -0.035839080810546875, -0.03125953674316406, -0.02667999267578125, -0.022100448608398438, -0.017520904541015625, -0.012941360473632812, -0.00836181640625, -0.0037822723388671875, 0.000797271728515625, 0.0053768157958984375, 0.00995635986328125, 0.014535903930664062, 0.019115447998046875, 0.023694992065429688, 0.0282745361328125, 0.03285408020019531, 0.037433624267578125, 0.04201316833496094, 0.04659271240234375, 0.05117225646972656, 0.055751800537109375, 0.06033134460449219, 0.064910888671875, 0.06949043273925781, 0.07406997680664062, 0.07864952087402344, 0.08322906494140625, 0.08780860900878906, 0.09238815307617188, 0.09696769714355469, 0.1015472412109375, 0.10612678527832031, 0.11070632934570312, 0.11528587341308594, 0.11986541748046875, 0.12444496154785156, 0.12902450561523438, 0.1336040496826172, 0.13818359375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 14.0, 8.0, 9.0, 29.0, 39.0, 86.0, 182.0, 240.0, 171.0, 94.0, 45.0, 37.0, 11.0, 9.0, 9.0, 6.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6450881958007812e-05, -1.5875324606895447e-05, -1.529976725578308e-05, -1.4724209904670715e-05, -1.414865255355835e-05, -1.3573095202445984e-05, -1.2997537851333618e-05, -1.2421980500221252e-05, -1.1846423149108887e-05, -1.1270865797996521e-05, -1.0695308446884155e-05, -1.011975109577179e-05, -9.544193744659424e-06, -8.968636393547058e-06, -8.393079042434692e-06, -7.817521691322327e-06, -7.241964340209961e-06, -6.666406989097595e-06, -6.0908496379852295e-06, -5.515292286872864e-06, -4.939734935760498e-06, -4.364177584648132e-06, -3.7886202335357666e-06, -3.213062882423401e-06, -2.637505531311035e-06, -2.0619481801986694e-06, -1.4863908290863037e-06, -9.10833477973938e-07, -3.3527612686157227e-07, 2.4028122425079346e-07, 8.158385753631592e-07, 1.391395926475525e-06, 1.9669532775878906e-06, 2.5425106287002563e-06, 3.118067979812622e-06, 3.693625330924988e-06, 4.2691826820373535e-06, 4.844740033149719e-06, 5.420297384262085e-06, 5.995854735374451e-06, 6.571412086486816e-06, 7.146969437599182e-06, 7.722526788711548e-06, 8.298084139823914e-06, 8.87364149093628e-06, 9.449198842048645e-06, 1.002475619316101e-05, 1.0600313544273376e-05, 1.1175870895385742e-05, 1.1751428246498108e-05, 1.2326985597610474e-05, 1.290254294872284e-05, 1.3478100299835205e-05, 1.405365765094757e-05, 1.4629215002059937e-05, 1.5204772353172302e-05, 1.5780329704284668e-05, 1.6355887055397034e-05, 1.69314444065094e-05, 1.7507001757621765e-05, 1.808255910873413e-05, 1.8658116459846497e-05, 1.9233673810958862e-05, 1.9809231162071228e-05, 2.0384788513183594e-05]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 11.0, 12.0, 12.0, 28.0, 43.0, 79.0, 188.0, 493.0, 1999.0, 18207.0, 984630.0, 38874.0, 2808.0, 678.0, 257.0, 100.0, 53.0, 26.0, 17.0, 10.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.186279296875, -0.18056488037109375, -0.1748504638671875, -0.16913604736328125, -0.163421630859375, -0.15770721435546875, -0.1519927978515625, -0.14627838134765625, -0.14056396484375, -0.13484954833984375, -0.1291351318359375, -0.12342071533203125, -0.117706298828125, -0.11199188232421875, -0.1062774658203125, -0.10056304931640625, -0.0948486328125, -0.08913421630859375, -0.0834197998046875, -0.07770538330078125, -0.071990966796875, -0.06627655029296875, -0.0605621337890625, -0.05484771728515625, -0.04913330078125, -0.04341888427734375, -0.0377044677734375, -0.03199005126953125, -0.026275634765625, -0.02056121826171875, -0.0148468017578125, -0.00913238525390625, -0.00341796875, 0.00229644775390625, 0.0080108642578125, 0.01372528076171875, 0.019439697265625, 0.02515411376953125, 0.0308685302734375, 0.03658294677734375, 0.04229736328125, 0.04801177978515625, 0.0537261962890625, 0.05944061279296875, 0.065155029296875, 0.07086944580078125, 0.0765838623046875, 0.08229827880859375, 0.0880126953125, 0.09372711181640625, 0.0994415283203125, 0.10515594482421875, 0.110870361328125, 0.11658477783203125, 0.1222991943359375, 0.12801361083984375, 0.13372802734375, 0.13944244384765625, 0.1451568603515625, 0.15087127685546875, 0.156585693359375, 0.16230010986328125, 0.1680145263671875, 0.17372894287109375, 0.179443359375]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 7.0, 25.0, 15.0, 28.0, 32.0, 72.0, 75.0, 127.0, 145.0, 150.0, 97.0, 74.0, 40.0, 35.0, 15.0, 15.0, 11.0, 10.0, 10.0, 0.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.033843994140625, -0.03273963928222656, -0.031635284423828125, -0.030530929565429688, -0.02942657470703125, -0.028322219848632812, -0.027217864990234375, -0.026113510131835938, -0.0250091552734375, -0.023904800415039062, -0.022800445556640625, -0.021696090698242188, -0.02059173583984375, -0.019487380981445312, -0.018383026123046875, -0.017278671264648438, -0.01617431640625, -0.015069961547851562, -0.013965606689453125, -0.012861251831054688, -0.01175689697265625, -0.010652542114257812, -0.009548187255859375, -0.008443832397460938, -0.0073394775390625, -0.0062351226806640625, -0.005130767822265625, -0.0040264129638671875, -0.00292205810546875, -0.0018177032470703125, -0.000713348388671875, 0.0003910064697265625, 0.001495361328125, 0.0025997161865234375, 0.003704071044921875, 0.0048084259033203125, 0.00591278076171875, 0.0070171356201171875, 0.008121490478515625, 0.009225845336914062, 0.0103302001953125, 0.011434555053710938, 0.012538909912109375, 0.013643264770507812, 0.01474761962890625, 0.015851974487304688, 0.016956329345703125, 0.018060684204101562, 0.0191650390625, 0.020269393920898438, 0.021373748779296875, 0.022478103637695312, 0.02358245849609375, 0.024686813354492188, 0.025791168212890625, 0.026895523071289062, 0.0279998779296875, 0.029104232788085938, 0.030208587646484375, 0.03131294250488281, 0.03241729736328125, 0.03352165222167969, 0.034626007080078125, 0.03573036193847656, 0.036834716796875]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 13.0, 26.0, 48.0, 185.0, 362.0, 263.0, 58.0, 31.0, 15.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.0096774101257324, -1.9699279069900513, -1.9301785230636597, -1.8904290199279785, -1.850679636001587, -1.8109301328659058, -1.7711807489395142, -1.731431245803833, -1.6916818618774414, -1.6519323587417603, -1.6121829748153687, -1.5724334716796875, -1.532684087753296, -1.4929345846176147, -1.4531852006912231, -1.413435697555542, -1.3736863136291504, -1.3339368104934692, -1.2941874265670776, -1.2544379234313965, -1.2146885395050049, -1.1749390363693237, -1.1351896524429321, -1.095440149307251, -1.0556906461715698, -1.0159411430358887, -0.9761917591094971, -0.9364423155784607, -0.8966928720474243, -0.8569434285163879, -0.8171939849853516, -0.7774444818496704, -0.7376950979232788, -0.6979456543922424, -0.658196210861206, -0.6184467673301697, -0.5786973237991333, -0.5389478802680969, -0.49919840693473816, -0.4594489634037018, -0.4196995198726654, -0.37995007634162903, -0.34020063281059265, -0.3004511594772339, -0.2607017159461975, -0.22095228731632233, -0.18120282888412476, -0.14145338535308838, -0.101703941822052, -0.06195449456572533, -0.02220504730939865, 0.017544403672218323, 0.0572938472032547, 0.09704329073429108, 0.13679274916648865, 0.17654219269752502, 0.2162916362285614, 0.2560410797595978, 0.29579052329063416, 0.3355399966239929, 0.3752894401550293, 0.4150388836860657, 0.45478832721710205, 0.4945377707481384, 0.5342872142791748]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 6.0, 3.0, 3.0, 5.0, 9.0, 7.0, 11.0, 16.0, 23.0, 14.0, 16.0, 27.0, 35.0, 45.0, 43.0, 53.0, 43.0, 37.0, 54.0, 53.0, 46.0, 50.0, 47.0, 46.0, 45.0, 44.0, 46.0, 30.0, 26.0, 26.0, 20.0, 17.0, 19.0, 6.0, 8.0, 9.0, 11.0, 3.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.589144229888916, -0.5728532075881958, -0.5565621852874756, -0.5402711629867554, -0.5239801406860352, -0.5076891183853149, -0.49139806628227234, -0.4751070439815521, -0.4588159918785095, -0.4425249695777893, -0.4262339472770691, -0.4099429249763489, -0.3936518728733063, -0.37736085057258606, -0.36106982827186584, -0.34477880597114563, -0.3284877836704254, -0.3121967613697052, -0.295905739068985, -0.2796146869659424, -0.26332366466522217, -0.24703264236450195, -0.23074162006378174, -0.21445059776306152, -0.19815956056118011, -0.1818685382604599, -0.1655775010585785, -0.14928647875785828, -0.13299545645713806, -0.11670441925525665, -0.10041339695453644, -0.08412236720323563, -0.0678313672542572, -0.05154033750295639, -0.03524931147694588, -0.018958285450935364, -0.002667255699634552, 0.01362377405166626, 0.029914796352386475, 0.046205826103687286, 0.0624968558549881, 0.07878788560628891, 0.09507891535758972, 0.11136993765830994, 0.12766095995903015, 0.14395199716091156, 0.16024301946163177, 0.17653405666351318, 0.1928250789642334, 0.2091161012649536, 0.22540713846683502, 0.24169816076755524, 0.25798919796943665, 0.27428022027015686, 0.2905712425708771, 0.3068622648715973, 0.3231533169746399, 0.3394443392753601, 0.3557353615760803, 0.37202638387680054, 0.38831743597984314, 0.40460845828056335, 0.42089948058128357, 0.4371905028820038, 0.453481525182724]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 2.0, 8.0, 13.0, 11.0, 16.0, 18.0, 30.0, 40.0, 65.0, 95.0, 149.0, 294.0, 591.0, 1317.0, 3285.0, 12638.0, 258103.0, 3715774.0, 183419.0, 12653.0, 3276.0, 1239.0, 538.0, 280.0, 139.0, 91.0, 54.0, 44.0, 27.0, 20.0, 12.0, 11.0, 6.0, 6.0, 8.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3994140625, -0.3867225646972656, -0.37403106689453125, -0.3613395690917969, -0.3486480712890625, -0.3359565734863281, -0.32326507568359375, -0.3105735778808594, -0.297882080078125, -0.2851905822753906, -0.27249908447265625, -0.2598075866699219, -0.2471160888671875, -0.23442459106445312, -0.22173309326171875, -0.20904159545898438, -0.19635009765625, -0.18365859985351562, -0.17096710205078125, -0.15827560424804688, -0.1455841064453125, -0.13289260864257812, -0.12020111083984375, -0.10750961303710938, -0.094818115234375, -0.08212661743164062, -0.06943511962890625, -0.056743621826171875, -0.0440521240234375, -0.031360626220703125, -0.01866912841796875, -0.005977630615234375, 0.0067138671875, 0.019405364990234375, 0.03209686279296875, 0.044788360595703125, 0.0574798583984375, 0.07017135620117188, 0.08286285400390625, 0.09555435180664062, 0.108245849609375, 0.12093734741210938, 0.13362884521484375, 0.14632034301757812, 0.1590118408203125, 0.17170333862304688, 0.18439483642578125, 0.19708633422851562, 0.20977783203125, 0.22246932983398438, 0.23516082763671875, 0.24785232543945312, 0.2605438232421875, 0.2732353210449219, 0.28592681884765625, 0.2986183166503906, 0.311309814453125, 0.3240013122558594, 0.33669281005859375, 0.3493843078613281, 0.3620758056640625, 0.3747673034667969, 0.38745880126953125, 0.4001502990722656, 0.412841796875]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 8.0, 6.0, 9.0, 10.0, 15.0, 19.0, 27.0, 44.0, 59.0, 50.0, 61.0, 60.0, 77.0, 76.0, 62.0, 67.0, 56.0, 50.0, 43.0, 36.0, 38.0, 34.0, 23.0, 21.0, 20.0, 12.0, 8.0, 5.0, 2.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2509765625, -0.2445354461669922, -0.23809432983398438, -0.23165321350097656, -0.22521209716796875, -0.21877098083496094, -0.21232986450195312, -0.2058887481689453, -0.1994476318359375, -0.1930065155029297, -0.18656539916992188, -0.18012428283691406, -0.17368316650390625, -0.16724205017089844, -0.16080093383789062, -0.1543598175048828, -0.147918701171875, -0.1414775848388672, -0.13503646850585938, -0.12859535217285156, -0.12215423583984375, -0.11571311950683594, -0.10927200317382812, -0.10283088684082031, -0.0963897705078125, -0.08994865417480469, -0.08350753784179688, -0.07706642150878906, -0.07062530517578125, -0.06418418884277344, -0.057743072509765625, -0.05130195617675781, -0.04486083984375, -0.03841972351074219, -0.031978607177734375, -0.025537490844726562, -0.01909637451171875, -0.012655258178710938, -0.006214141845703125, 0.0002269744873046875, 0.0066680908203125, 0.013109207153320312, 0.019550323486328125, 0.025991439819335938, 0.03243255615234375, 0.03887367248535156, 0.045314788818359375, 0.05175590515136719, 0.058197021484375, 0.06463813781738281, 0.07107925415039062, 0.07752037048339844, 0.08396148681640625, 0.09040260314941406, 0.09684371948242188, 0.10328483581542969, 0.1097259521484375, 0.11616706848144531, 0.12260818481445312, 0.12904930114746094, 0.13549041748046875, 0.14193153381347656, 0.14837265014648438, 0.1548137664794922, 0.1612548828125]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 6.0, 11.0, 8.0, 17.0, 19.0, 27.0, 35.0, 73.0, 92.0, 176.0, 315.0, 795.0, 2139.0, 8750.0, 81714.0, 3982344.0, 103343.0, 10134.0, 2479.0, 911.0, 355.0, 200.0, 107.0, 59.0, 46.0, 30.0, 17.0, 13.0, 12.0, 8.0, 6.0, 2.0, 7.0, 3.0, 6.0, 4.0, 2.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.335693359375, -0.3220100402832031, -0.30832672119140625, -0.2946434020996094, -0.2809600830078125, -0.2672767639160156, -0.25359344482421875, -0.23991012573242188, -0.226226806640625, -0.21254348754882812, -0.19886016845703125, -0.18517684936523438, -0.1714935302734375, -0.15781021118164062, -0.14412689208984375, -0.13044357299804688, -0.11676025390625, -0.10307693481445312, -0.08939361572265625, -0.07571029663085938, -0.0620269775390625, -0.048343658447265625, -0.03466033935546875, -0.020977020263671875, -0.007293701171875, 0.006389617919921875, 0.02007293701171875, 0.033756256103515625, 0.0474395751953125, 0.061122894287109375, 0.07480621337890625, 0.08848953247070312, 0.1021728515625, 0.11585617065429688, 0.12953948974609375, 0.14322280883789062, 0.1569061279296875, 0.17058944702148438, 0.18427276611328125, 0.19795608520507812, 0.211639404296875, 0.22532272338867188, 0.23900604248046875, 0.2526893615722656, 0.2663726806640625, 0.2800559997558594, 0.29373931884765625, 0.3074226379394531, 0.32110595703125, 0.3347892761230469, 0.34847259521484375, 0.3621559143066406, 0.3758392333984375, 0.3895225524902344, 0.40320587158203125, 0.4168891906738281, 0.430572509765625, 0.4442558288574219, 0.45793914794921875, 0.4716224670410156, 0.4853057861328125, 0.4989891052246094, 0.5126724243164062, 0.5263557434082031, 0.5400390625]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 10.0, 12.0, 9.0, 16.0, 17.0, 32.0, 43.0, 73.0, 97.0, 252.0, 548.0, 1051.0, 944.0, 467.0, 208.0, 110.0, 41.0, 44.0, 18.0, 16.0, 13.0, 11.0, 6.0, 5.0, 6.0, 2.0, 9.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.10394287109375, -0.1013336181640625, -0.098724365234375, -0.0961151123046875, -0.093505859375, -0.0908966064453125, -0.088287353515625, -0.0856781005859375, -0.08306884765625, -0.0804595947265625, -0.077850341796875, -0.0752410888671875, -0.0726318359375, -0.0700225830078125, -0.067413330078125, -0.0648040771484375, -0.06219482421875, -0.0595855712890625, -0.056976318359375, -0.0543670654296875, -0.0517578125, -0.0491485595703125, -0.046539306640625, -0.0439300537109375, -0.04132080078125, -0.0387115478515625, -0.036102294921875, -0.0334930419921875, -0.0308837890625, -0.0282745361328125, -0.025665283203125, -0.0230560302734375, -0.02044677734375, -0.0178375244140625, -0.015228271484375, -0.0126190185546875, -0.010009765625, -0.0074005126953125, -0.004791259765625, -0.0021820068359375, 0.00042724609375, 0.0030364990234375, 0.005645751953125, 0.0082550048828125, 0.0108642578125, 0.0134735107421875, 0.016082763671875, 0.0186920166015625, 0.02130126953125, 0.0239105224609375, 0.026519775390625, 0.0291290283203125, 0.03173828125, 0.0343475341796875, 0.036956787109375, 0.0395660400390625, 0.04217529296875, 0.0447845458984375, 0.047393798828125, 0.0500030517578125, 0.0526123046875, 0.0552215576171875, 0.057830810546875, 0.0604400634765625, 0.06304931640625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 6.0, 15.0, 6.0, 20.0, 29.0, 44.0, 71.0, 108.0, 153.0, 163.0, 133.0, 82.0, 58.0, 36.0, 23.0, 14.0, 13.0, 9.0, 5.0, 0.0, 4.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34517422318458557, -0.3340901732444763, -0.32300612330436707, -0.3119220733642578, -0.30083802342414856, -0.2897539734840393, -0.27866995334625244, -0.2675859034061432, -0.25650185346603394, -0.24541780352592468, -0.23433375358581543, -0.22324970364570618, -0.21216566860675812, -0.20108161866664886, -0.1899975687265396, -0.17891353368759155, -0.1678294688463211, -0.15674541890621185, -0.1456613689661026, -0.13457733392715454, -0.12349328398704529, -0.11240923404693604, -0.10132518410682678, -0.09024114161729813, -0.07915709167718887, -0.06807304173707962, -0.056988999247550964, -0.04590494930744171, -0.03482090309262276, -0.023736856877803802, -0.01265280693769455, -0.0015687644481658936, 0.00951528549194336, 0.020599331706762314, 0.03168337792158127, 0.04276742786169052, 0.053851474076509476, 0.06493552029132843, 0.07601957023143768, 0.08710361272096634, 0.09818766266107559, 0.10927171260118484, 0.1203557550907135, 0.13143980503082275, 0.142523854970932, 0.15360790491104126, 0.1646919548511505, 0.17577598989009857, 0.18686003983020782, 0.19794408977031708, 0.20902813971042633, 0.2201121747493744, 0.23119622468948364, 0.2422802746295929, 0.25336432456970215, 0.2644483745098114, 0.27553242444992065, 0.2866164743900299, 0.29770052433013916, 0.3087845742702484, 0.31986862421035767, 0.33095264434814453, 0.34203672409057617, 0.35312074422836304, 0.3642047941684723]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 6.0, 4.0, 5.0, 6.0, 14.0, 13.0, 19.0, 15.0, 21.0, 30.0, 29.0, 28.0, 38.0, 43.0, 43.0, 50.0, 49.0, 49.0, 63.0, 53.0, 36.0, 42.0, 44.0, 38.0, 38.0, 37.0, 49.0, 22.0, 21.0, 17.0, 15.0, 15.0, 13.0, 9.0, 8.0, 7.0, 3.0, 2.0, 2.0, 5.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13359737396240234, -0.12859424948692322, -0.12359113991260529, -0.11858802288770676, -0.11358490586280823, -0.1085817888379097, -0.10357867181301117, -0.09857554733753204, -0.09357243776321411, -0.08856932073831558, -0.08356620371341705, -0.07856308668851852, -0.07355996966362, -0.06855685263872147, -0.06355373561382294, -0.05855061486363411, -0.05354749411344528, -0.04854437708854675, -0.043541260063648224, -0.038538143038749695, -0.033535026013851166, -0.028531907126307487, -0.02352878823876381, -0.01852567121386528, -0.013522554188966751, -0.008519437164068222, -0.0035163192078471184, 0.0014867987483739853, 0.006489915773272514, 0.011493032798171043, 0.01649615168571472, 0.02149926871061325, 0.02650238573551178, 0.03150550276041031, 0.03650861978530884, 0.04151173681020737, 0.046514853835105896, 0.051517970860004425, 0.05652109161019325, 0.06152420863509178, 0.06652732193470001, 0.07153043895959854, 0.07653355598449707, 0.0815366730093956, 0.08653979003429413, 0.09154290705919266, 0.09654602408409119, 0.10154914855957031, 0.10655226558446884, 0.11155538260936737, 0.1165584996342659, 0.12156161665916443, 0.12656474113464355, 0.1315678507089615, 0.1365709751844406, 0.14157408475875854, 0.14657720923423767, 0.1515803337097168, 0.15658344328403473, 0.16158656775951385, 0.1665896773338318, 0.1715928018093109, 0.17659591138362885, 0.18159903585910797, 0.1866021454334259]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 2.0, 3.0, 3.0, 9.0, 16.0, 26.0, 16.0, 32.0, 54.0, 72.0, 121.0, 158.0, 280.0, 370.0, 577.0, 960.0, 1505.0, 2486.0, 4158.0, 7141.0, 12684.0, 23665.0, 45449.0, 92795.0, 187339.0, 276092.0, 193389.0, 95801.0, 47411.0, 24291.0, 13069.0, 7334.0, 4352.0, 2562.0, 1590.0, 948.0, 622.0, 379.0, 274.0, 177.0, 123.0, 80.0, 49.0, 31.0, 25.0, 18.0, 6.0, 6.0, 2.0, 7.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.0172119140625, -0.016713380813598633, -0.016214847564697266, -0.0157163143157959, -0.015217781066894531, -0.014719247817993164, -0.014220714569091797, -0.01372218132019043, -0.013223648071289062, -0.012725114822387695, -0.012226581573486328, -0.011728048324584961, -0.011229515075683594, -0.010730981826782227, -0.01023244857788086, -0.009733915328979492, -0.009235382080078125, -0.008736848831176758, -0.00823831558227539, -0.0077397823333740234, -0.007241249084472656, -0.006742715835571289, -0.006244182586669922, -0.005745649337768555, -0.0052471160888671875, -0.00474858283996582, -0.004250049591064453, -0.003751516342163086, -0.0032529830932617188, -0.0027544498443603516, -0.0022559165954589844, -0.0017573833465576172, -0.00125885009765625, -0.0007603168487548828, -0.0002617835998535156, 0.00023674964904785156, 0.0007352828979492188, 0.001233816146850586, 0.0017323493957519531, 0.0022308826446533203, 0.0027294158935546875, 0.0032279491424560547, 0.003726482391357422, 0.004225015640258789, 0.004723548889160156, 0.0052220821380615234, 0.005720615386962891, 0.006219148635864258, 0.006717681884765625, 0.007216215133666992, 0.007714748382568359, 0.008213281631469727, 0.008711814880371094, 0.009210348129272461, 0.009708881378173828, 0.010207414627075195, 0.010705947875976562, 0.01120448112487793, 0.011703014373779297, 0.012201547622680664, 0.012700080871582031, 0.013198614120483398, 0.013697147369384766, 0.014195680618286133, 0.0146942138671875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 1.0, 3.0, 8.0, 8.0, 15.0, 14.0, 19.0, 17.0, 34.0, 23.0, 39.0, 42.0, 47.0, 67.0, 47.0, 63.0, 64.0, 63.0, 40.0, 55.0, 53.0, 46.0, 39.0, 38.0, 40.0, 28.0, 21.0, 13.0, 15.0, 7.0, 5.0, 7.0, 5.0, 4.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1241455078125, -0.12025260925292969, -0.11635971069335938, -0.11246681213378906, -0.10857391357421875, -0.10468101501464844, -0.10078811645507812, -0.09689521789550781, -0.0930023193359375, -0.08910942077636719, -0.08521652221679688, -0.08132362365722656, -0.07743072509765625, -0.07353782653808594, -0.06964492797851562, -0.06575202941894531, -0.061859130859375, -0.05796623229980469, -0.054073333740234375, -0.05018043518066406, -0.04628753662109375, -0.04239463806152344, -0.038501739501953125, -0.03460884094238281, -0.0307159423828125, -0.026823043823242188, -0.022930145263671875, -0.019037246704101562, -0.01514434814453125, -0.011251449584960938, -0.007358551025390625, -0.0034656524658203125, 0.00042724609375, 0.0043201446533203125, 0.008213043212890625, 0.012105941772460938, 0.01599884033203125, 0.019891738891601562, 0.023784637451171875, 0.027677536010742188, 0.0315704345703125, 0.03546333312988281, 0.039356231689453125, 0.04324913024902344, 0.04714202880859375, 0.05103492736816406, 0.054927825927734375, 0.05882072448730469, 0.062713623046875, 0.06660652160644531, 0.07049942016601562, 0.07439231872558594, 0.07828521728515625, 0.08217811584472656, 0.08607101440429688, 0.08996391296386719, 0.0938568115234375, 0.09774971008300781, 0.10164260864257812, 0.10553550720214844, 0.10942840576171875, 0.11332130432128906, 0.11721420288085938, 0.12110710144042969, 0.125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 9.0, 8.0, 12.0, 39.0, 59.0, 119.0, 295.0, 802.0, 2382.0, 9289.0, 48791.0, 370933.0, 525127.0, 72899.0, 12815.0, 3135.0, 1064.0, 406.0, 171.0, 88.0, 34.0, 19.0, 11.0, 6.0, 8.0, 10.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.048065185546875, -0.046613216400146484, -0.04516124725341797, -0.04370927810668945, -0.04225730895996094, -0.04080533981323242, -0.039353370666503906, -0.03790140151977539, -0.036449432373046875, -0.03499746322631836, -0.033545494079589844, -0.03209352493286133, -0.030641555786132812, -0.029189586639404297, -0.02773761749267578, -0.026285648345947266, -0.02483367919921875, -0.023381710052490234, -0.02192974090576172, -0.020477771759033203, -0.019025802612304688, -0.017573833465576172, -0.016121864318847656, -0.01466989517211914, -0.013217926025390625, -0.01176595687866211, -0.010313987731933594, -0.008862018585205078, -0.0074100494384765625, -0.005958080291748047, -0.004506111145019531, -0.0030541419982910156, -0.0016021728515625, -0.00015020370483398438, 0.0013017654418945312, 0.002753734588623047, 0.0042057037353515625, 0.005657672882080078, 0.007109642028808594, 0.00856161117553711, 0.010013580322265625, 0.01146554946899414, 0.012917518615722656, 0.014369487762451172, 0.015821456909179688, 0.017273426055908203, 0.01872539520263672, 0.020177364349365234, 0.02162933349609375, 0.023081302642822266, 0.02453327178955078, 0.025985240936279297, 0.027437210083007812, 0.028889179229736328, 0.030341148376464844, 0.03179311752319336, 0.033245086669921875, 0.03469705581665039, 0.036149024963378906, 0.03760099411010742, 0.03905296325683594, 0.04050493240356445, 0.04195690155029297, 0.043408870697021484, 0.04486083984375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 5.0, 4.0, 3.0, 3.0, 7.0, 1.0, 8.0, 5.0, 10.0, 14.0, 13.0, 22.0, 20.0, 25.0, 27.0, 23.0, 36.0, 43.0, 38.0, 40.0, 65.0, 46.0, 60.0, 47.0, 54.0, 44.0, 54.0, 31.0, 45.0, 35.0, 36.0, 29.0, 22.0, 21.0, 16.0, 22.0, 5.0, 6.0, 8.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1990966796875, -0.19237327575683594, -0.18564987182617188, -0.1789264678955078, -0.17220306396484375, -0.1654796600341797, -0.15875625610351562, -0.15203285217285156, -0.1453094482421875, -0.13858604431152344, -0.13186264038085938, -0.1251392364501953, -0.11841583251953125, -0.11169242858886719, -0.10496902465820312, -0.09824562072753906, -0.091522216796875, -0.08479881286621094, -0.07807540893554688, -0.07135200500488281, -0.06462860107421875, -0.05790519714355469, -0.051181793212890625, -0.04445838928222656, -0.0377349853515625, -0.031011581420898438, -0.024288177490234375, -0.017564773559570312, -0.01084136962890625, -0.0041179656982421875, 0.002605438232421875, 0.009328842163085938, 0.01605224609375, 0.022775650024414062, 0.029499053955078125, 0.03622245788574219, 0.04294586181640625, 0.04966926574707031, 0.056392669677734375, 0.06311607360839844, 0.0698394775390625, 0.07656288146972656, 0.08328628540039062, 0.09000968933105469, 0.09673309326171875, 0.10345649719238281, 0.11017990112304688, 0.11690330505371094, 0.123626708984375, 0.13035011291503906, 0.13707351684570312, 0.1437969207763672, 0.15052032470703125, 0.1572437286376953, 0.16396713256835938, 0.17069053649902344, 0.1774139404296875, 0.18413734436035156, 0.19086074829101562, 0.1975841522216797, 0.20430755615234375, 0.2110309600830078, 0.21775436401367188, 0.22447776794433594, 0.231201171875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 4.0, 5.0, 8.0, 21.0, 13.0, 26.0, 44.0, 55.0, 90.0, 124.0, 225.0, 347.0, 592.0, 1171.0, 2365.0, 5748.0, 16824.0, 70059.0, 393476.0, 446017.0, 80936.0, 18908.0, 6106.0, 2525.0, 1237.0, 642.0, 345.0, 228.0, 132.0, 80.0, 68.0, 40.0, 18.0, 23.0, 16.0, 10.0, 10.0, 5.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.01029205322265625, -0.009960532188415527, -0.009629011154174805, -0.009297490119934082, -0.00896596908569336, -0.008634448051452637, -0.008302927017211914, -0.007971405982971191, -0.007639884948730469, -0.007308363914489746, -0.0069768428802490234, -0.006645321846008301, -0.006313800811767578, -0.0059822797775268555, -0.005650758743286133, -0.00531923770904541, -0.0049877166748046875, -0.004656195640563965, -0.004324674606323242, -0.0039931535720825195, -0.003661632537841797, -0.0033301115036010742, -0.0029985904693603516, -0.002667069435119629, -0.0023355484008789062, -0.0020040273666381836, -0.001672506332397461, -0.0013409852981567383, -0.0010094642639160156, -0.000677943229675293, -0.0003464221954345703, -1.4901161193847656e-05, 0.000316619873046875, 0.0006481409072875977, 0.0009796619415283203, 0.001311182975769043, 0.0016427040100097656, 0.0019742250442504883, 0.002305746078491211, 0.0026372671127319336, 0.0029687881469726562, 0.003300309181213379, 0.0036318302154541016, 0.003963351249694824, 0.004294872283935547, 0.0046263933181762695, 0.004957914352416992, 0.005289435386657715, 0.0056209564208984375, 0.00595247745513916, 0.006283998489379883, 0.0066155195236206055, 0.006947040557861328, 0.007278561592102051, 0.0076100826263427734, 0.007941603660583496, 0.008273124694824219, 0.008604645729064941, 0.008936166763305664, 0.009267687797546387, 0.00959920883178711, 0.009930729866027832, 0.010262250900268555, 0.010593771934509277, 0.01092529296875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 4.0, 3.0, 10.0, 4.0, 7.0, 6.0, 13.0, 7.0, 23.0, 26.0, 23.0, 55.0, 37.0, 58.0, 61.0, 80.0, 83.0, 48.0, 73.0, 77.0, 61.0, 52.0, 52.0, 43.0, 17.0, 25.0, 19.0, 11.0, 11.0, 7.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.635883331298828e-06, -3.4654513001441956e-06, -3.295019268989563e-06, -3.1245872378349304e-06, -2.954155206680298e-06, -2.7837231755256653e-06, -2.6132911443710327e-06, -2.4428591132164e-06, -2.2724270820617676e-06, -2.101995050907135e-06, -1.9315630197525024e-06, -1.7611309885978699e-06, -1.5906989574432373e-06, -1.4202669262886047e-06, -1.2498348951339722e-06, -1.0794028639793396e-06, -9.08970832824707e-07, -7.385388016700745e-07, -5.681067705154419e-07, -3.976747393608093e-07, -2.2724270820617676e-07, -5.681067705154419e-08, 1.1362135410308838e-07, 2.8405338525772095e-07, 4.544854164123535e-07, 6.249174475669861e-07, 7.953494787216187e-07, 9.657815098762512e-07, 1.1362135410308838e-06, 1.3066455721855164e-06, 1.477077603340149e-06, 1.6475096344947815e-06, 1.817941665649414e-06, 1.9883736968040466e-06, 2.158805727958679e-06, 2.3292377591133118e-06, 2.4996697902679443e-06, 2.670101821422577e-06, 2.8405338525772095e-06, 3.010965883731842e-06, 3.1813979148864746e-06, 3.351829946041107e-06, 3.5222619771957397e-06, 3.6926940083503723e-06, 3.863126039505005e-06, 4.0335580706596375e-06, 4.20399010181427e-06, 4.374422132968903e-06, 4.544854164123535e-06, 4.715286195278168e-06, 4.8857182264328e-06, 5.056150257587433e-06, 5.2265822887420654e-06, 5.397014319896698e-06, 5.5674463510513306e-06, 5.737878382205963e-06, 5.908310413360596e-06, 6.078742444515228e-06, 6.249174475669861e-06, 6.419606506824493e-06, 6.590038537979126e-06, 6.7604705691337585e-06, 6.930902600288391e-06, 7.101334631443024e-06, 7.271766662597656e-06]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 6.0, 7.0, 2.0, 8.0, 7.0, 15.0, 15.0, 25.0, 33.0, 35.0, 57.0, 80.0, 109.0, 178.0, 234.0, 445.0, 826.0, 1583.0, 4112.0, 11775.0, 40542.0, 171836.0, 504253.0, 233566.0, 53747.0, 15336.0, 5321.0, 2059.0, 934.0, 551.0, 304.0, 172.0, 129.0, 72.0, 38.0, 36.0, 33.0, 17.0, 17.0, 8.0, 11.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00911712646484375, -0.00882863998413086, -0.008540153503417969, -0.008251667022705078, -0.007963180541992188, -0.007674694061279297, -0.007386207580566406, -0.007097721099853516, -0.006809234619140625, -0.006520748138427734, -0.006232261657714844, -0.005943775177001953, -0.0056552886962890625, -0.005366802215576172, -0.005078315734863281, -0.004789829254150391, -0.0045013427734375, -0.004212856292724609, -0.003924369812011719, -0.003635883331298828, -0.0033473968505859375, -0.003058910369873047, -0.0027704238891601562, -0.0024819374084472656, -0.002193450927734375, -0.0019049644470214844, -0.0016164779663085938, -0.0013279914855957031, -0.0010395050048828125, -0.0007510185241699219, -0.00046253204345703125, -0.00017404556274414062, 0.00011444091796875, 0.0004029273986816406, 0.0006914138793945312, 0.0009799003601074219, 0.0012683868408203125, 0.0015568733215332031, 0.0018453598022460938, 0.0021338462829589844, 0.002422332763671875, 0.0027108192443847656, 0.0029993057250976562, 0.003287792205810547, 0.0035762786865234375, 0.003864765167236328, 0.004153251647949219, 0.004441738128662109, 0.004730224609375, 0.005018711090087891, 0.005307197570800781, 0.005595684051513672, 0.0058841705322265625, 0.006172657012939453, 0.006461143493652344, 0.006749629974365234, 0.007038116455078125, 0.007326602935791016, 0.007615089416503906, 0.007903575897216797, 0.008192062377929688, 0.008480548858642578, 0.008769035339355469, 0.00905752182006836, 0.00934600830078125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 6.0, 2.0, 1.0, 6.0, 1.0, 3.0, 11.0, 18.0, 16.0, 17.0, 19.0, 25.0, 28.0, 37.0, 33.0, 45.0, 46.0, 53.0, 55.0, 62.0, 53.0, 65.0, 61.0, 56.0, 45.0, 34.0, 31.0, 26.0, 24.0, 27.0, 21.0, 16.0, 5.0, 12.0, 10.0, 9.0, 6.0, 2.0, 2.0, 2.0, 4.0, 7.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0017490386962890625, -0.0016888082027435303, -0.001628577709197998, -0.0015683472156524658, -0.0015081167221069336, -0.0014478862285614014, -0.0013876557350158691, -0.001327425241470337, -0.0012671947479248047, -0.0012069642543792725, -0.0011467337608337402, -0.001086503267288208, -0.0010262727737426758, -0.0009660422801971436, -0.0009058117866516113, -0.0008455812931060791, -0.0007853507995605469, -0.0007251203060150146, -0.0006648898124694824, -0.0006046593189239502, -0.000544428825378418, -0.00048419833183288574, -0.0004239678382873535, -0.0003637373447418213, -0.00030350685119628906, -0.00024327635765075684, -0.0001830458641052246, -0.00012281537055969238, -6.258487701416016e-05, -2.3543834686279297e-06, 5.78761100769043e-05, 0.00011810660362243652, 0.00017833709716796875, 0.00023856759071350098, 0.0002987980842590332, 0.00035902857780456543, 0.00041925907135009766, 0.0004794895648956299, 0.0005397200584411621, 0.0005999505519866943, 0.0006601810455322266, 0.0007204115390777588, 0.000780642032623291, 0.0008408725261688232, 0.0009011030197143555, 0.0009613335132598877, 0.00102156400680542, 0.0010817945003509521, 0.0011420249938964844, 0.0012022554874420166, 0.0012624859809875488, 0.001322716474533081, 0.0013829469680786133, 0.0014431774616241455, 0.0015034079551696777, 0.00156363844871521, 0.0016238689422607422, 0.0016840994358062744, 0.0017443299293518066, 0.0018045604228973389, 0.001864790916442871, 0.0019250214099884033, 0.0019852519035339355, 0.0020454823970794678, 0.002105712890625]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 8.0, 24.0, 31.0, 70.0, 136.0, 264.0, 222.0, 115.0, 63.0, 22.0, 19.0, 8.0, 5.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3553064465522766, -0.34480053186416626, -0.3342946171760559, -0.32378873229026794, -0.3132828176021576, -0.30277690291404724, -0.2922710180282593, -0.2817651033401489, -0.2712591886520386, -0.2607532739639282, -0.25024735927581787, -0.2397414743900299, -0.22923555970191956, -0.2187296450138092, -0.20822374522686005, -0.1977178454399109, -0.18721193075180054, -0.17670601606369019, -0.16620011627674103, -0.15569421648979187, -0.14518830180168152, -0.13468238711357117, -0.12417648732662201, -0.11367058008909225, -0.1031646728515625, -0.09265876561403275, -0.08215285837650299, -0.07164695113897324, -0.06114104390144348, -0.05063513666391373, -0.04012922942638397, -0.029623322188854218, -0.019117414951324463, -0.008611507713794708, 0.0018943995237350464, 0.012400306761264801, 0.022906213998794556, 0.03341212123632431, 0.043918028473854065, 0.05442393571138382, 0.06492984294891357, 0.07543575018644333, 0.08594165742397308, 0.09644756466150284, 0.10695347189903259, 0.11745937913656235, 0.1279652863740921, 0.13847118616104126, 0.1489771008491516, 0.15948301553726196, 0.16998891532421112, 0.18049481511116028, 0.19100072979927063, 0.20150664448738098, 0.21201254427433014, 0.2225184440612793, 0.23302435874938965, 0.2435302734375, 0.25403618812561035, 0.2645420730113983, 0.27504798769950867, 0.285553902387619, 0.296059787273407, 0.30656570196151733, 0.3170716166496277]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 6.0, 2.0, 1.0, 7.0, 10.0, 12.0, 18.0, 14.0, 17.0, 21.0, 28.0, 36.0, 38.0, 42.0, 50.0, 50.0, 49.0, 62.0, 63.0, 56.0, 35.0, 44.0, 54.0, 40.0, 42.0, 37.0, 41.0, 25.0, 24.0, 9.0, 19.0, 13.0, 7.0, 7.0, 6.0, 4.0, 6.0, 2.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10806149989366531, -0.10454869270324707, -0.10103588551282883, -0.09752307832241058, -0.09401026368141174, -0.0904974564909935, -0.08698464930057526, -0.08347184211015701, -0.07995903491973877, -0.07644622772932053, -0.07293342053890228, -0.06942060589790344, -0.0659077987074852, -0.062394991517066956, -0.05888218432664871, -0.05536937713623047, -0.05185656622052193, -0.048343759030103683, -0.04483094811439514, -0.0413181409239769, -0.037805333733558655, -0.03429252654314041, -0.03077971562743187, -0.027266908437013626, -0.023754099383950233, -0.02024129033088684, -0.016728483140468597, -0.013215674087405205, -0.009702865965664387, -0.006190057843923569, -0.002677248790860176, 0.0008355583995580673, 0.00434836745262146, 0.007861175574362278, 0.011373983696103096, 0.014886792749166489, 0.018399599939584732, 0.021912408992648125, 0.025425218045711517, 0.02893802523612976, 0.032450832426548004, 0.03596363961696625, 0.03947645053267479, 0.04298925772309303, 0.046502064913511276, 0.05001487582921982, 0.05352768301963806, 0.057040490210056305, 0.06055330112576485, 0.06406611204147339, 0.06757891923189163, 0.07109172642230988, 0.07460453361272812, 0.07811734080314636, 0.0816301554441452, 0.08514295518398285, 0.08865576982498169, 0.09216857701539993, 0.09568138420581818, 0.09919419884681702, 0.10270700603723526, 0.1062198132276535, 0.10973262041807175, 0.11324542760848999, 0.11675823479890823]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 6.0, 14.0, 33.0, 34.0, 62.0, 90.0, 173.0, 263.0, 503.0, 921.0, 1678.0, 3288.0, 6861.0, 15780.0, 43583.0, 182828.0, 581340.0, 146608.0, 37596.0, 14173.0, 6148.0, 3034.0, 1577.0, 838.0, 469.0, 277.0, 159.0, 102.0, 45.0, 38.0, 20.0, 12.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10638427734375, -0.10338211059570312, -0.10037994384765625, -0.09737777709960938, -0.0943756103515625, -0.09137344360351562, -0.08837127685546875, -0.08536911010742188, -0.082366943359375, -0.07936477661132812, -0.07636260986328125, -0.07336044311523438, -0.0703582763671875, -0.06735610961914062, -0.06435394287109375, -0.061351776123046875, -0.058349609375, -0.055347442626953125, -0.05234527587890625, -0.049343109130859375, -0.0463409423828125, -0.043338775634765625, -0.04033660888671875, -0.037334442138671875, -0.034332275390625, -0.031330108642578125, -0.02832794189453125, -0.025325775146484375, -0.0223236083984375, -0.019321441650390625, -0.01631927490234375, -0.013317108154296875, -0.01031494140625, -0.007312774658203125, -0.00431060791015625, -0.001308441162109375, 0.0016937255859375, 0.004695892333984375, 0.00769805908203125, 0.010700225830078125, 0.013702392578125, 0.016704559326171875, 0.01970672607421875, 0.022708892822265625, 0.0257110595703125, 0.028713226318359375, 0.03171539306640625, 0.034717559814453125, 0.0377197265625, 0.040721893310546875, 0.04372406005859375, 0.046726226806640625, 0.0497283935546875, 0.052730560302734375, 0.05573272705078125, 0.058734893798828125, 0.061737060546875, 0.06473922729492188, 0.06774139404296875, 0.07074356079101562, 0.0737457275390625, 0.07674789428710938, 0.07975006103515625, 0.08275222778320312, 0.08575439453125]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 5.0, 8.0, 3.0, 12.0, 12.0, 8.0, 16.0, 21.0, 26.0, 36.0, 37.0, 49.0, 48.0, 58.0, 53.0, 53.0, 61.0, 54.0, 41.0, 47.0, 49.0, 56.0, 48.0, 44.0, 32.0, 27.0, 21.0, 12.0, 11.0, 12.0, 10.0, 9.0, 4.0, 6.0, 3.0, 1.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.243408203125, -0.23533248901367188, -0.22725677490234375, -0.21918106079101562, -0.2111053466796875, -0.20302963256835938, -0.19495391845703125, -0.18687820434570312, -0.178802490234375, -0.17072677612304688, -0.16265106201171875, -0.15457534790039062, -0.1464996337890625, -0.13842391967773438, -0.13034820556640625, -0.12227249145507812, -0.11419677734375, -0.10612106323242188, -0.09804534912109375, -0.08996963500976562, -0.0818939208984375, -0.07381820678710938, -0.06574249267578125, -0.057666778564453125, -0.049591064453125, -0.041515350341796875, -0.03343963623046875, -0.025363922119140625, -0.0172882080078125, -0.009212493896484375, -0.00113677978515625, 0.006938934326171875, 0.0150146484375, 0.023090362548828125, 0.03116607666015625, 0.039241790771484375, 0.0473175048828125, 0.055393218994140625, 0.06346893310546875, 0.07154464721679688, 0.079620361328125, 0.08769607543945312, 0.09577178955078125, 0.10384750366210938, 0.1119232177734375, 0.11999893188476562, 0.12807464599609375, 0.13615036010742188, 0.14422607421875, 0.15230178833007812, 0.16037750244140625, 0.16845321655273438, 0.1765289306640625, 0.18460464477539062, 0.19268035888671875, 0.20075607299804688, 0.208831787109375, 0.21690750122070312, 0.22498321533203125, 0.23305892944335938, 0.2411346435546875, 0.24921035766601562, 0.25728607177734375, 0.2653617858886719, 0.2734375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 4.0, 3.0, 3.0, 9.0, 17.0, 27.0, 32.0, 54.0, 101.0, 182.0, 436.0, 1186.0, 5538.0, 141672.0, 879515.0, 16557.0, 2020.0, 611.0, 266.0, 129.0, 61.0, 44.0, 25.0, 13.0, 13.0, 4.0, 6.0, 5.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.33544921875, -0.3264350891113281, -0.31742095947265625, -0.3084068298339844, -0.2993927001953125, -0.2903785705566406, -0.28136444091796875, -0.2723503112792969, -0.263336181640625, -0.2543220520019531, -0.24530792236328125, -0.23629379272460938, -0.2272796630859375, -0.21826553344726562, -0.20925140380859375, -0.20023727416992188, -0.19122314453125, -0.18220901489257812, -0.17319488525390625, -0.16418075561523438, -0.1551666259765625, -0.14615249633789062, -0.13713836669921875, -0.12812423706054688, -0.119110107421875, -0.11009597778320312, -0.10108184814453125, -0.09206771850585938, -0.0830535888671875, -0.07403945922851562, -0.06502532958984375, -0.056011199951171875, -0.0469970703125, -0.037982940673828125, -0.02896881103515625, -0.019954681396484375, -0.0109405517578125, -0.001926422119140625, 0.00708770751953125, 0.016101837158203125, 0.025115966796875, 0.034130096435546875, 0.04314422607421875, 0.052158355712890625, 0.0611724853515625, 0.07018661499023438, 0.07920074462890625, 0.08821487426757812, 0.09722900390625, 0.10624313354492188, 0.11525726318359375, 0.12427139282226562, 0.1332855224609375, 0.14229965209960938, 0.15131378173828125, 0.16032791137695312, 0.169342041015625, 0.17835617065429688, 0.18737030029296875, 0.19638442993164062, 0.2053985595703125, 0.21441268920898438, 0.22342681884765625, 0.23244094848632812, 0.241455078125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 7.0, 3.0, 7.0, 6.0, 9.0, 11.0, 13.0, 24.0, 12.0, 16.0, 21.0, 25.0, 28.0, 26.0, 39.0, 42.0, 49.0, 34.0, 35.0, 43.0, 44.0, 55.0, 37.0, 37.0, 32.0, 45.0, 45.0, 33.0, 37.0, 25.0, 22.0, 16.0, 20.0, 29.0, 15.0, 17.0, 8.0, 8.0, 9.0, 7.0, 3.0, 2.0, 3.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.2427978515625, -0.2352924346923828, -0.22778701782226562, -0.22028160095214844, -0.21277618408203125, -0.20527076721191406, -0.19776535034179688, -0.1902599334716797, -0.1827545166015625, -0.1752490997314453, -0.16774368286132812, -0.16023826599121094, -0.15273284912109375, -0.14522743225097656, -0.13772201538085938, -0.1302165985107422, -0.122711181640625, -0.11520576477050781, -0.10770034790039062, -0.10019493103027344, -0.09268951416015625, -0.08518409729003906, -0.07767868041992188, -0.07017326354980469, -0.0626678466796875, -0.05516242980957031, -0.047657012939453125, -0.04015159606933594, -0.03264617919921875, -0.025140762329101562, -0.017635345458984375, -0.010129928588867188, -0.00262451171875, 0.0048809051513671875, 0.012386322021484375, 0.019891738891601562, 0.02739715576171875, 0.03490257263183594, 0.042407989501953125, 0.04991340637207031, 0.0574188232421875, 0.06492424011230469, 0.07242965698242188, 0.07993507385253906, 0.08744049072265625, 0.09494590759277344, 0.10245132446289062, 0.10995674133300781, 0.117462158203125, 0.12496757507324219, 0.13247299194335938, 0.13997840881347656, 0.14748382568359375, 0.15498924255371094, 0.16249465942382812, 0.1700000762939453, 0.1775054931640625, 0.1850109100341797, 0.19251632690429688, 0.20002174377441406, 0.20752716064453125, 0.21503257751464844, 0.22253799438476562, 0.2300434112548828, 0.237548828125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 6.0, 12.0, 10.0, 18.0, 22.0, 55.0, 130.0, 304.0, 896.0, 4335.0, 84996.0, 943776.0, 11587.0, 1633.0, 444.0, 146.0, 78.0, 39.0, 21.0, 17.0, 12.0, 2.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.169189453125, -0.16438674926757812, -0.15958404541015625, -0.15478134155273438, -0.1499786376953125, -0.14517593383789062, -0.14037322998046875, -0.13557052612304688, -0.130767822265625, -0.12596511840820312, -0.12116241455078125, -0.11635971069335938, -0.1115570068359375, -0.10675430297851562, -0.10195159912109375, -0.09714889526367188, -0.09234619140625, -0.08754348754882812, -0.08274078369140625, -0.07793807983398438, -0.0731353759765625, -0.06833267211914062, -0.06352996826171875, -0.058727264404296875, -0.053924560546875, -0.049121856689453125, -0.04431915283203125, -0.039516448974609375, -0.0347137451171875, -0.029911041259765625, -0.02510833740234375, -0.020305633544921875, -0.0155029296875, -0.010700225830078125, -0.00589752197265625, -0.001094818115234375, 0.0037078857421875, 0.008510589599609375, 0.01331329345703125, 0.018115997314453125, 0.022918701171875, 0.027721405029296875, 0.03252410888671875, 0.037326812744140625, 0.0421295166015625, 0.046932220458984375, 0.05173492431640625, 0.056537628173828125, 0.06134033203125, 0.06614303588867188, 0.07094573974609375, 0.07574844360351562, 0.0805511474609375, 0.08535385131835938, 0.09015655517578125, 0.09495925903320312, 0.099761962890625, 0.10456466674804688, 0.10936737060546875, 0.11417007446289062, 0.1189727783203125, 0.12377548217773438, 0.12857818603515625, 0.13338088989257812, 0.13818359375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 4.0, 9.0, 15.0, 11.0, 22.0, 36.0, 79.0, 143.0, 230.0, 157.0, 125.0, 65.0, 38.0, 21.0, 14.0, 8.0, 5.0, 3.0, 3.0, 2.0, 5.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.6629695892333984e-05, -1.624133437871933e-05, -1.5852972865104675e-05, -1.546461135149002e-05, -1.5076249837875366e-05, -1.4687888324260712e-05, -1.4299526810646057e-05, -1.3911165297031403e-05, -1.3522803783416748e-05, -1.3134442269802094e-05, -1.2746080756187439e-05, -1.2357719242572784e-05, -1.196935772895813e-05, -1.1580996215343475e-05, -1.119263470172882e-05, -1.0804273188114166e-05, -1.0415911674499512e-05, -1.0027550160884857e-05, -9.639188647270203e-06, -9.250827133655548e-06, -8.862465620040894e-06, -8.474104106426239e-06, -8.085742592811584e-06, -7.69738107919693e-06, -7.309019565582275e-06, -6.920658051967621e-06, -6.532296538352966e-06, -6.143935024738312e-06, -5.755573511123657e-06, -5.367211997509003e-06, -4.978850483894348e-06, -4.590488970279694e-06, -4.202127456665039e-06, -3.8137659430503845e-06, -3.42540442943573e-06, -3.0370429158210754e-06, -2.648681402206421e-06, -2.2603198885917664e-06, -1.8719583749771118e-06, -1.4835968613624573e-06, -1.0952353477478027e-06, -7.068738341331482e-07, -3.1851232051849365e-07, 6.984919309616089e-08, 4.5821070671081543e-07, 8.4657222032547e-07, 1.2349337339401245e-06, 1.623295247554779e-06, 2.0116567611694336e-06, 2.400018274784088e-06, 2.7883797883987427e-06, 3.1767413020133972e-06, 3.5651028156280518e-06, 3.953464329242706e-06, 4.341825842857361e-06, 4.730187356472015e-06, 5.11854887008667e-06, 5.5069103837013245e-06, 5.895271897315979e-06, 6.2836334109306335e-06, 6.671994924545288e-06, 7.060356438159943e-06, 7.448717951774597e-06, 7.837079465389252e-06, 8.225440979003906e-06]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 4.0, 6.0, 15.0, 27.0, 39.0, 55.0, 117.0, 256.0, 831.0, 3757.0, 117340.0, 916322.0, 7898.0, 1169.0, 386.0, 134.0, 85.0, 40.0, 20.0, 17.0, 6.0, 6.0, 7.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.157470703125, -0.15187835693359375, -0.1462860107421875, -0.14069366455078125, -0.135101318359375, -0.12950897216796875, -0.1239166259765625, -0.11832427978515625, -0.11273193359375, -0.10713958740234375, -0.1015472412109375, -0.09595489501953125, -0.090362548828125, -0.08477020263671875, -0.0791778564453125, -0.07358551025390625, -0.0679931640625, -0.06240081787109375, -0.0568084716796875, -0.05121612548828125, -0.045623779296875, -0.04003143310546875, -0.0344390869140625, -0.02884674072265625, -0.02325439453125, -0.01766204833984375, -0.0120697021484375, -0.00647735595703125, -0.000885009765625, 0.00470733642578125, 0.0102996826171875, 0.01589202880859375, 0.021484375, 0.02707672119140625, 0.0326690673828125, 0.03826141357421875, 0.043853759765625, 0.04944610595703125, 0.0550384521484375, 0.06063079833984375, 0.06622314453125, 0.07181549072265625, 0.0774078369140625, 0.08300018310546875, 0.088592529296875, 0.09418487548828125, 0.0997772216796875, 0.10536956787109375, 0.1109619140625, 0.11655426025390625, 0.1221466064453125, 0.12773895263671875, 0.133331298828125, 0.13892364501953125, 0.1445159912109375, 0.15010833740234375, 0.15570068359375, 0.16129302978515625, 0.1668853759765625, 0.17247772216796875, 0.178070068359375, 0.18366241455078125, 0.1892547607421875, 0.19484710693359375, 0.200439453125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 5.0, 5.0, 9.0, 7.0, 8.0, 26.0, 23.0, 66.0, 111.0, 235.0, 233.0, 120.0, 61.0, 29.0, 20.0, 18.0, 14.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049224853515625, -0.04785728454589844, -0.046489715576171875, -0.04512214660644531, -0.04375457763671875, -0.04238700866699219, -0.041019439697265625, -0.03965187072753906, -0.0382843017578125, -0.03691673278808594, -0.035549163818359375, -0.03418159484863281, -0.03281402587890625, -0.03144645690917969, -0.030078887939453125, -0.028711318969726562, -0.02734375, -0.025976181030273438, -0.024608612060546875, -0.023241043090820312, -0.02187347412109375, -0.020505905151367188, -0.019138336181640625, -0.017770767211914062, -0.0164031982421875, -0.015035629272460938, -0.013668060302734375, -0.012300491333007812, -0.01093292236328125, -0.009565353393554688, -0.008197784423828125, -0.0068302154541015625, -0.005462646484375, -0.0040950775146484375, -0.002727508544921875, -0.0013599395751953125, 7.62939453125e-06, 0.0013751983642578125, 0.002742767333984375, 0.0041103363037109375, 0.0054779052734375, 0.0068454742431640625, 0.008213043212890625, 0.009580612182617188, 0.01094818115234375, 0.012315750122070312, 0.013683319091796875, 0.015050888061523438, 0.01641845703125, 0.017786026000976562, 0.019153594970703125, 0.020521163940429688, 0.02188873291015625, 0.023256301879882812, 0.024623870849609375, 0.025991439819335938, 0.0273590087890625, 0.028726577758789062, 0.030094146728515625, 0.03146171569824219, 0.03282928466796875, 0.03419685363769531, 0.035564422607421875, 0.03693199157714844, 0.038299560546875]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 13.0, 41.0, 169.0, 461.0, 236.0, 61.0, 12.0, 11.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.575226366519928, -0.5330412983894348, -0.49085626006126404, -0.4486711919307709, -0.4064861536026001, -0.36430108547210693, -0.32211601734161377, -0.279930979013443, -0.23774591088294983, -0.19556085765361786, -0.1533758044242859, -0.11119073629379272, -0.06900568306446075, -0.026820629835128784, 0.01536443829536438, 0.057549476623535156, 0.09973454475402832, 0.1419195979833603, 0.18410465121269226, 0.22628971934318542, 0.2684747576713562, 0.31065982580184937, 0.35284489393234253, 0.3950299322605133, 0.43721500039100647, 0.47940006852149963, 0.5215851068496704, 0.5637701749801636, 0.6059552431106567, 0.6481403112411499, 0.6903253793716431, 0.7325103878974915, 0.7746955156326294, 0.8168805837631226, 0.8590656518936157, 0.9012507200241089, 0.9434357285499573, 0.9856207966804504, 1.0278058052062988, 1.069990873336792, 1.1121759414672852, 1.1543610095977783, 1.1965460777282715, 1.2387311458587646, 1.2809162139892578, 1.323101282119751, 1.3652863502502441, 1.4074712991714478, 1.4496564865112305, 1.4918415546417236, 1.5340266227722168, 1.57621169090271, 1.6183967590332031, 1.6605818271636963, 1.7027668952941895, 1.744951844215393, 1.7871369123458862, 1.8293219804763794, 1.8715070486068726, 1.9136921167373657, 1.9558771848678589, 1.9980621337890625, 2.0402472019195557, 2.082432270050049, 2.124617338180542]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 6.0, 12.0, 15.0, 17.0, 26.0, 19.0, 37.0, 27.0, 29.0, 52.0, 34.0, 35.0, 44.0, 48.0, 47.0, 60.0, 60.0, 45.0, 52.0, 48.0, 40.0, 45.0, 36.0, 35.0, 25.0, 16.0, 19.0, 14.0, 13.0, 12.0, 11.0, 4.0, 7.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.6271568536758423, -0.6113367676734924, -0.5955166816711426, -0.5796966552734375, -0.5638765692710876, -0.5480564832687378, -0.5322363972663879, -0.5164163112640381, -0.500596284866333, -0.48477619886398315, -0.4689561426639557, -0.45313605666160583, -0.43731600046157837, -0.4214959144592285, -0.40567582845687866, -0.3898557424545288, -0.37403565645217896, -0.3582155704498291, -0.34239551424980164, -0.3265754282474518, -0.3107553720474243, -0.29493528604507446, -0.2791152000427246, -0.26329511404037476, -0.2474750578403473, -0.23165498673915863, -0.21583491563796997, -0.20001482963562012, -0.18419475853443146, -0.1683746874332428, -0.15255460143089294, -0.13673453032970428, -0.12091448903083801, -0.10509441792964935, -0.0892743393778801, -0.07345426082611084, -0.05763418972492218, -0.04181411862373352, -0.025994040071964264, -0.010173961520195007, 0.005646109580993652, 0.02146618440747261, 0.03728625923395157, 0.05310633406043053, 0.06892640888690948, 0.08474647998809814, 0.1005665585398674, 0.11638663709163666, 0.13220670819282532, 0.14802677929401398, 0.16384685039520264, 0.1796669363975525, 0.19548700749874115, 0.2113070785999298, 0.22712716460227966, 0.24294723570346832, 0.258767306804657, 0.27458739280700684, 0.2904074490070343, 0.30622753500938416, 0.3220475912094116, 0.3378676772117615, 0.35368776321411133, 0.3695078492164612, 0.38532790541648865]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 5.0, 2.0, 3.0, 2.0, 3.0, 4.0, 11.0, 12.0, 14.0, 19.0, 36.0, 37.0, 68.0, 112.0, 185.0, 242.0, 491.0, 889.0, 1722.0, 4311.0, 14165.0, 117929.0, 2952185.0, 1039865.0, 47029.0, 8593.0, 3285.0, 1371.0, 749.0, 367.0, 219.0, 117.0, 74.0, 45.0, 42.0, 27.0, 19.0, 13.0, 8.0, 11.0, 3.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.291259765625, -0.28238677978515625, -0.2735137939453125, -0.26464080810546875, -0.255767822265625, -0.24689483642578125, -0.2380218505859375, -0.22914886474609375, -0.22027587890625, -0.21140289306640625, -0.2025299072265625, -0.19365692138671875, -0.184783935546875, -0.17591094970703125, -0.1670379638671875, -0.15816497802734375, -0.1492919921875, -0.14041900634765625, -0.1315460205078125, -0.12267303466796875, -0.113800048828125, -0.10492706298828125, -0.0960540771484375, -0.08718109130859375, -0.07830810546875, -0.06943511962890625, -0.0605621337890625, -0.05168914794921875, -0.042816162109375, -0.03394317626953125, -0.0250701904296875, -0.01619720458984375, -0.00732421875, 0.00154876708984375, 0.0104217529296875, 0.01929473876953125, 0.028167724609375, 0.03704071044921875, 0.0459136962890625, 0.05478668212890625, 0.06365966796875, 0.07253265380859375, 0.0814056396484375, 0.09027862548828125, 0.099151611328125, 0.10802459716796875, 0.1168975830078125, 0.12577056884765625, 0.1346435546875, 0.14351654052734375, 0.1523895263671875, 0.16126251220703125, 0.170135498046875, 0.17900848388671875, 0.1878814697265625, 0.19675445556640625, 0.20562744140625, 0.21450042724609375, 0.2233734130859375, 0.23224639892578125, 0.241119384765625, 0.24999237060546875, 0.2588653564453125, 0.26773834228515625, 0.276611328125]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 9.0, 4.0, 8.0, 20.0, 18.0, 28.0, 22.0, 25.0, 25.0, 40.0, 38.0, 64.0, 54.0, 43.0, 54.0, 51.0, 70.0, 45.0, 57.0, 47.0, 35.0, 37.0, 35.0, 30.0, 26.0, 16.0, 18.0, 10.0, 14.0, 9.0, 7.0, 11.0, 6.0, 6.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11334228515625, -0.10926532745361328, -0.10518836975097656, -0.10111141204833984, -0.09703445434570312, -0.0929574966430664, -0.08888053894042969, -0.08480358123779297, -0.08072662353515625, -0.07664966583251953, -0.07257270812988281, -0.0684957504272461, -0.06441879272460938, -0.060341835021972656, -0.05626487731933594, -0.05218791961669922, -0.0481109619140625, -0.04403400421142578, -0.03995704650878906, -0.035880088806152344, -0.031803131103515625, -0.027726173400878906, -0.023649215698242188, -0.01957225799560547, -0.01549530029296875, -0.011418342590332031, -0.0073413848876953125, -0.0032644271850585938, 0.000812530517578125, 0.004889488220214844, 0.008966445922851562, 0.013043403625488281, 0.017120361328125, 0.02119731903076172, 0.025274276733398438, 0.029351234436035156, 0.033428192138671875, 0.037505149841308594, 0.04158210754394531, 0.04565906524658203, 0.04973602294921875, 0.05381298065185547, 0.05788993835449219, 0.061966896057128906, 0.06604385375976562, 0.07012081146240234, 0.07419776916503906, 0.07827472686767578, 0.0823516845703125, 0.08642864227294922, 0.09050559997558594, 0.09458255767822266, 0.09865951538085938, 0.1027364730834961, 0.10681343078613281, 0.11089038848876953, 0.11496734619140625, 0.11904430389404297, 0.12312126159667969, 0.1271982192993164, 0.13127517700195312, 0.13535213470458984, 0.13942909240722656, 0.14350605010986328, 0.1475830078125]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 5.0, 4.0, 3.0, 9.0, 8.0, 13.0, 13.0, 15.0, 27.0, 50.0, 55.0, 104.0, 183.0, 321.0, 754.0, 2102.0, 8211.0, 63622.0, 3762991.0, 330422.0, 19270.0, 3884.0, 1168.0, 470.0, 229.0, 118.0, 81.0, 42.0, 25.0, 20.0, 17.0, 12.0, 7.0, 13.0, 12.0, 3.0, 1.0, 2.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.32666015625, -0.31603240966796875, -0.3054046630859375, -0.29477691650390625, -0.284149169921875, -0.27352142333984375, -0.2628936767578125, -0.25226593017578125, -0.24163818359375, -0.23101043701171875, -0.2203826904296875, -0.20975494384765625, -0.199127197265625, -0.18849945068359375, -0.1778717041015625, -0.16724395751953125, -0.1566162109375, -0.14598846435546875, -0.1353607177734375, -0.12473297119140625, -0.114105224609375, -0.10347747802734375, -0.0928497314453125, -0.08222198486328125, -0.07159423828125, -0.06096649169921875, -0.0503387451171875, -0.03971099853515625, -0.029083251953125, -0.01845550537109375, -0.0078277587890625, 0.00279998779296875, 0.013427734375, 0.02405548095703125, 0.0346832275390625, 0.04531097412109375, 0.055938720703125, 0.06656646728515625, 0.0771942138671875, 0.08782196044921875, 0.09844970703125, 0.10907745361328125, 0.1197052001953125, 0.13033294677734375, 0.140960693359375, 0.15158843994140625, 0.1622161865234375, 0.17284393310546875, 0.1834716796875, 0.19409942626953125, 0.2047271728515625, 0.21535491943359375, 0.225982666015625, 0.23661041259765625, 0.2472381591796875, 0.25786590576171875, 0.26849365234375, 0.27912139892578125, 0.2897491455078125, 0.30037689208984375, 0.311004638671875, 0.32163238525390625, 0.3322601318359375, 0.34288787841796875, 0.353515625]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 5.0, 5.0, 9.0, 13.0, 10.0, 20.0, 28.0, 44.0, 82.0, 83.0, 168.0, 387.0, 643.0, 957.0, 685.0, 380.0, 191.0, 118.0, 72.0, 41.0, 27.0, 25.0, 23.0, 17.0, 10.0, 5.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055877685546875, -0.0538487434387207, -0.051819801330566406, -0.04979085922241211, -0.04776191711425781, -0.045732975006103516, -0.04370403289794922, -0.04167509078979492, -0.039646148681640625, -0.03761720657348633, -0.03558826446533203, -0.033559322357177734, -0.03153038024902344, -0.02950143814086914, -0.027472496032714844, -0.025443553924560547, -0.02341461181640625, -0.021385669708251953, -0.019356727600097656, -0.01732778549194336, -0.015298843383789062, -0.013269901275634766, -0.011240959167480469, -0.009212017059326172, -0.007183074951171875, -0.005154132843017578, -0.0031251907348632812, -0.0010962486267089844, 0.0009326934814453125, 0.0029616355895996094, 0.004990577697753906, 0.007019519805908203, 0.0090484619140625, 0.011077404022216797, 0.013106346130371094, 0.01513528823852539, 0.017164230346679688, 0.019193172454833984, 0.02122211456298828, 0.023251056671142578, 0.025279998779296875, 0.027308940887451172, 0.02933788299560547, 0.031366825103759766, 0.03339576721191406, 0.03542470932006836, 0.037453651428222656, 0.03948259353637695, 0.04151153564453125, 0.04354047775268555, 0.045569419860839844, 0.04759836196899414, 0.04962730407714844, 0.051656246185302734, 0.05368518829345703, 0.05571413040161133, 0.057743072509765625, 0.05977201461791992, 0.06180095672607422, 0.06382989883422852, 0.06585884094238281, 0.06788778305053711, 0.0699167251586914, 0.0719456672668457, 0.073974609375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 8.0, 3.0, 6.0, 14.0, 14.0, 17.0, 55.0, 67.0, 97.0, 152.0, 144.0, 145.0, 92.0, 57.0, 44.0, 32.0, 24.0, 10.0, 2.0, 5.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.32026854157447815, -0.3109922707080841, -0.3017159700393677, -0.29243969917297363, -0.2831634283065796, -0.27388715744018555, -0.2646108567714691, -0.2553345859050751, -0.24605830013751984, -0.2367820143699646, -0.22750574350357056, -0.21822945773601532, -0.20895317196846008, -0.19967690110206604, -0.1904006153345108, -0.18112432956695557, -0.17184805870056152, -0.1625717729330063, -0.15329550206661224, -0.144019216299057, -0.13474294543266296, -0.12546665966510773, -0.11619037389755249, -0.10691409558057785, -0.09763781726360321, -0.08836153894662857, -0.07908526062965393, -0.0698089748620987, -0.060532696545124054, -0.051256418228149414, -0.041980136185884476, -0.03270385414361954, -0.023427575826644897, -0.014151295647025108, -0.004875015467405319, 0.00440126471221447, 0.013677544891834259, 0.0229538232088089, 0.03223010525107384, 0.041506387293338776, 0.050782665610313416, 0.060058943927288055, 0.0693352222442627, 0.07861150801181793, 0.08788778632879257, 0.09716406464576721, 0.10644035041332245, 0.11571662873029709, 0.12499290704727173, 0.13426919281482697, 0.143545463681221, 0.15282174944877625, 0.1620980203151703, 0.17137430608272552, 0.18065059185028076, 0.1899268627166748, 0.19920314848423004, 0.20847943425178528, 0.21775570511817932, 0.22703199088573456, 0.2363082766532898, 0.24558454751968384, 0.2548608183860779, 0.2641371190547943, 0.27341338992118835]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 4.0, 11.0, 16.0, 17.0, 16.0, 21.0, 23.0, 22.0, 16.0, 36.0, 40.0, 32.0, 33.0, 46.0, 45.0, 49.0, 44.0, 57.0, 51.0, 42.0, 47.0, 49.0, 33.0, 43.0, 37.0, 31.0, 30.0, 18.0, 12.0, 16.0, 13.0, 15.0, 5.0, 6.0, 6.0, 2.0, 3.0, 4.0, 4.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11806507408618927, -0.11389222741127014, -0.10971938073635101, -0.10554653406143188, -0.10137368738651276, -0.09720084071159363, -0.0930280014872551, -0.08885515481233597, -0.08468230813741684, -0.08050946146249771, -0.07633661478757858, -0.07216376811265945, -0.06799092888832092, -0.0638180822134018, -0.059645235538482666, -0.05547238886356354, -0.05129954218864441, -0.04712669551372528, -0.04295384883880615, -0.03878100588917732, -0.034608159214258194, -0.030435312539339066, -0.026262467727065086, -0.022089622914791107, -0.01791677623987198, -0.013743930496275425, -0.009571084752678871, -0.005398239009082317, -0.0012253932654857635, 0.002947453409433365, 0.007120298221707344, 0.011293143033981323, 0.015466004610061646, 0.019638851284980774, 0.023811696097254753, 0.027984540909528732, 0.03215738758444786, 0.03633023425936699, 0.04050307720899582, 0.04467592388391495, 0.048848770558834076, 0.053021617233753204, 0.05719446390867233, 0.06136730685830116, 0.06554014980792999, 0.06971299648284912, 0.07388584315776825, 0.07805868983268738, 0.0822315365076065, 0.08640438318252563, 0.09057722985744476, 0.09475007653236389, 0.09892292320728302, 0.10309576988220215, 0.10726860910654068, 0.11144145578145981, 0.11561430245637894, 0.11978714913129807, 0.1239599958062172, 0.12813283503055573, 0.13230568170547485, 0.13647852838039398, 0.1406513750553131, 0.14482422173023224, 0.14899706840515137]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 2.0, 3.0, 14.0, 7.0, 15.0, 25.0, 69.0, 87.0, 181.0, 421.0, 770.0, 1804.0, 4467.0, 12421.0, 39922.0, 156743.0, 482547.0, 258288.0, 61947.0, 18145.0, 6223.0, 2438.0, 1020.0, 474.0, 255.0, 102.0, 68.0, 37.0, 26.0, 17.0, 11.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.037994384765625, -0.03703665733337402, -0.03607892990112305, -0.03512120246887207, -0.034163475036621094, -0.03320574760437012, -0.03224802017211914, -0.031290292739868164, -0.030332565307617188, -0.02937483787536621, -0.028417110443115234, -0.027459383010864258, -0.02650165557861328, -0.025543928146362305, -0.024586200714111328, -0.02362847328186035, -0.022670745849609375, -0.0217130184173584, -0.020755290985107422, -0.019797563552856445, -0.01883983612060547, -0.017882108688354492, -0.016924381256103516, -0.01596665382385254, -0.015008926391601562, -0.014051198959350586, -0.01309347152709961, -0.012135744094848633, -0.011178016662597656, -0.01022028923034668, -0.009262561798095703, -0.008304834365844727, -0.00734710693359375, -0.0063893795013427734, -0.005431652069091797, -0.00447392463684082, -0.0035161972045898438, -0.002558469772338867, -0.0016007423400878906, -0.0006430149078369141, 0.0003147125244140625, 0.001272439956665039, 0.0022301673889160156, 0.003187894821166992, 0.004145622253417969, 0.005103349685668945, 0.006061077117919922, 0.0070188045501708984, 0.007976531982421875, 0.008934259414672852, 0.009891986846923828, 0.010849714279174805, 0.011807441711425781, 0.012765169143676758, 0.013722896575927734, 0.014680624008178711, 0.015638351440429688, 0.016596078872680664, 0.01755380630493164, 0.018511533737182617, 0.019469261169433594, 0.02042698860168457, 0.021384716033935547, 0.022342443466186523, 0.0233001708984375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 8.0, 9.0, 19.0, 23.0, 19.0, 23.0, 23.0, 26.0, 27.0, 35.0, 57.0, 45.0, 50.0, 44.0, 62.0, 57.0, 59.0, 47.0, 58.0, 42.0, 53.0, 38.0, 35.0, 25.0, 22.0, 20.0, 7.0, 8.0, 9.0, 10.0, 13.0, 6.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.095458984375, -0.0921010971069336, -0.08874320983886719, -0.08538532257080078, -0.08202743530273438, -0.07866954803466797, -0.07531166076660156, -0.07195377349853516, -0.06859588623046875, -0.06523799896240234, -0.06188011169433594, -0.05852222442626953, -0.055164337158203125, -0.05180644989013672, -0.04844856262207031, -0.045090675354003906, -0.0417327880859375, -0.038374900817871094, -0.03501701354980469, -0.03165912628173828, -0.028301239013671875, -0.02494335174560547, -0.021585464477539062, -0.018227577209472656, -0.01486968994140625, -0.011511802673339844, -0.008153915405273438, -0.004796028137207031, -0.001438140869140625, 0.0019197463989257812, 0.0052776336669921875, 0.008635520935058594, 0.011993408203125, 0.015351295471191406, 0.018709182739257812, 0.02206707000732422, 0.025424957275390625, 0.02878284454345703, 0.03214073181152344, 0.035498619079589844, 0.03885650634765625, 0.042214393615722656, 0.04557228088378906, 0.04893016815185547, 0.052288055419921875, 0.05564594268798828, 0.05900382995605469, 0.062361717224121094, 0.0657196044921875, 0.0690774917602539, 0.07243537902832031, 0.07579326629638672, 0.07915115356445312, 0.08250904083251953, 0.08586692810058594, 0.08922481536865234, 0.09258270263671875, 0.09594058990478516, 0.09929847717285156, 0.10265636444091797, 0.10601425170898438, 0.10937213897705078, 0.11273002624511719, 0.1160879135131836, 0.11944580078125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 7.0, 6.0, 5.0, 14.0, 14.0, 21.0, 38.0, 77.0, 111.0, 177.0, 342.0, 603.0, 1162.0, 2607.0, 6800.0, 20911.0, 84265.0, 379515.0, 417585.0, 97268.0, 23864.0, 7454.0, 2854.0, 1309.0, 680.0, 346.0, 203.0, 108.0, 75.0, 35.0, 25.0, 16.0, 13.0, 9.0, 8.0, 3.0, 6.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.032928466796875, -0.03196120262145996, -0.030993938446044922, -0.030026674270629883, -0.029059410095214844, -0.028092145919799805, -0.027124881744384766, -0.026157617568969727, -0.025190353393554688, -0.02422308921813965, -0.02325582504272461, -0.02228856086730957, -0.02132129669189453, -0.020354032516479492, -0.019386768341064453, -0.018419504165649414, -0.017452239990234375, -0.016484975814819336, -0.015517711639404297, -0.014550447463989258, -0.013583183288574219, -0.01261591911315918, -0.01164865493774414, -0.010681390762329102, -0.009714126586914062, -0.008746862411499023, -0.007779598236083984, -0.006812334060668945, -0.005845069885253906, -0.004877805709838867, -0.003910541534423828, -0.002943277359008789, -0.00197601318359375, -0.001008749008178711, -4.1484832763671875e-05, 0.0009257793426513672, 0.0018930435180664062, 0.0028603076934814453, 0.0038275718688964844, 0.0047948360443115234, 0.0057621002197265625, 0.0067293643951416016, 0.007696628570556641, 0.00866389274597168, 0.009631156921386719, 0.010598421096801758, 0.011565685272216797, 0.012532949447631836, 0.013500213623046875, 0.014467477798461914, 0.015434741973876953, 0.016402006149291992, 0.01736927032470703, 0.01833653450012207, 0.01930379867553711, 0.02027106285095215, 0.021238327026367188, 0.022205591201782227, 0.023172855377197266, 0.024140119552612305, 0.025107383728027344, 0.026074647903442383, 0.027041912078857422, 0.02800917625427246, 0.0289764404296875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 5.0, 3.0, 6.0, 6.0, 15.0, 13.0, 14.0, 16.0, 13.0, 23.0, 19.0, 26.0, 19.0, 21.0, 26.0, 38.0, 32.0, 37.0, 39.0, 41.0, 37.0, 43.0, 37.0, 44.0, 36.0, 40.0, 36.0, 50.0, 31.0, 17.0, 34.0, 30.0, 24.0, 26.0, 16.0, 15.0, 9.0, 9.0, 16.0, 9.0, 7.0, 5.0, 7.0, 6.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.1640625, -0.15893936157226562, -0.15381622314453125, -0.14869308471679688, -0.1435699462890625, -0.13844680786132812, -0.13332366943359375, -0.12820053100585938, -0.123077392578125, -0.11795425415039062, -0.11283111572265625, -0.10770797729492188, -0.1025848388671875, -0.09746170043945312, -0.09233856201171875, -0.08721542358398438, -0.08209228515625, -0.07696914672851562, -0.07184600830078125, -0.06672286987304688, -0.0615997314453125, -0.056476593017578125, -0.05135345458984375, -0.046230316162109375, -0.041107177734375, -0.035984039306640625, -0.03086090087890625, -0.025737762451171875, -0.0206146240234375, -0.015491485595703125, -0.01036834716796875, -0.005245208740234375, -0.0001220703125, 0.005001068115234375, 0.01012420654296875, 0.015247344970703125, 0.0203704833984375, 0.025493621826171875, 0.03061676025390625, 0.035739898681640625, 0.040863037109375, 0.045986175537109375, 0.05110931396484375, 0.056232452392578125, 0.0613555908203125, 0.06647872924804688, 0.07160186767578125, 0.07672500610351562, 0.08184814453125, 0.08697128295898438, 0.09209442138671875, 0.09721755981445312, 0.1023406982421875, 0.10746383666992188, 0.11258697509765625, 0.11771011352539062, 0.122833251953125, 0.12795639038085938, 0.13307952880859375, 0.13820266723632812, 0.1433258056640625, 0.14844894409179688, 0.15357208251953125, 0.15869522094726562, 0.163818359375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 6.0, 6.0, 12.0, 14.0, 24.0, 37.0, 60.0, 109.0, 236.0, 495.0, 1255.0, 4028.0, 20170.0, 215857.0, 710464.0, 81264.0, 10412.0, 2464.0, 863.0, 378.0, 167.0, 85.0, 56.0, 30.0, 17.0, 12.0, 9.0, 9.0, 4.0, 9.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0142364501953125, -0.013715267181396484, -0.013194084167480469, -0.012672901153564453, -0.012151718139648438, -0.011630535125732422, -0.011109352111816406, -0.01058816909790039, -0.010066986083984375, -0.00954580307006836, -0.009024620056152344, -0.008503437042236328, -0.007982254028320312, -0.007461071014404297, -0.006939888000488281, -0.006418704986572266, -0.00589752197265625, -0.005376338958740234, -0.004855155944824219, -0.004333972930908203, -0.0038127899169921875, -0.003291606903076172, -0.0027704238891601562, -0.0022492408752441406, -0.001728057861328125, -0.0012068748474121094, -0.0006856918334960938, -0.00016450881958007812, 0.0003566741943359375, 0.0008778572082519531, 0.0013990402221679688, 0.0019202232360839844, 0.00244140625, 0.0029625892639160156, 0.0034837722778320312, 0.004004955291748047, 0.0045261383056640625, 0.005047321319580078, 0.005568504333496094, 0.006089687347412109, 0.006610870361328125, 0.007132053375244141, 0.007653236389160156, 0.008174419403076172, 0.008695602416992188, 0.009216785430908203, 0.009737968444824219, 0.010259151458740234, 0.01078033447265625, 0.011301517486572266, 0.011822700500488281, 0.012343883514404297, 0.012865066528320312, 0.013386249542236328, 0.013907432556152344, 0.01442861557006836, 0.014949798583984375, 0.01547098159790039, 0.015992164611816406, 0.016513347625732422, 0.017034530639648438, 0.017555713653564453, 0.01807689666748047, 0.018598079681396484, 0.0191192626953125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 9.0, 6.0, 12.0, 18.0, 15.0, 37.0, 32.0, 57.0, 58.0, 57.0, 107.0, 75.0, 125.0, 82.0, 68.0, 53.0, 43.0, 43.0, 23.0, 27.0, 9.0, 12.0, 12.0, 6.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.841255187988281e-06, -5.638226866722107e-06, -5.435198545455933e-06, -5.232170224189758e-06, -5.029141902923584e-06, -4.82611358165741e-06, -4.623085260391235e-06, -4.420056939125061e-06, -4.217028617858887e-06, -4.014000296592712e-06, -3.810971975326538e-06, -3.6079436540603638e-06, -3.4049153327941895e-06, -3.201887011528015e-06, -2.998858690261841e-06, -2.7958303689956665e-06, -2.592802047729492e-06, -2.389773726463318e-06, -2.1867454051971436e-06, -1.9837170839309692e-06, -1.780688762664795e-06, -1.5776604413986206e-06, -1.3746321201324463e-06, -1.171603798866272e-06, -9.685754776000977e-07, -7.655471563339233e-07, -5.62518835067749e-07, -3.594905138015747e-07, -1.564621925354004e-07, 4.6566128730773926e-08, 2.4959444999694824e-07, 4.5262277126312256e-07, 6.556510925292969e-07, 8.586794137954712e-07, 1.0617077350616455e-06, 1.2647360563278198e-06, 1.4677643775939941e-06, 1.6707926988601685e-06, 1.8738210201263428e-06, 2.076849341392517e-06, 2.2798776626586914e-06, 2.4829059839248657e-06, 2.68593430519104e-06, 2.8889626264572144e-06, 3.0919909477233887e-06, 3.295019268989563e-06, 3.4980475902557373e-06, 3.7010759115219116e-06, 3.904104232788086e-06, 4.10713255405426e-06, 4.3101608753204346e-06, 4.513189196586609e-06, 4.716217517852783e-06, 4.9192458391189575e-06, 5.122274160385132e-06, 5.325302481651306e-06, 5.5283308029174805e-06, 5.731359124183655e-06, 5.934387445449829e-06, 6.137415766716003e-06, 6.340444087982178e-06, 6.543472409248352e-06, 6.746500730514526e-06, 6.949529051780701e-06, 7.152557373046875e-06]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 9.0, 7.0, 3.0, 14.0, 15.0, 33.0, 27.0, 41.0, 62.0, 113.0, 150.0, 234.0, 443.0, 830.0, 1940.0, 4786.0, 15297.0, 64376.0, 313413.0, 481180.0, 126005.0, 26734.0, 7441.0, 2755.0, 1157.0, 603.0, 321.0, 194.0, 113.0, 87.0, 53.0, 43.0, 19.0, 18.0, 10.0, 14.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00933837890625, -0.009018659591674805, -0.00869894027709961, -0.008379220962524414, -0.008059501647949219, -0.0077397823333740234, -0.007420063018798828, -0.007100343704223633, -0.0067806243896484375, -0.006460905075073242, -0.006141185760498047, -0.0058214664459228516, -0.005501747131347656, -0.005182027816772461, -0.004862308502197266, -0.00454258918762207, -0.004222869873046875, -0.0039031505584716797, -0.0035834312438964844, -0.003263711929321289, -0.0029439926147460938, -0.0026242733001708984, -0.002304553985595703, -0.001984834671020508, -0.0016651153564453125, -0.0013453960418701172, -0.0010256767272949219, -0.0007059574127197266, -0.00038623809814453125, -6.651878356933594e-05, 0.0002532005310058594, 0.0005729198455810547, 0.00089263916015625, 0.0012123584747314453, 0.0015320777893066406, 0.001851797103881836, 0.0021715164184570312, 0.0024912357330322266, 0.002810955047607422, 0.003130674362182617, 0.0034503936767578125, 0.003770112991333008, 0.004089832305908203, 0.0044095516204833984, 0.004729270935058594, 0.005048990249633789, 0.005368709564208984, 0.00568842887878418, 0.006008148193359375, 0.00632786750793457, 0.006647586822509766, 0.006967306137084961, 0.007287025451660156, 0.0076067447662353516, 0.007926464080810547, 0.008246183395385742, 0.008565902709960938, 0.008885622024536133, 0.009205341339111328, 0.009525060653686523, 0.009844779968261719, 0.010164499282836914, 0.01048421859741211, 0.010803937911987305, 0.0111236572265625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 6.0, 12.0, 7.0, 15.0, 21.0, 19.0, 30.0, 35.0, 44.0, 68.0, 49.0, 63.0, 70.0, 78.0, 79.0, 58.0, 71.0, 61.0, 32.0, 46.0, 34.0, 30.0, 16.0, 10.0, 13.0, 12.0, 6.0, 3.0, 5.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0029659271240234375, -0.0028780102729797363, -0.002790093421936035, -0.002702176570892334, -0.002614259719848633, -0.0025263428688049316, -0.0024384260177612305, -0.0023505091667175293, -0.002262592315673828, -0.002174675464630127, -0.0020867586135864258, -0.0019988417625427246, -0.0019109249114990234, -0.0018230080604553223, -0.001735091209411621, -0.00164717435836792, -0.0015592575073242188, -0.0014713406562805176, -0.0013834238052368164, -0.0012955069541931152, -0.001207590103149414, -0.0011196732521057129, -0.0010317564010620117, -0.0009438395500183105, -0.0008559226989746094, -0.0007680058479309082, -0.000680088996887207, -0.0005921721458435059, -0.0005042552947998047, -0.0004163384437561035, -0.00032842159271240234, -0.00024050474166870117, -0.000152587890625, -6.467103958129883e-05, 2.3245811462402344e-05, 0.00011116266250610352, 0.0001990795135498047, 0.00028699636459350586, 0.00037491321563720703, 0.0004628300666809082, 0.0005507469177246094, 0.0006386637687683105, 0.0007265806198120117, 0.0008144974708557129, 0.0009024143218994141, 0.0009903311729431152, 0.0010782480239868164, 0.0011661648750305176, 0.0012540817260742188, 0.00134199857711792, 0.001429915428161621, 0.0015178322792053223, 0.0016057491302490234, 0.0016936659812927246, 0.0017815828323364258, 0.001869499683380127, 0.001957416534423828, 0.0020453333854675293, 0.0021332502365112305, 0.0022211670875549316, 0.002309083938598633, 0.002397000789642334, 0.002484917640686035, 0.0025728344917297363, 0.0026607513427734375]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 7.0, 13.0, 15.0, 52.0, 94.0, 169.0, 214.0, 188.0, 104.0, 61.0, 26.0, 24.0, 7.0, 7.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3339976370334625, -0.32557156682014465, -0.3171454668045044, -0.3087193965911865, -0.30029332637786865, -0.2918672561645508, -0.2834411859512329, -0.27501508593559265, -0.2665890157222748, -0.2581629455089569, -0.24973686039447784, -0.24131077527999878, -0.2328847050666809, -0.22445863485336304, -0.21603254973888397, -0.2076064646244049, -0.19918039441108704, -0.19075432419776917, -0.1823282390832901, -0.17390215396881104, -0.16547608375549316, -0.1570500135421753, -0.14862392842769623, -0.14019784331321716, -0.1317717730998993, -0.12334569543600082, -0.11491961777210236, -0.10649354010820389, -0.09806746244430542, -0.08964138478040695, -0.08121530711650848, -0.07278922945261002, -0.06436315178871155, -0.05593707412481308, -0.04751099646091461, -0.039084918797016144, -0.030658841133117676, -0.022232763469219208, -0.01380668580532074, -0.005380608141422272, 0.0030454695224761963, 0.011471547186374664, 0.019897624850273132, 0.0283237025141716, 0.03674978017807007, 0.045175857841968536, 0.053601935505867004, 0.06202801316976547, 0.07045409083366394, 0.07888016849756241, 0.08730624616146088, 0.09573232382535934, 0.10415840148925781, 0.11258447915315628, 0.12101055681705475, 0.1294366419315338, 0.13786271214485168, 0.14628878235816956, 0.15471486747264862, 0.16314095258712769, 0.17156702280044556, 0.17999309301376343, 0.1884191781282425, 0.19684526324272156, 0.20527133345603943]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 6.0, 6.0, 8.0, 17.0, 14.0, 24.0, 20.0, 29.0, 23.0, 35.0, 43.0, 37.0, 48.0, 41.0, 49.0, 64.0, 66.0, 52.0, 54.0, 58.0, 48.0, 34.0, 45.0, 35.0, 30.0, 24.0, 17.0, 14.0, 14.0, 12.0, 9.0, 5.0, 7.0, 0.0, 2.0, 4.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0979456678032875, -0.09462704509496689, -0.09130841493606567, -0.08798979222774506, -0.08467116206884384, -0.08135253936052322, -0.07803390920162201, -0.07471528649330139, -0.07139666378498077, -0.06807804107666016, -0.06475941091775894, -0.061440788209438324, -0.05812216177582741, -0.05480353534221649, -0.051484908908605576, -0.04816628247499466, -0.04484765604138374, -0.04152902960777283, -0.03821040317416191, -0.034891776740550995, -0.03157315403223038, -0.02825452759861946, -0.024935901165008545, -0.021617276594042778, -0.018298650160431862, -0.01498002465814352, -0.011661399155855179, -0.008342772722244263, -0.005024147219955921, -0.0017055217176675797, 0.0016131047159433365, 0.004931729286909103, 0.00825035572052002, 0.011568981222808361, 0.014887606725096703, 0.01820623315870762, 0.021524857729673386, 0.024843484163284302, 0.028162110596895218, 0.031480737030506134, 0.03479935973882675, 0.03811798617243767, 0.041436612606048584, 0.0447552353143692, 0.04807386174798012, 0.051392488181591034, 0.05471111461520195, 0.058029741048812866, 0.06134836748242378, 0.0646669939160347, 0.06798561662435532, 0.07130424678325653, 0.07462286949157715, 0.07794149219989777, 0.08126012235879898, 0.0845787450671196, 0.08789737522602081, 0.09121599793434143, 0.09453462809324265, 0.09785325080156326, 0.10117188096046448, 0.1044905036687851, 0.10780912637710571, 0.11112775653600693, 0.11444637924432755]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 7.0, 6.0, 2.0, 10.0, 21.0, 10.0, 23.0, 34.0, 49.0, 63.0, 128.0, 142.0, 268.0, 429.0, 689.0, 1210.0, 2213.0, 4444.0, 9748.0, 23440.0, 68303.0, 287531.0, 477539.0, 111663.0, 34522.0, 13509.0, 5880.0, 2901.0, 1538.0, 831.0, 506.0, 293.0, 186.0, 145.0, 91.0, 47.0, 44.0, 28.0, 22.0, 17.0, 10.0, 11.0, 2.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0711669921875, -0.06864261627197266, -0.06611824035644531, -0.06359386444091797, -0.061069488525390625, -0.05854511260986328, -0.05602073669433594, -0.053496360778808594, -0.05097198486328125, -0.048447608947753906, -0.04592323303222656, -0.04339885711669922, -0.040874481201171875, -0.03835010528564453, -0.03582572937011719, -0.033301353454589844, -0.0307769775390625, -0.028252601623535156, -0.025728225708007812, -0.02320384979248047, -0.020679473876953125, -0.01815509796142578, -0.015630722045898438, -0.013106346130371094, -0.01058197021484375, -0.008057594299316406, -0.0055332183837890625, -0.0030088424682617188, -0.000484466552734375, 0.0020399093627929688, 0.0045642852783203125, 0.007088661193847656, 0.009613037109375, 0.012137413024902344, 0.014661788940429688, 0.01718616485595703, 0.019710540771484375, 0.02223491668701172, 0.024759292602539062, 0.027283668518066406, 0.02980804443359375, 0.032332420349121094, 0.03485679626464844, 0.03738117218017578, 0.039905548095703125, 0.04242992401123047, 0.04495429992675781, 0.047478675842285156, 0.0500030517578125, 0.052527427673339844, 0.05505180358886719, 0.05757617950439453, 0.060100555419921875, 0.06262493133544922, 0.06514930725097656, 0.0676736831665039, 0.07019805908203125, 0.0727224349975586, 0.07524681091308594, 0.07777118682861328, 0.08029556274414062, 0.08281993865966797, 0.08534431457519531, 0.08786869049072266, 0.09039306640625]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 11.0, 12.0, 9.0, 16.0, 18.0, 22.0, 22.0, 39.0, 43.0, 48.0, 46.0, 52.0, 62.0, 74.0, 65.0, 57.0, 57.0, 65.0, 43.0, 40.0, 42.0, 32.0, 20.0, 19.0, 19.0, 14.0, 12.0, 7.0, 4.0, 4.0, 3.0, 3.0, 5.0, 5.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.211669921875, -0.20444107055664062, -0.19721221923828125, -0.18998336791992188, -0.1827545166015625, -0.17552566528320312, -0.16829681396484375, -0.16106796264648438, -0.153839111328125, -0.14661026000976562, -0.13938140869140625, -0.13215255737304688, -0.1249237060546875, -0.11769485473632812, -0.11046600341796875, -0.10323715209960938, -0.09600830078125, -0.08877944946289062, -0.08155059814453125, -0.07432174682617188, -0.0670928955078125, -0.059864044189453125, -0.05263519287109375, -0.045406341552734375, -0.038177490234375, -0.030948638916015625, -0.02371978759765625, -0.016490936279296875, -0.0092620849609375, -0.002033233642578125, 0.00519561767578125, 0.012424468994140625, 0.0196533203125, 0.026882171630859375, 0.03411102294921875, 0.041339874267578125, 0.0485687255859375, 0.055797576904296875, 0.06302642822265625, 0.07025527954101562, 0.077484130859375, 0.08471298217773438, 0.09194183349609375, 0.09917068481445312, 0.1063995361328125, 0.11362838745117188, 0.12085723876953125, 0.12808609008789062, 0.13531494140625, 0.14254379272460938, 0.14977264404296875, 0.15700149536132812, 0.1642303466796875, 0.17145919799804688, 0.17868804931640625, 0.18591690063476562, 0.193145751953125, 0.20037460327148438, 0.20760345458984375, 0.21483230590820312, 0.2220611572265625, 0.22929000854492188, 0.23651885986328125, 0.24374771118164062, 0.2509765625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 0.0, 3.0, 8.0, 5.0, 8.0, 6.0, 8.0, 28.0, 31.0, 48.0, 97.0, 193.0, 491.0, 1489.0, 13253.0, 804644.0, 219947.0, 6499.0, 1046.0, 351.0, 157.0, 89.0, 51.0, 29.0, 21.0, 8.0, 11.0, 7.0, 6.0, 6.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28759765625, -0.27857208251953125, -0.2695465087890625, -0.26052093505859375, -0.251495361328125, -0.24246978759765625, -0.2334442138671875, -0.22441864013671875, -0.21539306640625, -0.20636749267578125, -0.1973419189453125, -0.18831634521484375, -0.179290771484375, -0.17026519775390625, -0.1612396240234375, -0.15221405029296875, -0.1431884765625, -0.13416290283203125, -0.1251373291015625, -0.11611175537109375, -0.107086181640625, -0.09806060791015625, -0.0890350341796875, -0.08000946044921875, -0.07098388671875, -0.06195831298828125, -0.0529327392578125, -0.04390716552734375, -0.034881591796875, -0.02585601806640625, -0.0168304443359375, -0.00780487060546875, 0.001220703125, 0.01024627685546875, 0.0192718505859375, 0.02829742431640625, 0.037322998046875, 0.04634857177734375, 0.0553741455078125, 0.06439971923828125, 0.07342529296875, 0.08245086669921875, 0.0914764404296875, 0.10050201416015625, 0.109527587890625, 0.11855316162109375, 0.1275787353515625, 0.13660430908203125, 0.1456298828125, 0.15465545654296875, 0.1636810302734375, 0.17270660400390625, 0.181732177734375, 0.19075775146484375, 0.1997833251953125, 0.20880889892578125, 0.21783447265625, 0.22686004638671875, 0.2358856201171875, 0.24491119384765625, 0.253936767578125, 0.26296234130859375, 0.2719879150390625, 0.28101348876953125, 0.2900390625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 8.0, 8.0, 8.0, 10.0, 19.0, 21.0, 22.0, 32.0, 33.0, 32.0, 29.0, 37.0, 47.0, 35.0, 55.0, 53.0, 48.0, 51.0, 54.0, 36.0, 32.0, 33.0, 33.0, 38.0, 23.0, 27.0, 31.0, 22.0, 25.0, 18.0, 15.0, 16.0, 11.0, 10.0, 4.0, 5.0, 4.0, 1.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.221923828125, -0.21456527709960938, -0.20720672607421875, -0.19984817504882812, -0.1924896240234375, -0.18513107299804688, -0.17777252197265625, -0.17041397094726562, -0.163055419921875, -0.15569686889648438, -0.14833831787109375, -0.14097976684570312, -0.1336212158203125, -0.12626266479492188, -0.11890411376953125, -0.11154556274414062, -0.10418701171875, -0.09682846069335938, -0.08946990966796875, -0.08211135864257812, -0.0747528076171875, -0.06739425659179688, -0.06003570556640625, -0.052677154541015625, -0.045318603515625, -0.037960052490234375, -0.03060150146484375, -0.023242950439453125, -0.0158843994140625, -0.008525848388671875, -0.00116729736328125, 0.006191253662109375, 0.0135498046875, 0.020908355712890625, 0.02826690673828125, 0.035625457763671875, 0.0429840087890625, 0.050342559814453125, 0.05770111083984375, 0.06505966186523438, 0.072418212890625, 0.07977676391601562, 0.08713531494140625, 0.09449386596679688, 0.1018524169921875, 0.10921096801757812, 0.11656951904296875, 0.12392807006835938, 0.13128662109375, 0.13864517211914062, 0.14600372314453125, 0.15336227416992188, 0.1607208251953125, 0.16807937622070312, 0.17543792724609375, 0.18279647827148438, 0.190155029296875, 0.19751358032226562, 0.20487213134765625, 0.21223068237304688, 0.2195892333984375, 0.22694778442382812, 0.23430633544921875, 0.24166488647460938, 0.2490234375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 7.0, 19.0, 14.0, 24.0, 33.0, 64.0, 103.0, 255.0, 1063.0, 10755.0, 949727.0, 82892.0, 2758.0, 476.0, 160.0, 59.0, 40.0, 38.0, 15.0, 13.0, 9.0, 9.0, 5.0, 9.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1317138671875, -0.1272869110107422, -0.12285995483398438, -0.11843299865722656, -0.11400604248046875, -0.10957908630371094, -0.10515213012695312, -0.10072517395019531, -0.0962982177734375, -0.09187126159667969, -0.08744430541992188, -0.08301734924316406, -0.07859039306640625, -0.07416343688964844, -0.06973648071289062, -0.06530952453613281, -0.060882568359375, -0.05645561218261719, -0.052028656005859375, -0.04760169982910156, -0.04317474365234375, -0.03874778747558594, -0.034320831298828125, -0.029893875122070312, -0.0254669189453125, -0.021039962768554688, -0.016613006591796875, -0.012186050415039062, -0.00775909423828125, -0.0033321380615234375, 0.001094818115234375, 0.0055217742919921875, 0.00994873046875, 0.014375686645507812, 0.018802642822265625, 0.023229598999023438, 0.02765655517578125, 0.03208351135253906, 0.036510467529296875, 0.04093742370605469, 0.0453643798828125, 0.04979133605957031, 0.054218292236328125, 0.05864524841308594, 0.06307220458984375, 0.06749916076660156, 0.07192611694335938, 0.07635307312011719, 0.080780029296875, 0.08520698547363281, 0.08963394165039062, 0.09406089782714844, 0.09848785400390625, 0.10291481018066406, 0.10734176635742188, 0.11176872253417969, 0.1161956787109375, 0.12062263488769531, 0.12504959106445312, 0.12947654724121094, 0.13390350341796875, 0.13833045959472656, 0.14275741577148438, 0.1471843719482422, 0.151611328125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 3.0, 6.0, 8.0, 7.0, 7.0, 19.0, 24.0, 42.0, 68.0, 109.0, 195.0, 203.0, 129.0, 64.0, 34.0, 27.0, 13.0, 14.0, 12.0, 5.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2993812561035156e-05, -1.2575648725032806e-05, -1.2157484889030457e-05, -1.1739321053028107e-05, -1.1321157217025757e-05, -1.0902993381023407e-05, -1.0484829545021057e-05, -1.0066665709018707e-05, -9.648501873016357e-06, -9.230338037014008e-06, -8.812174201011658e-06, -8.394010365009308e-06, -7.975846529006958e-06, -7.557682693004608e-06, -7.139518857002258e-06, -6.7213550209999084e-06, -6.303191184997559e-06, -5.885027348995209e-06, -5.466863512992859e-06, -5.048699676990509e-06, -4.630535840988159e-06, -4.212372004985809e-06, -3.7942081689834595e-06, -3.3760443329811096e-06, -2.9578804969787598e-06, -2.53971666097641e-06, -2.12155282497406e-06, -1.7033889889717102e-06, -1.2852251529693604e-06, -8.670613169670105e-07, -4.4889748096466064e-07, -3.073364496231079e-08, 3.8743019104003906e-07, 8.055940270423889e-07, 1.2237578630447388e-06, 1.6419216990470886e-06, 2.0600855350494385e-06, 2.4782493710517883e-06, 2.896413207054138e-06, 3.314577043056488e-06, 3.732740879058838e-06, 4.150904715061188e-06, 4.569068551063538e-06, 4.9872323870658875e-06, 5.405396223068237e-06, 5.823560059070587e-06, 6.241723895072937e-06, 6.659887731075287e-06, 7.078051567077637e-06, 7.4962154030799866e-06, 7.914379239082336e-06, 8.332543075084686e-06, 8.750706911087036e-06, 9.168870747089386e-06, 9.587034583091736e-06, 1.0005198419094086e-05, 1.0423362255096436e-05, 1.0841526091098785e-05, 1.1259689927101135e-05, 1.1677853763103485e-05, 1.2096017599105835e-05, 1.2514181435108185e-05, 1.2932345271110535e-05, 1.3350509107112885e-05, 1.3768672943115234e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 8.0, 14.0, 14.0, 54.0, 103.0, 427.0, 2932.0, 647226.0, 394474.0, 2684.0, 397.0, 114.0, 40.0, 22.0, 13.0, 13.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1622314453125, -0.15517234802246094, -0.14811325073242188, -0.1410541534423828, -0.13399505615234375, -0.1269359588623047, -0.11987686157226562, -0.11281776428222656, -0.1057586669921875, -0.09869956970214844, -0.09164047241210938, -0.08458137512207031, -0.07752227783203125, -0.07046318054199219, -0.06340408325195312, -0.05634498596191406, -0.049285888671875, -0.04222679138183594, -0.035167694091796875, -0.028108596801757812, -0.02104949951171875, -0.013990402221679688, -0.006931304931640625, 0.0001277923583984375, 0.0071868896484375, 0.014245986938476562, 0.021305084228515625, 0.028364181518554688, 0.03542327880859375, 0.04248237609863281, 0.049541473388671875, 0.05660057067871094, 0.06365966796875, 0.07071876525878906, 0.07777786254882812, 0.08483695983886719, 0.09189605712890625, 0.09895515441894531, 0.10601425170898438, 0.11307334899902344, 0.1201324462890625, 0.12719154357910156, 0.13425064086914062, 0.1413097381591797, 0.14836883544921875, 0.1554279327392578, 0.16248703002929688, 0.16954612731933594, 0.176605224609375, 0.18366432189941406, 0.19072341918945312, 0.1977825164794922, 0.20484161376953125, 0.2119007110595703, 0.21895980834960938, 0.22601890563964844, 0.2330780029296875, 0.24013710021972656, 0.24719619750976562, 0.2542552947998047, 0.26131439208984375, 0.2683734893798828, 0.2754325866699219, 0.28249168395996094, 0.28955078125]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 7.0, 8.0, 12.0, 17.0, 44.0, 53.0, 115.0, 258.0, 231.0, 109.0, 56.0, 38.0, 13.0, 10.0, 6.0, 6.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.054962158203125, -0.05368375778198242, -0.052405357360839844, -0.051126956939697266, -0.04984855651855469, -0.04857015609741211, -0.04729175567626953, -0.04601335525512695, -0.044734954833984375, -0.0434565544128418, -0.04217815399169922, -0.04089975357055664, -0.03962135314941406, -0.038342952728271484, -0.037064552307128906, -0.03578615188598633, -0.03450775146484375, -0.03322935104370117, -0.031950950622558594, -0.030672550201416016, -0.029394149780273438, -0.02811574935913086, -0.02683734893798828, -0.025558948516845703, -0.024280548095703125, -0.023002147674560547, -0.02172374725341797, -0.02044534683227539, -0.019166946411132812, -0.017888545989990234, -0.016610145568847656, -0.015331745147705078, -0.0140533447265625, -0.012774944305419922, -0.011496543884277344, -0.010218143463134766, -0.008939743041992188, -0.007661342620849609, -0.006382942199707031, -0.005104541778564453, -0.003826141357421875, -0.002547740936279297, -0.0012693405151367188, 9.059906005859375e-06, 0.0012874603271484375, 0.0025658607482910156, 0.0038442611694335938, 0.005122661590576172, 0.00640106201171875, 0.007679462432861328, 0.008957862854003906, 0.010236263275146484, 0.011514663696289062, 0.01279306411743164, 0.014071464538574219, 0.015349864959716797, 0.016628265380859375, 0.017906665802001953, 0.01918506622314453, 0.02046346664428711, 0.021741867065429688, 0.023020267486572266, 0.024298667907714844, 0.025577068328857422, 0.02685546875]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 4.0, 7.0, 11.0, 12.0, 34.0, 74.0, 112.0, 183.0, 183.0, 145.0, 95.0, 52.0, 34.0, 22.0, 11.0, 7.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38317203521728516, -0.3685572147369385, -0.3539423644542694, -0.33932754397392273, -0.32471272349357605, -0.310097873210907, -0.2954830527305603, -0.2808682322502136, -0.26625341176986694, -0.25163859128952026, -0.2370237559080124, -0.22240892052650452, -0.20779410004615784, -0.19317926466464996, -0.1785644292831421, -0.1639496088027954, -0.14933475852012634, -0.13471992313861847, -0.12010510265827179, -0.10549026727676392, -0.09087543934583664, -0.07626061141490936, -0.06164577603340149, -0.04703094810247421, -0.032416120171546936, -0.01780129037797451, -0.0031864605844020844, 0.01142837107181549, 0.026043199002742767, 0.040658026933670044, 0.05527286231517792, 0.0698876902461052, 0.08450251817703247, 0.09911734610795975, 0.11373217403888702, 0.1283470094203949, 0.14296182990074158, 0.15757666528224945, 0.17219150066375732, 0.186806321144104, 0.20142115652561188, 0.21603599190711975, 0.23065081238746643, 0.2452656477689743, 0.2598804831504822, 0.27449530363082886, 0.28911012411117554, 0.3037249743938446, 0.3183397948741913, 0.33295461535453796, 0.34756946563720703, 0.3621842861175537, 0.3767991065979004, 0.39141392707824707, 0.40602877736091614, 0.4206435978412628, 0.4352584481239319, 0.44987326860427856, 0.46448811888694763, 0.4791029393672943, 0.493717759847641, 0.5083326101303101, 0.5229474306106567, 0.5375622510910034, 0.5521770715713501]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 1.0, 1.0, 3.0, 6.0, 4.0, 12.0, 10.0, 13.0, 13.0, 22.0, 22.0, 24.0, 21.0, 23.0, 36.0, 34.0, 43.0, 39.0, 26.0, 44.0, 44.0, 48.0, 51.0, 43.0, 29.0, 33.0, 40.0, 41.0, 30.0, 30.0, 24.0, 25.0, 25.0, 28.0, 20.0, 20.0, 12.0, 10.0, 10.0, 10.0, 6.0, 7.0, 5.0, 5.0, 5.0, 4.0, 3.0, 1.0, 0.0, 4.0, 0.0, 2.0], "bins": [-0.388520210981369, -0.37729737162590027, -0.3660745322704315, -0.35485169291496277, -0.343628853559494, -0.33240601420402527, -0.32118314504623413, -0.3099603056907654, -0.29873746633529663, -0.2875146269798279, -0.27629178762435913, -0.2650689482688904, -0.25384610891342163, -0.24262326955795288, -0.23140041530132294, -0.2201775759458542, -0.20895475149154663, -0.19773191213607788, -0.18650907278060913, -0.17528623342514038, -0.16406339406967163, -0.15284055471420288, -0.14161770045757294, -0.1303948611021042, -0.11917202174663544, -0.10794918239116669, -0.09672634303569794, -0.08550349622964859, -0.07428065687417984, -0.06305781751871109, -0.05183497071266174, -0.04061213135719299, -0.029389262199401855, -0.018166420981287956, -0.006943579763174057, 0.0042792633175849915, 0.015502102673053741, 0.02672494202852249, 0.03794778883457184, 0.04917062819004059, 0.06039346754550934, 0.07161630690097809, 0.08283914625644684, 0.09406199306249619, 0.10528483241796494, 0.11650767177343369, 0.12773051857948303, 0.13895335793495178, 0.15017619729042053, 0.16139903664588928, 0.17262187600135803, 0.18384471535682678, 0.19506755471229553, 0.20629039406776428, 0.21751324832439423, 0.22873608767986298, 0.23995892703533173, 0.25118178129196167, 0.2624046206474304, 0.27362746000289917, 0.2848502993583679, 0.29607313871383667, 0.3072959780693054, 0.31851881742477417, 0.3297416567802429]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 4.0, 3.0, 1.0, 12.0, 10.0, 10.0, 20.0, 26.0, 42.0, 53.0, 88.0, 155.0, 238.0, 417.0, 702.0, 1389.0, 2951.0, 7843.0, 32816.0, 368109.0, 3315159.0, 417360.0, 32846.0, 7895.0, 2997.0, 1382.0, 721.0, 400.0, 240.0, 145.0, 76.0, 60.0, 39.0, 33.0, 7.0, 14.0, 8.0, 8.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.226318359375, -0.2193584442138672, -0.21239852905273438, -0.20543861389160156, -0.19847869873046875, -0.19151878356933594, -0.18455886840820312, -0.1775989532470703, -0.1706390380859375, -0.1636791229248047, -0.15671920776367188, -0.14975929260253906, -0.14279937744140625, -0.13583946228027344, -0.12887954711914062, -0.12191963195800781, -0.114959716796875, -0.10799980163574219, -0.10103988647460938, -0.09407997131347656, -0.08712005615234375, -0.08016014099121094, -0.07320022583007812, -0.06624031066894531, -0.0592803955078125, -0.05232048034667969, -0.045360565185546875, -0.03840065002441406, -0.03144073486328125, -0.024480819702148438, -0.017520904541015625, -0.010560989379882812, -0.00360107421875, 0.0033588409423828125, 0.010318756103515625, 0.017278671264648438, 0.02423858642578125, 0.031198501586914062, 0.038158416748046875, 0.04511833190917969, 0.0520782470703125, 0.05903816223144531, 0.06599807739257812, 0.07295799255371094, 0.07991790771484375, 0.08687782287597656, 0.09383773803710938, 0.10079765319824219, 0.107757568359375, 0.11471748352050781, 0.12167739868164062, 0.12863731384277344, 0.13559722900390625, 0.14255714416503906, 0.14951705932617188, 0.1564769744873047, 0.1634368896484375, 0.1703968048095703, 0.17735671997070312, 0.18431663513183594, 0.19127655029296875, 0.19823646545410156, 0.20519638061523438, 0.2121562957763672, 0.2191162109375]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 5.0, 1.0, 3.0, 5.0, 8.0, 7.0, 11.0, 21.0, 14.0, 16.0, 34.0, 28.0, 29.0, 38.0, 47.0, 55.0, 49.0, 61.0, 52.0, 45.0, 71.0, 45.0, 55.0, 48.0, 44.0, 34.0, 31.0, 19.0, 31.0, 18.0, 20.0, 10.0, 19.0, 6.0, 2.0, 7.0, 2.0, 3.0, 5.0, 0.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.098876953125, -0.09499549865722656, -0.09111404418945312, -0.08723258972167969, -0.08335113525390625, -0.07946968078613281, -0.07558822631835938, -0.07170677185058594, -0.0678253173828125, -0.06394386291503906, -0.060062408447265625, -0.05618095397949219, -0.05229949951171875, -0.04841804504394531, -0.044536590576171875, -0.04065513610839844, -0.036773681640625, -0.03289222717285156, -0.029010772705078125, -0.025129318237304688, -0.02124786376953125, -0.017366409301757812, -0.013484954833984375, -0.009603500366210938, -0.0057220458984375, -0.0018405914306640625, 0.002040863037109375, 0.0059223175048828125, 0.00980377197265625, 0.013685226440429688, 0.017566680908203125, 0.021448135375976562, 0.02532958984375, 0.029211044311523438, 0.033092498779296875, 0.03697395324707031, 0.04085540771484375, 0.04473686218261719, 0.048618316650390625, 0.05249977111816406, 0.0563812255859375, 0.06026268005371094, 0.06414413452148438, 0.06802558898925781, 0.07190704345703125, 0.07578849792480469, 0.07966995239257812, 0.08355140686035156, 0.087432861328125, 0.09131431579589844, 0.09519577026367188, 0.09907722473144531, 0.10295867919921875, 0.10684013366699219, 0.11072158813476562, 0.11460304260253906, 0.1184844970703125, 0.12236595153808594, 0.12624740600585938, 0.1301288604736328, 0.13401031494140625, 0.1378917694091797, 0.14177322387695312, 0.14565467834472656, 0.1495361328125]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 8.0, 6.0, 13.0, 8.0, 18.0, 24.0, 37.0, 83.0, 107.0, 284.0, 622.0, 2225.0, 14292.0, 1135959.0, 3018251.0, 18474.0, 2569.0, 737.0, 272.0, 127.0, 64.0, 27.0, 22.0, 18.0, 3.0, 10.0, 6.0, 3.0, 7.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.322509765625, -0.3085212707519531, -0.29453277587890625, -0.2805442810058594, -0.2665557861328125, -0.2525672912597656, -0.23857879638671875, -0.22459030151367188, -0.210601806640625, -0.19661331176757812, -0.18262481689453125, -0.16863632202148438, -0.1546478271484375, -0.14065933227539062, -0.12667083740234375, -0.11268234252929688, -0.09869384765625, -0.08470535278320312, -0.07071685791015625, -0.056728363037109375, -0.0427398681640625, -0.028751373291015625, -0.01476287841796875, -0.000774383544921875, 0.013214111328125, 0.027202606201171875, 0.04119110107421875, 0.055179595947265625, 0.0691680908203125, 0.08315658569335938, 0.09714508056640625, 0.11113357543945312, 0.1251220703125, 0.13911056518554688, 0.15309906005859375, 0.16708755493164062, 0.1810760498046875, 0.19506454467773438, 0.20905303955078125, 0.22304153442382812, 0.237030029296875, 0.2510185241699219, 0.26500701904296875, 0.2789955139160156, 0.2929840087890625, 0.3069725036621094, 0.32096099853515625, 0.3349494934082031, 0.34893798828125, 0.3629264831542969, 0.37691497802734375, 0.3909034729003906, 0.4048919677734375, 0.4188804626464844, 0.43286895751953125, 0.4468574523925781, 0.460845947265625, 0.4748344421386719, 0.48882293701171875, 0.5028114318847656, 0.5167999267578125, 0.5307884216308594, 0.5447769165039062, 0.5587654113769531, 0.57275390625]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 3.0, 3.0, 7.0, 7.0, 9.0, 10.0, 14.0, 35.0, 38.0, 99.0, 180.0, 313.0, 693.0, 1059.0, 753.0, 366.0, 180.0, 94.0, 75.0, 35.0, 26.0, 17.0, 15.0, 12.0, 7.0, 6.0, 9.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0906982421875, -0.0885167121887207, -0.0863351821899414, -0.08415365219116211, -0.08197212219238281, -0.07979059219360352, -0.07760906219482422, -0.07542753219604492, -0.07324600219726562, -0.07106447219848633, -0.06888294219970703, -0.06670141220092773, -0.06451988220214844, -0.06233835220336914, -0.060156822204589844, -0.05797529220581055, -0.05579376220703125, -0.05361223220825195, -0.051430702209472656, -0.04924917221069336, -0.04706764221191406, -0.044886112213134766, -0.04270458221435547, -0.04052305221557617, -0.038341522216796875, -0.03615999221801758, -0.03397846221923828, -0.031796932220458984, -0.029615402221679688, -0.02743387222290039, -0.025252342224121094, -0.023070812225341797, -0.0208892822265625, -0.018707752227783203, -0.016526222229003906, -0.01434469223022461, -0.012163162231445312, -0.009981632232666016, -0.007800102233886719, -0.005618572235107422, -0.003437042236328125, -0.0012555122375488281, 0.0009260177612304688, 0.0031075477600097656, 0.0052890777587890625, 0.007470607757568359, 0.009652137756347656, 0.011833667755126953, 0.01401519775390625, 0.016196727752685547, 0.018378257751464844, 0.02055978775024414, 0.022741317749023438, 0.024922847747802734, 0.02710437774658203, 0.029285907745361328, 0.031467437744140625, 0.03364896774291992, 0.03583049774169922, 0.038012027740478516, 0.04019355773925781, 0.04237508773803711, 0.044556617736816406, 0.0467381477355957, 0.048919677734375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 6.0, 5.0, 9.0, 19.0, 38.0, 83.0, 119.0, 174.0, 186.0, 148.0, 85.0, 64.0, 37.0, 9.0, 9.0, 4.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4136539697647095, -0.4022037088871002, -0.39075344800949097, -0.3793031871318817, -0.36785292625427246, -0.3564026653766632, -0.34495240449905396, -0.3335021436214447, -0.32205188274383545, -0.3106016218662262, -0.29915136098861694, -0.2877011001110077, -0.27625083923339844, -0.2648005783557892, -0.25335031747817993, -0.24190005660057068, -0.23044981062412262, -0.21899954974651337, -0.2075492888689041, -0.19609902799129486, -0.1846487671136856, -0.17319850623607635, -0.1617482602596283, -0.15029799938201904, -0.1388477385044098, -0.12739747762680054, -0.11594721674919128, -0.10449695587158203, -0.09304669499397278, -0.08159643411636353, -0.07014618068933487, -0.058695919811725616, -0.04724565148353577, -0.035795390605926514, -0.02434513159096241, -0.012894872575998306, -0.0014446116983890533, 0.0100056491792202, 0.021455906331539154, 0.03290616720914841, 0.04435642808675766, 0.05580668896436691, 0.06725694984197617, 0.07870720326900482, 0.09015746414661407, 0.10160772502422333, 0.11305798590183258, 0.12450824677944183, 0.1359585076570511, 0.14740876853466034, 0.1588590294122696, 0.17030929028987885, 0.1817595511674881, 0.19320981204509735, 0.2046600580215454, 0.21611031889915466, 0.22756057977676392, 0.23901084065437317, 0.2504611015319824, 0.2619113624095917, 0.2733616232872009, 0.2848118841648102, 0.29626214504241943, 0.3077124059200287, 0.31916266679763794]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 4.0, 7.0, 13.0, 8.0, 12.0, 12.0, 20.0, 23.0, 22.0, 35.0, 38.0, 31.0, 41.0, 39.0, 52.0, 27.0, 52.0, 47.0, 45.0, 44.0, 46.0, 46.0, 50.0, 47.0, 42.0, 35.0, 22.0, 38.0, 28.0, 15.0, 12.0, 6.0, 10.0, 4.0, 4.0, 7.0, 7.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11764003336429596, -0.11358009278774261, -0.10952015221118927, -0.10546021908521652, -0.10140027850866318, -0.09734033793210983, -0.09328040480613708, -0.08922046422958374, -0.0851605236530304, -0.08110058307647705, -0.0770406424999237, -0.07298070937395096, -0.06892076879739761, -0.06486082822084427, -0.06080089136958122, -0.056740954518318176, -0.05268101394176483, -0.04862107336521149, -0.04456113651394844, -0.040501199662685394, -0.03644125908613205, -0.032381318509578705, -0.02832138165831566, -0.024261442944407463, -0.020201504230499268, -0.016141565516591072, -0.012081626802682877, -0.008021688088774681, -0.003961749374866486, 9.81893390417099e-05, 0.004158128052949905, 0.008218066766858101, 0.01227802038192749, 0.016337959095835686, 0.02039789780974388, 0.024457836523652077, 0.028517775237560272, 0.03257771581411362, 0.03663765266537666, 0.04069758951663971, 0.044757530093193054, 0.0488174706697464, 0.052877407521009445, 0.05693734437227249, 0.060997284948825836, 0.06505722552537918, 0.06911715865135193, 0.07317709922790527, 0.07723703980445862, 0.08129698038101196, 0.08535692095756531, 0.08941685408353806, 0.0934767946600914, 0.09753673523664474, 0.10159666836261749, 0.10565660893917084, 0.10971654951572418, 0.11377649009227753, 0.11783643066883087, 0.12189636379480362, 0.12595629692077637, 0.1300162374973297, 0.13407617807388306, 0.1381361186504364, 0.14219605922698975]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 7.0, 8.0, 13.0, 11.0, 26.0, 29.0, 47.0, 73.0, 103.0, 164.0, 262.0, 395.0, 683.0, 1109.0, 1945.0, 3831.0, 8066.0, 21199.0, 95432.0, 613053.0, 241798.0, 37204.0, 11746.0, 5067.0, 2632.0, 1531.0, 825.0, 466.0, 288.0, 165.0, 138.0, 83.0, 48.0, 50.0, 19.0, 9.0, 9.0, 4.0, 6.0, 3.0, 2.0, 5.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.045806884765625, -0.04415416717529297, -0.04250144958496094, -0.040848731994628906, -0.039196014404296875, -0.037543296813964844, -0.03589057922363281, -0.03423786163330078, -0.03258514404296875, -0.03093242645263672, -0.029279708862304688, -0.027626991271972656, -0.025974273681640625, -0.024321556091308594, -0.022668838500976562, -0.02101612091064453, -0.0193634033203125, -0.01771068572998047, -0.016057968139648438, -0.014405250549316406, -0.012752532958984375, -0.011099815368652344, -0.009447097778320312, -0.007794380187988281, -0.00614166259765625, -0.004488945007324219, -0.0028362274169921875, -0.0011835098266601562, 0.000469207763671875, 0.0021219253540039062, 0.0037746429443359375, 0.005427360534667969, 0.007080078125, 0.008732795715332031, 0.010385513305664062, 0.012038230895996094, 0.013690948486328125, 0.015343666076660156, 0.016996383666992188, 0.01864910125732422, 0.02030181884765625, 0.02195453643798828, 0.023607254028320312, 0.025259971618652344, 0.026912689208984375, 0.028565406799316406, 0.030218124389648438, 0.03187084197998047, 0.0335235595703125, 0.03517627716064453, 0.03682899475097656, 0.038481712341308594, 0.040134429931640625, 0.041787147521972656, 0.04343986511230469, 0.04509258270263672, 0.04674530029296875, 0.04839801788330078, 0.05005073547363281, 0.051703453063964844, 0.053356170654296875, 0.055008888244628906, 0.05666160583496094, 0.05831432342529297, 0.059967041015625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 9.0, 9.0, 9.0, 14.0, 16.0, 30.0, 28.0, 34.0, 50.0, 55.0, 55.0, 61.0, 67.0, 70.0, 58.0, 66.0, 57.0, 61.0, 55.0, 44.0, 42.0, 35.0, 24.0, 12.0, 9.0, 10.0, 6.0, 7.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09808349609375, -0.09442615509033203, -0.09076881408691406, -0.0871114730834961, -0.08345413208007812, -0.07979679107666016, -0.07613945007324219, -0.07248210906982422, -0.06882476806640625, -0.06516742706298828, -0.06151008605957031, -0.057852745056152344, -0.054195404052734375, -0.050538063049316406, -0.04688072204589844, -0.04322338104248047, -0.0395660400390625, -0.03590869903564453, -0.03225135803222656, -0.028594017028808594, -0.024936676025390625, -0.021279335021972656, -0.017621994018554688, -0.013964653015136719, -0.01030731201171875, -0.006649971008300781, -0.0029926300048828125, 0.0006647109985351562, 0.004322052001953125, 0.007979393005371094, 0.011636734008789062, 0.015294075012207031, 0.018951416015625, 0.02260875701904297, 0.026266098022460938, 0.029923439025878906, 0.033580780029296875, 0.037238121032714844, 0.04089546203613281, 0.04455280303955078, 0.04821014404296875, 0.05186748504638672, 0.05552482604980469, 0.059182167053222656, 0.06283950805664062, 0.0664968490600586, 0.07015419006347656, 0.07381153106689453, 0.0774688720703125, 0.08112621307373047, 0.08478355407714844, 0.0884408950805664, 0.09209823608398438, 0.09575557708740234, 0.09941291809082031, 0.10307025909423828, 0.10672760009765625, 0.11038494110107422, 0.11404228210449219, 0.11769962310791016, 0.12135696411132812, 0.1250143051147461, 0.12867164611816406, 0.13232898712158203, 0.135986328125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 4.0, 5.0, 4.0, 10.0, 11.0, 15.0, 16.0, 28.0, 43.0, 77.0, 166.0, 286.0, 731.0, 1802.0, 5298.0, 23853.0, 446803.0, 533094.0, 27334.0, 5687.0, 1897.0, 727.0, 296.0, 148.0, 82.0, 40.0, 32.0, 18.0, 13.0, 2.0, 7.0, 5.0, 4.0, 2.0, 2.0, 3.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.08599853515625, -0.08367633819580078, -0.08135414123535156, -0.07903194427490234, -0.07670974731445312, -0.0743875503540039, -0.07206535339355469, -0.06974315643310547, -0.06742095947265625, -0.06509876251220703, -0.06277656555175781, -0.060454368591308594, -0.058132171630859375, -0.055809974670410156, -0.05348777770996094, -0.05116558074951172, -0.0488433837890625, -0.04652118682861328, -0.04419898986816406, -0.041876792907714844, -0.039554595947265625, -0.037232398986816406, -0.03491020202636719, -0.03258800506591797, -0.03026580810546875, -0.02794361114501953, -0.025621414184570312, -0.023299217224121094, -0.020977020263671875, -0.018654823303222656, -0.016332626342773438, -0.014010429382324219, -0.011688232421875, -0.009366035461425781, -0.0070438385009765625, -0.004721641540527344, -0.002399444580078125, -7.724761962890625e-05, 0.0022449493408203125, 0.004567146301269531, 0.00688934326171875, 0.009211540222167969, 0.011533737182617188, 0.013855934143066406, 0.016178131103515625, 0.018500328063964844, 0.020822525024414062, 0.02314472198486328, 0.0254669189453125, 0.02778911590576172, 0.030111312866210938, 0.032433509826660156, 0.034755706787109375, 0.037077903747558594, 0.03940010070800781, 0.04172229766845703, 0.04404449462890625, 0.04636669158935547, 0.04868888854980469, 0.051011085510253906, 0.053333282470703125, 0.055655479431152344, 0.05797767639160156, 0.06029987335205078, 0.0626220703125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 4.0, 10.0, 12.0, 10.0, 15.0, 11.0, 19.0, 20.0, 30.0, 26.0, 38.0, 36.0, 25.0, 52.0, 48.0, 46.0, 33.0, 40.0, 57.0, 45.0, 35.0, 46.0, 53.0, 39.0, 38.0, 35.0, 30.0, 27.0, 30.0, 18.0, 22.0, 8.0, 12.0, 3.0, 7.0, 6.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1611328125, -0.1559123992919922, -0.15069198608398438, -0.14547157287597656, -0.14025115966796875, -0.13503074645996094, -0.12981033325195312, -0.12458992004394531, -0.1193695068359375, -0.11414909362792969, -0.10892868041992188, -0.10370826721191406, -0.09848785400390625, -0.09326744079589844, -0.08804702758789062, -0.08282661437988281, -0.077606201171875, -0.07238578796386719, -0.06716537475585938, -0.06194496154785156, -0.05672454833984375, -0.05150413513183594, -0.046283721923828125, -0.04106330871582031, -0.0358428955078125, -0.030622482299804688, -0.025402069091796875, -0.020181655883789062, -0.01496124267578125, -0.009740829467773438, -0.004520416259765625, 0.0006999969482421875, 0.00592041015625, 0.011140823364257812, 0.016361236572265625, 0.021581649780273438, 0.02680206298828125, 0.03202247619628906, 0.037242889404296875, 0.04246330261230469, 0.0476837158203125, 0.05290412902832031, 0.058124542236328125, 0.06334495544433594, 0.06856536865234375, 0.07378578186035156, 0.07900619506835938, 0.08422660827636719, 0.089447021484375, 0.09466743469238281, 0.09988784790039062, 0.10510826110839844, 0.11032867431640625, 0.11554908752441406, 0.12076950073242188, 0.1259899139404297, 0.1312103271484375, 0.1364307403564453, 0.14165115356445312, 0.14687156677246094, 0.15209197998046875, 0.15731239318847656, 0.16253280639648438, 0.1677532196044922, 0.1729736328125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 3.0, 6.0, 8.0, 11.0, 10.0, 17.0, 18.0, 33.0, 42.0, 78.0, 123.0, 239.0, 357.0, 811.0, 1981.0, 5821.0, 22293.0, 145021.0, 697981.0, 142005.0, 22020.0, 5768.0, 2074.0, 846.0, 440.0, 218.0, 117.0, 56.0, 52.0, 32.0, 22.0, 12.0, 14.0, 5.0, 2.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0153045654296875, -0.014802694320678711, -0.014300823211669922, -0.013798952102661133, -0.013297080993652344, -0.012795209884643555, -0.012293338775634766, -0.011791467666625977, -0.011289596557617188, -0.010787725448608398, -0.01028585433959961, -0.00978398323059082, -0.009282112121582031, -0.008780241012573242, -0.008278369903564453, -0.007776498794555664, -0.007274627685546875, -0.006772756576538086, -0.006270885467529297, -0.005769014358520508, -0.005267143249511719, -0.00476527214050293, -0.004263401031494141, -0.0037615299224853516, -0.0032596588134765625, -0.0027577877044677734, -0.0022559165954589844, -0.0017540454864501953, -0.0012521743774414062, -0.0007503032684326172, -0.0002484321594238281, 0.00025343894958496094, 0.00075531005859375, 0.001257181167602539, 0.0017590522766113281, 0.002260923385620117, 0.0027627944946289062, 0.0032646656036376953, 0.0037665367126464844, 0.0042684078216552734, 0.0047702789306640625, 0.0052721500396728516, 0.005774021148681641, 0.00627589225769043, 0.006777763366699219, 0.007279634475708008, 0.007781505584716797, 0.008283376693725586, 0.008785247802734375, 0.009287118911743164, 0.009788990020751953, 0.010290861129760742, 0.010792732238769531, 0.01129460334777832, 0.01179647445678711, 0.012298345565795898, 0.012800216674804688, 0.013302087783813477, 0.013803958892822266, 0.014305830001831055, 0.014807701110839844, 0.015309572219848633, 0.015811443328857422, 0.01631331443786621, 0.016815185546875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 2.0, 2.0, 8.0, 8.0, 13.0, 19.0, 16.0, 24.0, 39.0, 47.0, 56.0, 47.0, 69.0, 74.0, 81.0, 98.0, 74.0, 65.0, 63.0, 38.0, 32.0, 28.0, 23.0, 17.0, 10.0, 11.0, 7.0, 4.0, 3.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0067901611328125e-06, -4.827044904232025e-06, -4.647299647331238e-06, -4.4675543904304504e-06, -4.287809133529663e-06, -4.108063876628876e-06, -3.928318619728088e-06, -3.748573362827301e-06, -3.5688281059265137e-06, -3.3890828490257263e-06, -3.209337592124939e-06, -3.0295923352241516e-06, -2.8498470783233643e-06, -2.670101821422577e-06, -2.4903565645217896e-06, -2.310611307621002e-06, -2.130866050720215e-06, -1.9511207938194275e-06, -1.7713755369186401e-06, -1.5916302800178528e-06, -1.4118850231170654e-06, -1.232139766216278e-06, -1.0523945093154907e-06, -8.726492524147034e-07, -6.92903995513916e-07, -5.131587386131287e-07, -3.334134817123413e-07, -1.5366822481155396e-07, 2.60770320892334e-08, 2.0582228899002075e-07, 3.855675458908081e-07, 5.653128027915955e-07, 7.450580596923828e-07, 9.248033165931702e-07, 1.1045485734939575e-06, 1.2842938303947449e-06, 1.4640390872955322e-06, 1.6437843441963196e-06, 1.823529601097107e-06, 2.0032748579978943e-06, 2.1830201148986816e-06, 2.362765371799469e-06, 2.5425106287002563e-06, 2.7222558856010437e-06, 2.902001142501831e-06, 3.0817463994026184e-06, 3.2614916563034058e-06, 3.441236913204193e-06, 3.6209821701049805e-06, 3.800727427005768e-06, 3.980472683906555e-06, 4.1602179408073425e-06, 4.33996319770813e-06, 4.519708454608917e-06, 4.699453711509705e-06, 4.879198968410492e-06, 5.058944225311279e-06, 5.238689482212067e-06, 5.418434739112854e-06, 5.598179996013641e-06, 5.777925252914429e-06, 5.957670509815216e-06, 6.137415766716003e-06, 6.317161023616791e-06, 6.496906280517578e-06]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 7.0, 4.0, 11.0, 15.0, 11.0, 25.0, 39.0, 39.0, 71.0, 128.0, 194.0, 319.0, 553.0, 996.0, 2093.0, 4895.0, 14299.0, 59439.0, 363697.0, 487548.0, 84442.0, 18577.0, 6012.0, 2388.0, 1153.0, 644.0, 384.0, 198.0, 125.0, 89.0, 52.0, 33.0, 28.0, 13.0, 14.0, 6.0, 6.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01465606689453125, -0.014213323593139648, -0.013770580291748047, -0.013327836990356445, -0.012885093688964844, -0.012442350387573242, -0.01199960708618164, -0.011556863784790039, -0.011114120483398438, -0.010671377182006836, -0.010228633880615234, -0.009785890579223633, -0.009343147277832031, -0.00890040397644043, -0.008457660675048828, -0.008014917373657227, -0.007572174072265625, -0.0071294307708740234, -0.006686687469482422, -0.00624394416809082, -0.005801200866699219, -0.005358457565307617, -0.004915714263916016, -0.004472970962524414, -0.0040302276611328125, -0.003587484359741211, -0.0031447410583496094, -0.002701997756958008, -0.0022592544555664062, -0.0018165111541748047, -0.0013737678527832031, -0.0009310245513916016, -0.00048828125, -4.553794860839844e-05, 0.0003972053527832031, 0.0008399486541748047, 0.0012826919555664062, 0.0017254352569580078, 0.0021681785583496094, 0.002610921859741211, 0.0030536651611328125, 0.003496408462524414, 0.003939151763916016, 0.004381895065307617, 0.004824638366699219, 0.00526738166809082, 0.005710124969482422, 0.0061528682708740234, 0.006595611572265625, 0.0070383548736572266, 0.007481098175048828, 0.00792384147644043, 0.008366584777832031, 0.008809328079223633, 0.009252071380615234, 0.009694814682006836, 0.010137557983398438, 0.010580301284790039, 0.01102304458618164, 0.011465787887573242, 0.011908531188964844, 0.012351274490356445, 0.012794017791748047, 0.013236761093139648, 0.01367950439453125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 7.0, 4.0, 8.0, 11.0, 19.0, 25.0, 29.0, 35.0, 46.0, 54.0, 74.0, 94.0, 101.0, 82.0, 72.0, 75.0, 55.0, 54.0, 44.0, 28.0, 16.0, 19.0, 14.0, 7.0, 6.0, 4.0, 5.0, 4.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00290679931640625, -0.0027904510498046875, -0.002674102783203125, -0.0025577545166015625, -0.00244140625, -0.0023250579833984375, -0.002208709716796875, -0.0020923614501953125, -0.00197601318359375, -0.0018596649169921875, -0.001743316650390625, -0.0016269683837890625, -0.0015106201171875, -0.0013942718505859375, -0.001277923583984375, -0.0011615753173828125, -0.00104522705078125, -0.0009288787841796875, -0.000812530517578125, -0.0006961822509765625, -0.000579833984375, -0.0004634857177734375, -0.000347137451171875, -0.0002307891845703125, -0.00011444091796875, 1.9073486328125e-06, 0.000118255615234375, 0.0002346038818359375, 0.0003509521484375, 0.0004673004150390625, 0.000583648681640625, 0.0006999969482421875, 0.00081634521484375, 0.0009326934814453125, 0.001049041748046875, 0.0011653900146484375, 0.00128173828125, 0.0013980865478515625, 0.001514434814453125, 0.0016307830810546875, 0.00174713134765625, 0.0018634796142578125, 0.001979827880859375, 0.0020961761474609375, 0.0022125244140625, 0.0023288726806640625, 0.002445220947265625, 0.0025615692138671875, 0.00267791748046875, 0.0027942657470703125, 0.002910614013671875, 0.0030269622802734375, 0.003143310546875, 0.0032596588134765625, 0.003376007080078125, 0.0034923553466796875, 0.00360870361328125, 0.0037250518798828125, 0.003841400146484375, 0.0039577484130859375, 0.0040740966796875, 0.0041904449462890625, 0.004306793212890625, 0.0044231414794921875, 0.00453948974609375]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 10.0, 13.0, 31.0, 88.0, 160.0, 228.0, 214.0, 129.0, 68.0, 24.0, 18.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31877464056015015, -0.3103354275226593, -0.30189621448516846, -0.29345703125, -0.28501781821250916, -0.2765786051750183, -0.26813939213752747, -0.2597001791000366, -0.25126099586486816, -0.24282178282737732, -0.23438258469104767, -0.22594337165355682, -0.21750417351722717, -0.20906496047973633, -0.20062574744224548, -0.19218653440475464, -0.1837473213672638, -0.17530810832977295, -0.1668689101934433, -0.15842969715595245, -0.1499904990196228, -0.14155128598213196, -0.1331120729446411, -0.12467286735773087, -0.11623366177082062, -0.10779445618391037, -0.09935525059700012, -0.09091603755950928, -0.08247683197259903, -0.07403762638568878, -0.06559841334819794, -0.05715920776128769, -0.04871998727321625, -0.040280781686306, -0.031841572374105453, -0.023402364924550056, -0.01496315747499466, -0.006523951888084412, 0.0019152574241161346, 0.010354466736316681, 0.01879367232322693, 0.027232879772782326, 0.03567208722233772, 0.04411129653453827, 0.05255050212144852, 0.060989707708358765, 0.06942892074584961, 0.07786812633275986, 0.0863073319196701, 0.09474653750658035, 0.1031857430934906, 0.11162495613098145, 0.1200641617178917, 0.12850336730480194, 0.13694258034229279, 0.14538177847862244, 0.15382099151611328, 0.16226020455360413, 0.17069940268993378, 0.17913861572742462, 0.18757781386375427, 0.19601702690124512, 0.20445623993873596, 0.2128954529762268, 0.22133465111255646]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 8.0, 3.0, 12.0, 11.0, 10.0, 24.0, 33.0, 33.0, 50.0, 40.0, 56.0, 61.0, 52.0, 60.0, 69.0, 56.0, 59.0, 52.0, 64.0, 61.0, 37.0, 38.0, 40.0, 12.0, 15.0, 13.0, 7.0, 10.0, 3.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08594147861003876, -0.08259603381156921, -0.07925058156251907, -0.07590513676404953, -0.07255969196557999, -0.06921423971652985, -0.0658687949180603, -0.06252335011959076, -0.059177905321121216, -0.055832456797361374, -0.05248701199889183, -0.04914156347513199, -0.045796118676662445, -0.0424506701529026, -0.03910522162914276, -0.03575977683067322, -0.032414328306913376, -0.029068881645798683, -0.02572343498468399, -0.02237798646092415, -0.019032541662454605, -0.015687093138694763, -0.01234164647758007, -0.008996199816465378, -0.005650753155350685, -0.0023053062614053488, 0.0010401406325399876, 0.0043855877593159676, 0.00773103442043066, 0.011076482012867928, 0.01442192867398262, 0.017767375335097313, 0.021112821996212006, 0.0244582686573267, 0.02780371531844139, 0.031149163842201233, 0.034494608640670776, 0.03784005716443062, 0.04118550568819046, 0.044530950486660004, 0.04787639528512955, 0.05122184380888939, 0.05456728860735893, 0.057912737131118774, 0.06125818192958832, 0.06460362672805786, 0.067949078977108, 0.07129452377557755, 0.07463997602462769, 0.07798542082309723, 0.08133087307214737, 0.08467631787061691, 0.08802176266908646, 0.0913672149181366, 0.09471265971660614, 0.09805810451507568, 0.10140354931354523, 0.10474899411201477, 0.10809444636106491, 0.11143989115953445, 0.114785335958004, 0.11813078820705414, 0.12147623300552368, 0.12482167780399323, 0.12816712260246277]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 4.0, 5.0, 10.0, 9.0, 12.0, 16.0, 17.0, 36.0, 47.0, 77.0, 132.0, 217.0, 279.0, 470.0, 882.0, 1543.0, 2943.0, 6018.0, 13143.0, 35739.0, 171263.0, 680459.0, 89537.0, 25209.0, 10287.0, 4636.0, 2391.0, 1259.0, 724.0, 455.0, 250.0, 161.0, 116.0, 67.0, 44.0, 29.0, 24.0, 14.0, 12.0, 8.0, 8.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09271240234375, -0.08932113647460938, -0.08592987060546875, -0.08253860473632812, -0.0791473388671875, -0.07575607299804688, -0.07236480712890625, -0.06897354125976562, -0.065582275390625, -0.062191009521484375, -0.05879974365234375, -0.055408477783203125, -0.0520172119140625, -0.048625946044921875, -0.04523468017578125, -0.041843414306640625, -0.0384521484375, -0.035060882568359375, -0.03166961669921875, -0.028278350830078125, -0.0248870849609375, -0.021495819091796875, -0.01810455322265625, -0.014713287353515625, -0.011322021484375, -0.007930755615234375, -0.00453948974609375, -0.001148223876953125, 0.0022430419921875, 0.005634307861328125, 0.00902557373046875, 0.012416839599609375, 0.01580810546875, 0.019199371337890625, 0.02259063720703125, 0.025981903076171875, 0.0293731689453125, 0.032764434814453125, 0.03615570068359375, 0.039546966552734375, 0.042938232421875, 0.046329498291015625, 0.04972076416015625, 0.053112030029296875, 0.0565032958984375, 0.059894561767578125, 0.06328582763671875, 0.06667709350585938, 0.070068359375, 0.07345962524414062, 0.07685089111328125, 0.08024215698242188, 0.0836334228515625, 0.08702468872070312, 0.09041595458984375, 0.09380722045898438, 0.097198486328125, 0.10058975219726562, 0.10398101806640625, 0.10737228393554688, 0.1107635498046875, 0.11415481567382812, 0.11754608154296875, 0.12093734741210938, 0.12432861328125]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 2.0, 5.0, 4.0, 7.0, 8.0, 8.0, 16.0, 18.0, 17.0, 31.0, 39.0, 39.0, 46.0, 59.0, 50.0, 65.0, 66.0, 45.0, 56.0, 57.0, 55.0, 61.0, 56.0, 37.0, 35.0, 33.0, 19.0, 23.0, 7.0, 8.0, 9.0, 5.0, 5.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1820068359375, -0.17581939697265625, -0.1696319580078125, -0.16344451904296875, -0.157257080078125, -0.15106964111328125, -0.1448822021484375, -0.13869476318359375, -0.13250732421875, -0.12631988525390625, -0.1201324462890625, -0.11394500732421875, -0.107757568359375, -0.10157012939453125, -0.0953826904296875, -0.08919525146484375, -0.0830078125, -0.07682037353515625, -0.0706329345703125, -0.06444549560546875, -0.058258056640625, -0.05207061767578125, -0.0458831787109375, -0.03969573974609375, -0.03350830078125, -0.02732086181640625, -0.0211334228515625, -0.01494598388671875, -0.008758544921875, -0.00257110595703125, 0.0036163330078125, 0.00980377197265625, 0.0159912109375, 0.02217864990234375, 0.0283660888671875, 0.03455352783203125, 0.040740966796875, 0.04692840576171875, 0.0531158447265625, 0.05930328369140625, 0.06549072265625, 0.07167816162109375, 0.0778656005859375, 0.08405303955078125, 0.090240478515625, 0.09642791748046875, 0.1026153564453125, 0.10880279541015625, 0.114990234375, 0.12117767333984375, 0.1273651123046875, 0.13355255126953125, 0.139739990234375, 0.14592742919921875, 0.1521148681640625, 0.15830230712890625, 0.16448974609375, 0.17067718505859375, 0.1768646240234375, 0.18305206298828125, 0.189239501953125, 0.19542694091796875, 0.2016143798828125, 0.20780181884765625, 0.2139892578125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0, 5.0, 8.0, 7.0, 14.0, 21.0, 12.0, 26.0, 20.0, 22.0, 36.0, 45.0, 60.0, 83.0, 120.0, 151.0, 178.0, 251.0, 390.0, 841.0, 3050.0, 16699.0, 630274.0, 377084.0, 14148.0, 2695.0, 823.0, 396.0, 251.0, 182.0, 152.0, 125.0, 64.0, 84.0, 48.0, 47.0, 46.0, 24.0, 22.0, 19.0, 10.0, 5.0, 5.0, 8.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2342529296875, -0.22643470764160156, -0.21861648559570312, -0.2107982635498047, -0.20298004150390625, -0.1951618194580078, -0.18734359741210938, -0.17952537536621094, -0.1717071533203125, -0.16388893127441406, -0.15607070922851562, -0.1482524871826172, -0.14043426513671875, -0.1326160430908203, -0.12479782104492188, -0.11697959899902344, -0.109161376953125, -0.10134315490722656, -0.09352493286132812, -0.08570671081542969, -0.07788848876953125, -0.07007026672363281, -0.062252044677734375, -0.05443382263183594, -0.0466156005859375, -0.03879737854003906, -0.030979156494140625, -0.023160934448242188, -0.01534271240234375, -0.0075244903564453125, 0.000293731689453125, 0.008111953735351562, 0.01593017578125, 0.023748397827148438, 0.031566619873046875, 0.03938484191894531, 0.04720306396484375, 0.05502128601074219, 0.06283950805664062, 0.07065773010253906, 0.0784759521484375, 0.08629417419433594, 0.09411239624023438, 0.10193061828613281, 0.10974884033203125, 0.11756706237792969, 0.12538528442382812, 0.13320350646972656, 0.141021728515625, 0.14883995056152344, 0.15665817260742188, 0.1644763946533203, 0.17229461669921875, 0.1801128387451172, 0.18793106079101562, 0.19574928283691406, 0.2035675048828125, 0.21138572692871094, 0.21920394897460938, 0.2270221710205078, 0.23484039306640625, 0.2426586151123047, 0.2504768371582031, 0.25829505920410156, 0.26611328125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 1.0, 5.0, 7.0, 4.0, 8.0, 5.0, 8.0, 13.0, 11.0, 23.0, 24.0, 21.0, 17.0, 26.0, 26.0, 40.0, 23.0, 46.0, 39.0, 34.0, 44.0, 48.0, 42.0, 41.0, 48.0, 46.0, 36.0, 31.0, 32.0, 29.0, 20.0, 20.0, 27.0, 22.0, 24.0, 29.0, 18.0, 13.0, 14.0, 5.0, 9.0, 4.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 4.0], "bins": [-0.1719970703125, -0.16673660278320312, -0.16147613525390625, -0.15621566772460938, -0.1509552001953125, -0.14569473266601562, -0.14043426513671875, -0.13517379760742188, -0.129913330078125, -0.12465286254882812, -0.11939239501953125, -0.11413192749023438, -0.1088714599609375, -0.10361099243164062, -0.09835052490234375, -0.09309005737304688, -0.08782958984375, -0.08256912231445312, -0.07730865478515625, -0.07204818725585938, -0.0667877197265625, -0.061527252197265625, -0.05626678466796875, -0.051006317138671875, -0.045745849609375, -0.040485382080078125, -0.03522491455078125, -0.029964447021484375, -0.0247039794921875, -0.019443511962890625, -0.01418304443359375, -0.008922576904296875, -0.003662109375, 0.001598358154296875, 0.00685882568359375, 0.012119293212890625, 0.0173797607421875, 0.022640228271484375, 0.02790069580078125, 0.033161163330078125, 0.038421630859375, 0.043682098388671875, 0.04894256591796875, 0.054203033447265625, 0.0594635009765625, 0.06472396850585938, 0.06998443603515625, 0.07524490356445312, 0.08050537109375, 0.08576583862304688, 0.09102630615234375, 0.09628677368164062, 0.1015472412109375, 0.10680770874023438, 0.11206817626953125, 0.11732864379882812, 0.122589111328125, 0.12784957885742188, 0.13311004638671875, 0.13837051391601562, 0.1436309814453125, 0.14889144897460938, 0.15415191650390625, 0.15941238403320312, 0.1646728515625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 2.0, 5.0, 7.0, 6.0, 16.0, 7.0, 21.0, 42.0, 37.0, 73.0, 88.0, 204.0, 372.0, 767.0, 1611.0, 4209.0, 15312.0, 326154.0, 673493.0, 17945.0, 4544.0, 1794.0, 832.0, 406.0, 206.0, 139.0, 78.0, 60.0, 27.0, 36.0, 13.0, 10.0, 12.0, 8.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.0970458984375, -0.09435367584228516, -0.09166145324707031, -0.08896923065185547, -0.08627700805664062, -0.08358478546142578, -0.08089256286621094, -0.0782003402709961, -0.07550811767578125, -0.0728158950805664, -0.07012367248535156, -0.06743144989013672, -0.06473922729492188, -0.06204700469970703, -0.05935478210449219, -0.056662559509277344, -0.0539703369140625, -0.051278114318847656, -0.04858589172363281, -0.04589366912841797, -0.043201446533203125, -0.04050922393798828, -0.03781700134277344, -0.035124778747558594, -0.03243255615234375, -0.029740333557128906, -0.027048110961914062, -0.02435588836669922, -0.021663665771484375, -0.01897144317626953, -0.016279220581054688, -0.013586997985839844, -0.010894775390625, -0.008202552795410156, -0.0055103302001953125, -0.0028181076049804688, -0.000125885009765625, 0.0025663375854492188, 0.0052585601806640625, 0.007950782775878906, 0.01064300537109375, 0.013335227966308594, 0.016027450561523438, 0.01871967315673828, 0.021411895751953125, 0.02410411834716797, 0.026796340942382812, 0.029488563537597656, 0.0321807861328125, 0.034873008728027344, 0.03756523132324219, 0.04025745391845703, 0.042949676513671875, 0.04564189910888672, 0.04833412170410156, 0.051026344299316406, 0.05371856689453125, 0.056410789489746094, 0.05910301208496094, 0.06179523468017578, 0.06448745727539062, 0.06717967987060547, 0.06987190246582031, 0.07256412506103516, 0.07525634765625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 2.0, 9.0, 5.0, 7.0, 13.0, 23.0, 27.0, 61.0, 121.0, 337.0, 191.0, 79.0, 40.0, 22.0, 18.0, 13.0, 13.0, 4.0, 10.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3589859008789062e-05, -1.3173557817935944e-05, -1.2757256627082825e-05, -1.2340955436229706e-05, -1.1924654245376587e-05, -1.1508353054523468e-05, -1.1092051863670349e-05, -1.067575067281723e-05, -1.0259449481964111e-05, -9.843148291110992e-06, -9.426847100257874e-06, -9.010545909404755e-06, -8.594244718551636e-06, -8.177943527698517e-06, -7.761642336845398e-06, -7.345341145992279e-06, -6.92903995513916e-06, -6.512738764286041e-06, -6.096437573432922e-06, -5.6801363825798035e-06, -5.2638351917266846e-06, -4.847534000873566e-06, -4.431232810020447e-06, -4.014931619167328e-06, -3.598630428314209e-06, -3.18232923746109e-06, -2.766028046607971e-06, -2.3497268557548523e-06, -1.9334256649017334e-06, -1.5171244740486145e-06, -1.1008232831954956e-06, -6.845220923423767e-07, -2.682209014892578e-07, 1.4808028936386108e-07, 5.6438148021698e-07, 9.806826710700989e-07, 1.3969838619232178e-06, 1.8132850527763367e-06, 2.2295862436294556e-06, 2.6458874344825745e-06, 3.0621886253356934e-06, 3.4784898161888123e-06, 3.894791007041931e-06, 4.31109219789505e-06, 4.727393388748169e-06, 5.143694579601288e-06, 5.559995770454407e-06, 5.976296961307526e-06, 6.3925981521606445e-06, 6.8088993430137634e-06, 7.225200533866882e-06, 7.641501724720001e-06, 8.05780291557312e-06, 8.474104106426239e-06, 8.890405297279358e-06, 9.306706488132477e-06, 9.723007678985596e-06, 1.0139308869838715e-05, 1.0555610060691833e-05, 1.0971911251544952e-05, 1.1388212442398071e-05, 1.180451363325119e-05, 1.2220814824104309e-05, 1.2637116014957428e-05, 1.3053417205810547e-05]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 4.0, 2.0, 2.0, 3.0, 4.0, 8.0, 11.0, 24.0, 39.0, 68.0, 160.0, 347.0, 886.0, 2831.0, 14047.0, 906676.0, 113912.0, 6730.0, 1701.0, 583.0, 245.0, 101.0, 64.0, 35.0, 24.0, 13.0, 3.0, 6.0, 5.0, 8.0, 7.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.16552734375, -0.1611490249633789, -0.1567707061767578, -0.15239238739013672, -0.14801406860351562, -0.14363574981689453, -0.13925743103027344, -0.13487911224365234, -0.13050079345703125, -0.12612247467041016, -0.12174415588378906, -0.11736583709716797, -0.11298751831054688, -0.10860919952392578, -0.10423088073730469, -0.0998525619506836, -0.0954742431640625, -0.0910959243774414, -0.08671760559082031, -0.08233928680419922, -0.07796096801757812, -0.07358264923095703, -0.06920433044433594, -0.06482601165771484, -0.06044769287109375, -0.056069374084472656, -0.05169105529785156, -0.04731273651123047, -0.042934417724609375, -0.03855609893798828, -0.03417778015136719, -0.029799461364746094, -0.025421142578125, -0.021042823791503906, -0.016664505004882812, -0.012286186218261719, -0.007907867431640625, -0.0035295486450195312, 0.0008487701416015625, 0.005227088928222656, 0.00960540771484375, 0.013983726501464844, 0.018362045288085938, 0.02274036407470703, 0.027118682861328125, 0.03149700164794922, 0.03587532043457031, 0.040253639221191406, 0.0446319580078125, 0.049010276794433594, 0.05338859558105469, 0.05776691436767578, 0.062145233154296875, 0.06652355194091797, 0.07090187072753906, 0.07528018951416016, 0.07965850830078125, 0.08403682708740234, 0.08841514587402344, 0.09279346466064453, 0.09717178344726562, 0.10155010223388672, 0.10592842102050781, 0.1103067398071289, 0.11468505859375]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 1.0, 3.0, 1.0, 5.0, 5.0, 6.0, 12.0, 16.0, 37.0, 65.0, 110.0, 271.0, 211.0, 105.0, 51.0, 47.0, 21.0, 12.0, 4.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03369140625, -0.03239250183105469, -0.031093597412109375, -0.029794692993164062, -0.02849578857421875, -0.027196884155273438, -0.025897979736328125, -0.024599075317382812, -0.0233001708984375, -0.022001266479492188, -0.020702362060546875, -0.019403457641601562, -0.01810455322265625, -0.016805648803710938, -0.015506744384765625, -0.014207839965820312, -0.012908935546875, -0.011610031127929688, -0.010311126708984375, -0.009012222290039062, -0.00771331787109375, -0.0064144134521484375, -0.005115509033203125, -0.0038166046142578125, -0.0025177001953125, -0.0012187957763671875, 8.0108642578125e-05, 0.0013790130615234375, 0.00267791748046875, 0.0039768218994140625, 0.005275726318359375, 0.0065746307373046875, 0.00787353515625, 0.009172439575195312, 0.010471343994140625, 0.011770248413085938, 0.01306915283203125, 0.014368057250976562, 0.015666961669921875, 0.016965866088867188, 0.0182647705078125, 0.019563674926757812, 0.020862579345703125, 0.022161483764648438, 0.02346038818359375, 0.024759292602539062, 0.026058197021484375, 0.027357101440429688, 0.028656005859375, 0.029954910278320312, 0.031253814697265625, 0.03255271911621094, 0.03385162353515625, 0.03515052795410156, 0.036449432373046875, 0.03774833679199219, 0.0390472412109375, 0.04034614562988281, 0.041645050048828125, 0.04294395446777344, 0.04424285888671875, 0.04554176330566406, 0.046840667724609375, 0.04813957214355469, 0.0494384765625]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 13.0, 23.0, 36.0, 80.0, 167.0, 201.0, 194.0, 104.0, 81.0, 54.0, 25.0, 11.0, 9.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.618438184261322, -0.6024943590164185, -0.5865505337715149, -0.5706067085266113, -0.5546629428863525, -0.538719117641449, -0.5227752923965454, -0.5068314671516418, -0.4908876419067383, -0.4749438166618347, -0.45900002121925354, -0.44305619597435, -0.4271123707294464, -0.41116857528686523, -0.39522475004196167, -0.3792809247970581, -0.36333712935447693, -0.34739330410957336, -0.3314495086669922, -0.3155056834220886, -0.29956185817718506, -0.2836180329322815, -0.2676742374897003, -0.25173041224479675, -0.23578660190105438, -0.219842791557312, -0.20389896631240845, -0.18795515596866608, -0.1720113456249237, -0.15606752038002014, -0.14012371003627777, -0.1241798922419548, -0.10823610424995422, -0.09229228645563126, -0.07634846866130829, -0.06040465831756592, -0.04446084052324295, -0.028517022728919983, -0.012573212385177612, 0.0033706054091453552, 0.019314423203468323, 0.03525824099779129, 0.05120205506682396, 0.06714586913585663, 0.0830896869301796, 0.09903350472450256, 0.11497731506824493, 0.1309211254119873, 0.14686495065689087, 0.16280876100063324, 0.1787525862455368, 0.19469639658927917, 0.21064022183418274, 0.2265840321779251, 0.24252784252166748, 0.25847166776657104, 0.2744154930114746, 0.2903593182563782, 0.30630311369895935, 0.3222469389438629, 0.3381907641887665, 0.35413455963134766, 0.3700783848762512, 0.3860222101211548, 0.40196600556373596]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 8.0, 13.0, 8.0, 8.0, 17.0, 15.0, 20.0, 13.0, 23.0, 28.0, 29.0, 29.0, 27.0, 35.0, 37.0, 39.0, 41.0, 43.0, 38.0, 43.0, 37.0, 36.0, 36.0, 49.0, 34.0, 29.0, 41.0, 30.0, 27.0, 25.0, 24.0, 20.0, 20.0, 15.0, 19.0, 7.0, 9.0, 8.0, 4.0, 3.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.3023441433906555, -0.2936819791793823, -0.28501978516578674, -0.27635762095451355, -0.26769545674324036, -0.25903329253196716, -0.2503710985183716, -0.2417089343070984, -0.2330467700958252, -0.2243845909833908, -0.21572242677211761, -0.20706024765968323, -0.19839808344841003, -0.18973590433597565, -0.18107372522354126, -0.17241156101226807, -0.16374938189983368, -0.1550872027873993, -0.1464250385761261, -0.1377628594636917, -0.12910069525241852, -0.12043851613998413, -0.11177634447813034, -0.10311417281627655, -0.09445200115442276, -0.08578982949256897, -0.07712765783071518, -0.06846548616886139, -0.0598033107817173, -0.05114113911986351, -0.04247896373271942, -0.03381679207086563, -0.02515462040901184, -0.01649244874715805, -0.007830275222659111, 0.0008318983018398285, 0.009494069963693619, 0.01815624162554741, 0.026818417012691498, 0.03548058867454529, 0.04414276033639908, 0.05280493199825287, 0.06146710366010666, 0.07012927532196045, 0.07879145443439484, 0.08745361864566803, 0.09611579775810242, 0.10477796941995621, 0.11344014108181, 0.12210231274366379, 0.13076448440551758, 0.13942666351795197, 0.14808882772922516, 0.15675100684165955, 0.16541317105293274, 0.17407535016536713, 0.1827375292778015, 0.1913997083902359, 0.2000618726015091, 0.20872405171394348, 0.21738621592521667, 0.22604839503765106, 0.23471057415008545, 0.24337273836135864, 0.25203490257263184]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 5.0, 3.0, 8.0, 13.0, 10.0, 8.0, 12.0, 25.0, 19.0, 17.0, 21.0, 27.0, 19.0, 34.0, 48.0, 52.0, 109.0, 206.0, 581.0, 1953.0, 13075.0, 3081344.0, 1085318.0, 8746.0, 1530.0, 493.0, 205.0, 92.0, 62.0, 37.0, 27.0, 25.0, 26.0, 20.0, 21.0, 19.0, 13.0, 10.0, 11.0, 7.0, 5.0, 8.0, 6.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0], "bins": [-0.51806640625, -0.5007553100585938, -0.4834442138671875, -0.46613311767578125, -0.448822021484375, -0.43151092529296875, -0.4141998291015625, -0.39688873291015625, -0.37957763671875, -0.36226654052734375, -0.3449554443359375, -0.32764434814453125, -0.310333251953125, -0.29302215576171875, -0.2757110595703125, -0.25839996337890625, -0.2410888671875, -0.22377777099609375, -0.2064666748046875, -0.18915557861328125, -0.171844482421875, -0.15453338623046875, -0.1372222900390625, -0.11991119384765625, -0.10260009765625, -0.08528900146484375, -0.0679779052734375, -0.05066680908203125, -0.033355712890625, -0.01604461669921875, 0.0012664794921875, 0.01857757568359375, 0.035888671875, 0.05319976806640625, 0.0705108642578125, 0.08782196044921875, 0.105133056640625, 0.12244415283203125, 0.1397552490234375, 0.15706634521484375, 0.17437744140625, 0.19168853759765625, 0.2089996337890625, 0.22631072998046875, 0.243621826171875, 0.26093292236328125, 0.2782440185546875, 0.29555511474609375, 0.3128662109375, 0.33017730712890625, 0.3474884033203125, 0.36479949951171875, 0.382110595703125, 0.39942169189453125, 0.4167327880859375, 0.43404388427734375, 0.45135498046875, 0.46866607666015625, 0.4859771728515625, 0.5032882690429688, 0.520599365234375, 0.5379104614257812, 0.5552215576171875, 0.5725326538085938, 0.58984375]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 6.0, 4.0, 5.0, 10.0, 15.0, 13.0, 19.0, 24.0, 33.0, 39.0, 55.0, 48.0, 45.0, 59.0, 70.0, 61.0, 74.0, 64.0, 63.0, 60.0, 56.0, 36.0, 27.0, 32.0, 29.0, 12.0, 13.0, 9.0, 2.0, 9.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12481689453125, -0.12087154388427734, -0.11692619323730469, -0.11298084259033203, -0.10903549194335938, -0.10509014129638672, -0.10114479064941406, -0.0971994400024414, -0.09325408935546875, -0.0893087387084961, -0.08536338806152344, -0.08141803741455078, -0.07747268676757812, -0.07352733612060547, -0.06958198547363281, -0.06563663482666016, -0.0616912841796875, -0.057745933532714844, -0.05380058288574219, -0.04985523223876953, -0.045909881591796875, -0.04196453094482422, -0.03801918029785156, -0.034073829650878906, -0.03012847900390625, -0.026183128356933594, -0.022237777709960938, -0.01829242706298828, -0.014347076416015625, -0.010401725769042969, -0.0064563751220703125, -0.0025110244750976562, 0.001434326171875, 0.005379676818847656, 0.009325027465820312, 0.013270378112792969, 0.017215728759765625, 0.02116107940673828, 0.025106430053710938, 0.029051780700683594, 0.03299713134765625, 0.036942481994628906, 0.04088783264160156, 0.04483318328857422, 0.048778533935546875, 0.05272388458251953, 0.05666923522949219, 0.060614585876464844, 0.0645599365234375, 0.06850528717041016, 0.07245063781738281, 0.07639598846435547, 0.08034133911132812, 0.08428668975830078, 0.08823204040527344, 0.0921773910522461, 0.09612274169921875, 0.1000680923461914, 0.10401344299316406, 0.10795879364013672, 0.11190414428710938, 0.11584949493408203, 0.11979484558105469, 0.12374019622802734, 0.127685546875]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 10.0, 13.0, 11.0, 28.0, 42.0, 42.0, 125.0, 226.0, 687.0, 2270.0, 14543.0, 388518.0, 3733725.0, 47413.0, 4769.0, 1091.0, 394.0, 152.0, 58.0, 53.0, 32.0, 22.0, 16.0, 7.0, 8.0, 7.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.234130859375, -0.22359466552734375, -0.2130584716796875, -0.20252227783203125, -0.191986083984375, -0.18144989013671875, -0.1709136962890625, -0.16037750244140625, -0.14984130859375, -0.13930511474609375, -0.1287689208984375, -0.11823272705078125, -0.107696533203125, -0.09716033935546875, -0.0866241455078125, -0.07608795166015625, -0.0655517578125, -0.05501556396484375, -0.0444793701171875, -0.03394317626953125, -0.023406982421875, -0.01287078857421875, -0.0023345947265625, 0.00820159912109375, 0.01873779296875, 0.02927398681640625, 0.0398101806640625, 0.05034637451171875, 0.060882568359375, 0.07141876220703125, 0.0819549560546875, 0.09249114990234375, 0.10302734375, 0.11356353759765625, 0.1240997314453125, 0.13463592529296875, 0.145172119140625, 0.15570831298828125, 0.1662445068359375, 0.17678070068359375, 0.18731689453125, 0.19785308837890625, 0.2083892822265625, 0.21892547607421875, 0.229461669921875, 0.23999786376953125, 0.2505340576171875, 0.26107025146484375, 0.2716064453125, 0.28214263916015625, 0.2926788330078125, 0.30321502685546875, 0.313751220703125, 0.32428741455078125, 0.3348236083984375, 0.34535980224609375, 0.35589599609375, 0.36643218994140625, 0.3769683837890625, 0.38750457763671875, 0.398040771484375, 0.40857696533203125, 0.4191131591796875, 0.42964935302734375, 0.440185546875]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 5.0, 2.0, 3.0, 15.0, 13.0, 24.0, 20.0, 33.0, 39.0, 52.0, 64.0, 114.0, 149.0, 251.0, 470.0, 668.0, 771.0, 521.0, 309.0, 189.0, 102.0, 77.0, 39.0, 41.0, 34.0, 24.0, 11.0, 14.0, 9.0, 4.0, 5.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.057708740234375, -0.05623483657836914, -0.05476093292236328, -0.05328702926635742, -0.05181312561035156, -0.0503392219543457, -0.048865318298339844, -0.047391414642333984, -0.045917510986328125, -0.044443607330322266, -0.042969703674316406, -0.04149580001831055, -0.04002189636230469, -0.03854799270629883, -0.03707408905029297, -0.03560018539428711, -0.03412628173828125, -0.03265237808227539, -0.03117847442626953, -0.029704570770263672, -0.028230667114257812, -0.026756763458251953, -0.025282859802246094, -0.023808956146240234, -0.022335052490234375, -0.020861148834228516, -0.019387245178222656, -0.017913341522216797, -0.016439437866210938, -0.014965534210205078, -0.013491630554199219, -0.01201772689819336, -0.0105438232421875, -0.00906991958618164, -0.007596015930175781, -0.006122112274169922, -0.0046482086181640625, -0.003174304962158203, -0.0017004013061523438, -0.00022649765014648438, 0.001247406005859375, 0.0027213096618652344, 0.004195213317871094, 0.005669116973876953, 0.0071430206298828125, 0.008616924285888672, 0.010090827941894531, 0.01156473159790039, 0.01303863525390625, 0.01451253890991211, 0.01598644256591797, 0.017460346221923828, 0.018934249877929688, 0.020408153533935547, 0.021882057189941406, 0.023355960845947266, 0.024829864501953125, 0.026303768157958984, 0.027777671813964844, 0.029251575469970703, 0.030725479125976562, 0.03219938278198242, 0.03367328643798828, 0.03514719009399414, 0.03662109375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 3.0, 5.0, 14.0, 14.0, 31.0, 44.0, 77.0, 104.0, 131.0, 160.0, 139.0, 94.0, 70.0, 45.0, 31.0, 20.0, 13.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25304198265075684, -0.2447388917207718, -0.23643580079078674, -0.2281327098608017, -0.21982961893081665, -0.2115265280008316, -0.20322343707084656, -0.19492033123970032, -0.18661725521087646, -0.17831416428089142, -0.17001107335090637, -0.16170798242092133, -0.15340489149093628, -0.14510180056095123, -0.1367987096309662, -0.12849560379981995, -0.1201925128698349, -0.11188942193984985, -0.10358633100986481, -0.09528324007987976, -0.08698014914989471, -0.07867705821990967, -0.07037395983934402, -0.06207086890935898, -0.05376777797937393, -0.045464687049388885, -0.03716159611940384, -0.028858501464128494, -0.020555410534143448, -0.012252319604158401, -0.003949224948883057, 0.00435386598110199, 0.012656956911087036, 0.020960047841072083, 0.029263140633702278, 0.037566233426332474, 0.04586932435631752, 0.054172415286302567, 0.06247550994157791, 0.07077860087156296, 0.079081691801548, 0.08738478273153305, 0.0956878736615181, 0.10399097204208374, 0.11229406297206879, 0.12059715390205383, 0.12890024483203888, 0.13720333576202393, 0.14550642669200897, 0.15380951762199402, 0.16211260855197906, 0.1704156994819641, 0.17871879041194916, 0.1870218813419342, 0.19532498717308044, 0.2036280632019043, 0.21193116903305054, 0.22023425996303558, 0.22853735089302063, 0.23684044182300568, 0.24514353275299072, 0.25344663858413696, 0.2617497146129608, 0.27005282044410706, 0.2783558964729309]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 5.0, 6.0, 7.0, 3.0, 7.0, 13.0, 14.0, 15.0, 21.0, 18.0, 28.0, 33.0, 36.0, 39.0, 49.0, 34.0, 48.0, 42.0, 42.0, 47.0, 56.0, 64.0, 45.0, 44.0, 33.0, 33.0, 43.0, 34.0, 22.0, 23.0, 18.0, 21.0, 24.0, 11.0, 13.0, 4.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09925607591867447, -0.0955699160695076, -0.09188375622034073, -0.08819759637117386, -0.08451143652200699, -0.08082527667284012, -0.07713910937309265, -0.07345294952392578, -0.06976678967475891, -0.06608062982559204, -0.06239446997642517, -0.0587083101272583, -0.05502215027809143, -0.05133599042892456, -0.04764982685446739, -0.04396366700530052, -0.04027751088142395, -0.03659135103225708, -0.03290519118309021, -0.02921902947127819, -0.02553286962211132, -0.02184670977294445, -0.01816054806113243, -0.014474388211965561, -0.01078822836279869, -0.007102068047970533, -0.003415907733142376, 0.0002702530473470688, 0.003956412896513939, 0.007642572745680809, 0.011328734457492828, 0.015014894306659698, 0.018701061606407166, 0.022387221455574036, 0.026073381304740906, 0.029759543016552925, 0.033445701003074646, 0.037131860852241516, 0.040818024426698685, 0.044504184275865555, 0.048190344125032425, 0.051876503974199295, 0.055562663823366165, 0.059248827397823334, 0.0629349872469902, 0.06662114709615707, 0.07030730694532394, 0.07399346679449081, 0.07767962664365768, 0.08136578649282455, 0.08505194634199142, 0.0887381061911583, 0.09242426604032516, 0.09611042588949203, 0.0997965931892395, 0.10348275303840637, 0.10716891288757324, 0.11085507273674011, 0.11454123258590698, 0.11822739243507385, 0.12191355228424072, 0.1255997121334076, 0.12928587198257446, 0.13297203183174133, 0.1366581916809082]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 6.0, 6.0, 9.0, 16.0, 25.0, 27.0, 59.0, 126.0, 233.0, 480.0, 1068.0, 2525.0, 6339.0, 18429.0, 129495.0, 777317.0, 87528.0, 15397.0, 5444.0, 2139.0, 954.0, 451.0, 201.0, 125.0, 61.0, 36.0, 23.0, 9.0, 12.0, 5.0, 7.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1121826171875, -0.10918521881103516, -0.10618782043457031, -0.10319042205810547, -0.10019302368164062, -0.09719562530517578, -0.09419822692871094, -0.0912008285522461, -0.08820343017578125, -0.0852060317993164, -0.08220863342285156, -0.07921123504638672, -0.07621383666992188, -0.07321643829345703, -0.07021903991699219, -0.06722164154052734, -0.0642242431640625, -0.061226844787597656, -0.05822944641113281, -0.05523204803466797, -0.052234649658203125, -0.04923725128173828, -0.04623985290527344, -0.043242454528808594, -0.04024505615234375, -0.037247657775878906, -0.03425025939941406, -0.03125286102294922, -0.028255462646484375, -0.02525806427001953, -0.022260665893554688, -0.019263267517089844, -0.016265869140625, -0.013268470764160156, -0.010271072387695312, -0.007273674011230469, -0.004276275634765625, -0.0012788772583007812, 0.0017185211181640625, 0.004715919494628906, 0.00771331787109375, 0.010710716247558594, 0.013708114624023438, 0.01670551300048828, 0.019702911376953125, 0.02270030975341797, 0.025697708129882812, 0.028695106506347656, 0.0316925048828125, 0.034689903259277344, 0.03768730163574219, 0.04068470001220703, 0.043682098388671875, 0.04667949676513672, 0.04967689514160156, 0.052674293518066406, 0.05567169189453125, 0.058669090270996094, 0.06166648864746094, 0.06466388702392578, 0.06766128540039062, 0.07065868377685547, 0.07365608215332031, 0.07665348052978516, 0.07965087890625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 4.0, 6.0, 10.0, 10.0, 14.0, 15.0, 14.0, 27.0, 24.0, 39.0, 29.0, 50.0, 41.0, 55.0, 51.0, 65.0, 45.0, 51.0, 59.0, 58.0, 40.0, 39.0, 47.0, 34.0, 34.0, 25.0, 32.0, 24.0, 16.0, 14.0, 6.0, 8.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.076904296875, -0.0740365982055664, -0.07116889953613281, -0.06830120086669922, -0.06543350219726562, -0.06256580352783203, -0.05969810485839844, -0.056830406188964844, -0.05396270751953125, -0.051095008850097656, -0.04822731018066406, -0.04535961151123047, -0.042491912841796875, -0.03962421417236328, -0.03675651550292969, -0.033888816833496094, -0.0310211181640625, -0.028153419494628906, -0.025285720825195312, -0.02241802215576172, -0.019550323486328125, -0.01668262481689453, -0.013814926147460938, -0.010947227478027344, -0.00807952880859375, -0.005211830139160156, -0.0023441314697265625, 0.0005235671997070312, 0.003391265869140625, 0.006258964538574219, 0.009126663208007812, 0.011994361877441406, 0.014862060546875, 0.017729759216308594, 0.020597457885742188, 0.02346515655517578, 0.026332855224609375, 0.02920055389404297, 0.03206825256347656, 0.034935951232910156, 0.03780364990234375, 0.040671348571777344, 0.04353904724121094, 0.04640674591064453, 0.049274444580078125, 0.05214214324951172, 0.05500984191894531, 0.057877540588378906, 0.0607452392578125, 0.0636129379272461, 0.06648063659667969, 0.06934833526611328, 0.07221603393554688, 0.07508373260498047, 0.07795143127441406, 0.08081912994384766, 0.08368682861328125, 0.08655452728271484, 0.08942222595214844, 0.09228992462158203, 0.09515762329101562, 0.09802532196044922, 0.10089302062988281, 0.1037607192993164, 0.10662841796875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 7.0, 6.0, 14.0, 22.0, 20.0, 50.0, 79.0, 153.0, 399.0, 1108.0, 4094.0, 23271.0, 521538.0, 470569.0, 21615.0, 3855.0, 1023.0, 387.0, 141.0, 72.0, 40.0, 23.0, 14.0, 14.0, 11.0, 13.0, 8.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11566162109375, -0.11261653900146484, -0.10957145690917969, -0.10652637481689453, -0.10348129272460938, -0.10043621063232422, -0.09739112854003906, -0.0943460464477539, -0.09130096435546875, -0.0882558822631836, -0.08521080017089844, -0.08216571807861328, -0.07912063598632812, -0.07607555389404297, -0.07303047180175781, -0.06998538970947266, -0.0669403076171875, -0.06389522552490234, -0.06085014343261719, -0.05780506134033203, -0.054759979248046875, -0.05171489715576172, -0.04866981506347656, -0.045624732971191406, -0.04257965087890625, -0.039534568786621094, -0.03648948669433594, -0.03344440460205078, -0.030399322509765625, -0.02735424041748047, -0.024309158325195312, -0.021264076232910156, -0.018218994140625, -0.015173912048339844, -0.012128829956054688, -0.009083747863769531, -0.006038665771484375, -0.0029935836791992188, 5.14984130859375e-05, 0.0030965805053710938, 0.00614166259765625, 0.009186744689941406, 0.012231826782226562, 0.015276908874511719, 0.018321990966796875, 0.02136707305908203, 0.024412155151367188, 0.027457237243652344, 0.0305023193359375, 0.033547401428222656, 0.03659248352050781, 0.03963756561279297, 0.042682647705078125, 0.04572772979736328, 0.04877281188964844, 0.051817893981933594, 0.05486297607421875, 0.057908058166503906, 0.06095314025878906, 0.06399822235107422, 0.06704330444335938, 0.07008838653564453, 0.07313346862792969, 0.07617855072021484, 0.0792236328125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 4.0, 7.0, 12.0, 5.0, 7.0, 10.0, 8.0, 14.0, 10.0, 18.0, 20.0, 33.0, 32.0, 28.0, 32.0, 42.0, 45.0, 29.0, 44.0, 49.0, 30.0, 52.0, 44.0, 39.0, 51.0, 41.0, 35.0, 39.0, 16.0, 35.0, 29.0, 23.0, 13.0, 22.0, 13.0, 14.0, 14.0, 12.0, 8.0, 9.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.1610107421875, -0.15622520446777344, -0.15143966674804688, -0.1466541290283203, -0.14186859130859375, -0.1370830535888672, -0.13229751586914062, -0.12751197814941406, -0.1227264404296875, -0.11794090270996094, -0.11315536499023438, -0.10836982727050781, -0.10358428955078125, -0.09879875183105469, -0.09401321411132812, -0.08922767639160156, -0.084442138671875, -0.07965660095214844, -0.07487106323242188, -0.07008552551269531, -0.06529998779296875, -0.06051445007324219, -0.055728912353515625, -0.05094337463378906, -0.0461578369140625, -0.04137229919433594, -0.036586761474609375, -0.03180122375488281, -0.02701568603515625, -0.022230148315429688, -0.017444610595703125, -0.012659072875976562, -0.00787353515625, -0.0030879974365234375, 0.001697540283203125, 0.0064830780029296875, 0.01126861572265625, 0.016054153442382812, 0.020839691162109375, 0.025625228881835938, 0.0304107666015625, 0.03519630432128906, 0.039981842041015625, 0.04476737976074219, 0.04955291748046875, 0.05433845520019531, 0.059123992919921875, 0.06390953063964844, 0.068695068359375, 0.07348060607910156, 0.07826614379882812, 0.08305168151855469, 0.08783721923828125, 0.09262275695800781, 0.09740829467773438, 0.10219383239746094, 0.1069793701171875, 0.11176490783691406, 0.11655044555664062, 0.12133598327636719, 0.12612152099609375, 0.1309070587158203, 0.13569259643554688, 0.14047813415527344, 0.145263671875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 7.0, 6.0, 5.0, 13.0, 17.0, 26.0, 49.0, 61.0, 107.0, 181.0, 413.0, 992.0, 2753.0, 10055.0, 57676.0, 494707.0, 421199.0, 47246.0, 8741.0, 2480.0, 926.0, 401.0, 193.0, 104.0, 66.0, 39.0, 22.0, 18.0, 14.0, 7.0, 10.0, 4.0, 3.0, 3.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015625, -0.015103340148925781, -0.014581680297851562, -0.014060020446777344, -0.013538360595703125, -0.013016700744628906, -0.012495040893554688, -0.011973381042480469, -0.01145172119140625, -0.010930061340332031, -0.010408401489257812, -0.009886741638183594, -0.009365081787109375, -0.008843421936035156, -0.008321762084960938, -0.007800102233886719, -0.0072784423828125, -0.006756782531738281, -0.0062351226806640625, -0.005713462829589844, -0.005191802978515625, -0.004670143127441406, -0.0041484832763671875, -0.0036268234252929688, -0.00310516357421875, -0.0025835037231445312, -0.0020618438720703125, -0.0015401840209960938, -0.001018524169921875, -0.0004968643188476562, 2.47955322265625e-05, 0.0005464553833007812, 0.001068115234375, 0.0015897750854492188, 0.0021114349365234375, 0.0026330947875976562, 0.003154754638671875, 0.0036764144897460938, 0.0041980743408203125, 0.004719734191894531, 0.00524139404296875, 0.005763053894042969, 0.0062847137451171875, 0.006806373596191406, 0.007328033447265625, 0.007849693298339844, 0.008371353149414062, 0.008893013000488281, 0.0094146728515625, 0.009936332702636719, 0.010457992553710938, 0.010979652404785156, 0.011501312255859375, 0.012022972106933594, 0.012544631958007812, 0.013066291809082031, 0.01358795166015625, 0.014109611511230469, 0.014631271362304688, 0.015152931213378906, 0.015674591064453125, 0.016196250915527344, 0.016717910766601562, 0.01723957061767578, 0.01776123046875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 6.0, 9.0, 4.0, 14.0, 9.0, 14.0, 18.0, 20.0, 31.0, 21.0, 37.0, 54.0, 31.0, 80.0, 81.0, 85.0, 42.0, 69.0, 86.0, 58.0, 29.0, 43.0, 31.0, 23.0, 26.0, 20.0, 16.0, 6.0, 9.0, 7.0, 6.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-5.662441253662109e-06, -5.500391125679016e-06, -5.338340997695923e-06, -5.17629086971283e-06, -5.014240741729736e-06, -4.852190613746643e-06, -4.69014048576355e-06, -4.5280903577804565e-06, -4.366040229797363e-06, -4.20399010181427e-06, -4.041939973831177e-06, -3.8798898458480835e-06, -3.7178397178649902e-06, -3.555789589881897e-06, -3.3937394618988037e-06, -3.2316893339157104e-06, -3.069639205932617e-06, -2.907589077949524e-06, -2.7455389499664307e-06, -2.5834888219833374e-06, -2.421438694000244e-06, -2.259388566017151e-06, -2.0973384380340576e-06, -1.9352883100509644e-06, -1.773238182067871e-06, -1.6111880540847778e-06, -1.4491379261016846e-06, -1.2870877981185913e-06, -1.125037670135498e-06, -9.629875421524048e-07, -8.009374141693115e-07, -6.388872861862183e-07, -4.76837158203125e-07, -3.1478703022003174e-07, -1.5273690223693848e-07, 9.313225746154785e-09, 1.7136335372924805e-07, 3.334134817123413e-07, 4.954636096954346e-07, 6.575137376785278e-07, 8.195638656616211e-07, 9.816139936447144e-07, 1.1436641216278076e-06, 1.3057142496109009e-06, 1.4677643775939941e-06, 1.6298145055770874e-06, 1.7918646335601807e-06, 1.953914761543274e-06, 2.115964889526367e-06, 2.2780150175094604e-06, 2.4400651454925537e-06, 2.602115273475647e-06, 2.7641654014587402e-06, 2.9262155294418335e-06, 3.0882656574249268e-06, 3.25031578540802e-06, 3.4123659133911133e-06, 3.5744160413742065e-06, 3.7364661693573e-06, 3.898516297340393e-06, 4.060566425323486e-06, 4.22261655330658e-06, 4.384666681289673e-06, 4.546716809272766e-06, 4.708766937255859e-06]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 7.0, 5.0, 3.0, 4.0, 9.0, 11.0, 15.0, 29.0, 64.0, 74.0, 101.0, 211.0, 415.0, 883.0, 2209.0, 6554.0, 28415.0, 197968.0, 627334.0, 151975.0, 22934.0, 5763.0, 1965.0, 741.0, 402.0, 196.0, 105.0, 50.0, 33.0, 27.0, 12.0, 7.0, 8.0, 8.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.018890380859375, -0.018357276916503906, -0.017824172973632812, -0.01729106903076172, -0.016757965087890625, -0.01622486114501953, -0.015691757202148438, -0.015158653259277344, -0.01462554931640625, -0.014092445373535156, -0.013559341430664062, -0.013026237487792969, -0.012493133544921875, -0.011960029602050781, -0.011426925659179688, -0.010893821716308594, -0.0103607177734375, -0.009827613830566406, -0.009294509887695312, -0.008761405944824219, -0.008228302001953125, -0.007695198059082031, -0.0071620941162109375, -0.006628990173339844, -0.00609588623046875, -0.005562782287597656, -0.0050296783447265625, -0.004496574401855469, -0.003963470458984375, -0.0034303665161132812, -0.0028972625732421875, -0.0023641586303710938, -0.0018310546875, -0.0012979507446289062, -0.0007648468017578125, -0.00023174285888671875, 0.000301361083984375, 0.0008344650268554688, 0.0013675689697265625, 0.0019006729125976562, 0.00243377685546875, 0.0029668807983398438, 0.0034999847412109375, 0.004033088684082031, 0.004566192626953125, 0.005099296569824219, 0.0056324005126953125, 0.006165504455566406, 0.0066986083984375, 0.007231712341308594, 0.0077648162841796875, 0.008297920227050781, 0.008831024169921875, 0.009364128112792969, 0.009897232055664062, 0.010430335998535156, 0.01096343994140625, 0.011496543884277344, 0.012029647827148438, 0.012562751770019531, 0.013095855712890625, 0.013628959655761719, 0.014162063598632812, 0.014695167541503906, 0.015228271484375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 9.0, 6.0, 10.0, 11.0, 26.0, 19.0, 35.0, 32.0, 35.0, 59.0, 88.0, 91.0, 75.0, 85.0, 78.0, 76.0, 61.0, 35.0, 36.0, 29.0, 28.0, 17.0, 10.0, 3.0, 7.0, 7.0, 5.0, 6.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.003871917724609375, -0.0037503838539123535, -0.003628849983215332, -0.0035073161125183105, -0.003385782241821289, -0.0032642483711242676, -0.003142714500427246, -0.0030211806297302246, -0.002899646759033203, -0.0027781128883361816, -0.00265657901763916, -0.0025350451469421387, -0.002413511276245117, -0.0022919774055480957, -0.0021704435348510742, -0.0020489096641540527, -0.0019273757934570312, -0.0018058419227600098, -0.0016843080520629883, -0.0015627741813659668, -0.0014412403106689453, -0.0013197064399719238, -0.0011981725692749023, -0.0010766386985778809, -0.0009551048278808594, -0.0008335709571838379, -0.0007120370864868164, -0.0005905032157897949, -0.00046896934509277344, -0.00034743547439575195, -0.00022590160369873047, -0.00010436773300170898, 1.71661376953125e-05, 0.00013870000839233398, 0.00026023387908935547, 0.00038176774978637695, 0.0005033016204833984, 0.0006248354911804199, 0.0007463693618774414, 0.0008679032325744629, 0.0009894371032714844, 0.0011109709739685059, 0.0012325048446655273, 0.0013540387153625488, 0.0014755725860595703, 0.0015971064567565918, 0.0017186403274536133, 0.0018401741981506348, 0.0019617080688476562, 0.0020832419395446777, 0.0022047758102416992, 0.0023263096809387207, 0.002447843551635742, 0.0025693774223327637, 0.002690911293029785, 0.0028124451637268066, 0.002933979034423828, 0.0030555129051208496, 0.003177046775817871, 0.0032985806465148926, 0.003420114517211914, 0.0035416483879089355, 0.003663182258605957, 0.0037847161293029785, 0.00390625]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 3.0, 9.0, 12.0, 22.0, 32.0, 79.0, 79.0, 133.0, 140.0, 159.0, 120.0, 88.0, 42.0, 38.0, 23.0, 13.0, 4.0, 8.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.20603322982788086, -0.2004377394914627, -0.19484224915504456, -0.1892467439174652, -0.18365125358104706, -0.1780557632446289, -0.17246027290821075, -0.1668647825717926, -0.16126927733421326, -0.1556737869977951, -0.15007829666137695, -0.1444827914237976, -0.13888730108737946, -0.1332918107509613, -0.12769632041454315, -0.122100830078125, -0.11650533974170685, -0.1109098494052887, -0.10531435161828995, -0.0997188612818718, -0.09412336349487305, -0.0885278731584549, -0.08293238282203674, -0.07733689248561859, -0.07174139469861984, -0.06614590436220169, -0.06055040657520294, -0.05495491623878479, -0.04935942217707634, -0.04376392811536789, -0.03816843777894974, -0.03257294371724129, -0.026977434754371643, -0.021381940692663193, -0.01578644849359989, -0.01019095629453659, -0.00459546223282814, 0.00100003182888031, 0.006595522165298462, 0.012191016227006912, 0.017786510288715363, 0.023382004350423813, 0.028977496549487114, 0.034572988748550415, 0.040168482810258865, 0.045763976871967316, 0.05135946720838547, 0.05695496127009392, 0.06255045533180237, 0.06814594566822052, 0.07374144345521927, 0.07933693379163742, 0.08493243157863617, 0.09052792191505432, 0.09612341225147247, 0.10171890258789062, 0.10731440037488937, 0.11290989071130753, 0.11850538849830627, 0.12410087883472443, 0.12969636917114258, 0.13529187440872192, 0.14088734984397888, 0.14648285508155823, 0.15207834541797638]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 6.0, 8.0, 9.0, 5.0, 4.0, 9.0, 14.0, 22.0, 14.0, 26.0, 34.0, 31.0, 47.0, 44.0, 49.0, 40.0, 44.0, 54.0, 62.0, 58.0, 57.0, 56.0, 36.0, 42.0, 32.0, 45.0, 24.0, 31.0, 34.0, 23.0, 17.0, 11.0, 7.0, 5.0, 6.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07813102751970291, -0.07540745288133621, -0.07268387824296951, -0.06996030360460281, -0.06723672896623611, -0.06451314687728882, -0.06178957596421242, -0.05906599760055542, -0.05634242296218872, -0.05361884832382202, -0.05089527368545532, -0.04817169904708862, -0.045448120683431625, -0.042724546045064926, -0.04000097140669823, -0.03727739304304123, -0.03455382212996483, -0.03183024749159813, -0.02910667099058628, -0.02638309635221958, -0.023659519851207733, -0.020935945212841034, -0.018212370574474335, -0.015488794073462486, -0.012765219435095787, -0.010041643865406513, -0.007318068761378527, -0.00459449365735054, -0.0018709180876612663, 0.0008526574820280075, 0.0035762321203947067, 0.006299808621406555, 0.009023383259773254, 0.011746958829462528, 0.014470534399151802, 0.0171941090375185, 0.01991768553853035, 0.02264126017689705, 0.025364834815263748, 0.028088411316275597, 0.030811985954642296, 0.033535562455654144, 0.036259137094020844, 0.03898271173238754, 0.04170628637075424, 0.04442986100912094, 0.04715343564748764, 0.04987701401114464, 0.05260058864951134, 0.055324163287878036, 0.058047737926244736, 0.06077131628990173, 0.06349489092826843, 0.06621846556663513, 0.06894204020500183, 0.07166561484336853, 0.07438918948173523, 0.07711276412010193, 0.07983633875846863, 0.08255991339683533, 0.08528348803520203, 0.08800706267356873, 0.09073063731193542, 0.09345421940088272, 0.09617779403924942]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 5.0, 12.0, 10.0, 16.0, 29.0, 44.0, 65.0, 98.0, 170.0, 314.0, 517.0, 985.0, 2021.0, 4517.0, 11774.0, 38137.0, 199954.0, 669989.0, 84590.0, 21635.0, 7411.0, 3122.0, 1439.0, 790.0, 406.0, 185.0, 121.0, 75.0, 56.0, 21.0, 13.0, 15.0, 13.0, 6.0, 6.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0867919921875, -0.08271217346191406, -0.07863235473632812, -0.07455253601074219, -0.07047271728515625, -0.06639289855957031, -0.062313079833984375, -0.05823326110839844, -0.0541534423828125, -0.05007362365722656, -0.045993804931640625, -0.04191398620605469, -0.03783416748046875, -0.03375434875488281, -0.029674530029296875, -0.025594711303710938, -0.021514892578125, -0.017435073852539062, -0.013355255126953125, -0.009275436401367188, -0.00519561767578125, -0.0011157989501953125, 0.002964019775390625, 0.0070438385009765625, 0.0111236572265625, 0.015203475952148438, 0.019283294677734375, 0.023363113403320312, 0.02744293212890625, 0.03152275085449219, 0.035602569580078125, 0.03968238830566406, 0.04376220703125, 0.04784202575683594, 0.051921844482421875, 0.05600166320800781, 0.06008148193359375, 0.06416130065917969, 0.06824111938476562, 0.07232093811035156, 0.0764007568359375, 0.08048057556152344, 0.08456039428710938, 0.08864021301269531, 0.09272003173828125, 0.09679985046386719, 0.10087966918945312, 0.10495948791503906, 0.109039306640625, 0.11311912536621094, 0.11719894409179688, 0.12127876281738281, 0.12535858154296875, 0.1294384002685547, 0.13351821899414062, 0.13759803771972656, 0.1416778564453125, 0.14575767517089844, 0.14983749389648438, 0.1539173126220703, 0.15799713134765625, 0.1620769500732422, 0.16615676879882812, 0.17023658752441406, 0.17431640625]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 9.0, 7.0, 3.0, 10.0, 8.0, 8.0, 18.0, 21.0, 19.0, 30.0, 35.0, 40.0, 44.0, 44.0, 47.0, 53.0, 54.0, 77.0, 45.0, 62.0, 49.0, 43.0, 58.0, 38.0, 24.0, 24.0, 38.0, 26.0, 25.0, 15.0, 9.0, 7.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1494140625, -0.1441936492919922, -0.13897323608398438, -0.13375282287597656, -0.12853240966796875, -0.12331199645996094, -0.11809158325195312, -0.11287117004394531, -0.1076507568359375, -0.10243034362792969, -0.09720993041992188, -0.09198951721191406, -0.08676910400390625, -0.08154869079589844, -0.07632827758789062, -0.07110786437988281, -0.065887451171875, -0.06066703796386719, -0.055446624755859375, -0.05022621154785156, -0.04500579833984375, -0.03978538513183594, -0.034564971923828125, -0.029344558715820312, -0.0241241455078125, -0.018903732299804688, -0.013683319091796875, -0.008462905883789062, -0.00324249267578125, 0.0019779205322265625, 0.007198333740234375, 0.012418746948242188, 0.01763916015625, 0.022859573364257812, 0.028079986572265625, 0.03330039978027344, 0.03852081298828125, 0.04374122619628906, 0.048961639404296875, 0.05418205261230469, 0.0594024658203125, 0.06462287902832031, 0.06984329223632812, 0.07506370544433594, 0.08028411865234375, 0.08550453186035156, 0.09072494506835938, 0.09594535827636719, 0.101165771484375, 0.10638618469238281, 0.11160659790039062, 0.11682701110839844, 0.12204742431640625, 0.12726783752441406, 0.13248825073242188, 0.1377086639404297, 0.1429290771484375, 0.1481494903564453, 0.15336990356445312, 0.15859031677246094, 0.16381072998046875, 0.16903114318847656, 0.17425155639648438, 0.1794719696044922, 0.1846923828125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 4.0, 5.0, 5.0, 17.0, 27.0, 30.0, 58.0, 76.0, 121.0, 210.0, 530.0, 3093.0, 95841.0, 935362.0, 11314.0, 1109.0, 306.0, 143.0, 95.0, 48.0, 47.0, 27.0, 18.0, 30.0, 11.0, 11.0, 5.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47314453125, -0.4600868225097656, -0.44702911376953125, -0.4339714050292969, -0.4209136962890625, -0.4078559875488281, -0.39479827880859375, -0.3817405700683594, -0.368682861328125, -0.3556251525878906, -0.34256744384765625, -0.3295097351074219, -0.3164520263671875, -0.3033943176269531, -0.29033660888671875, -0.2772789001464844, -0.26422119140625, -0.2511634826660156, -0.23810577392578125, -0.22504806518554688, -0.2119903564453125, -0.19893264770507812, -0.18587493896484375, -0.17281723022460938, -0.159759521484375, -0.14670181274414062, -0.13364410400390625, -0.12058639526367188, -0.1075286865234375, -0.09447097778320312, -0.08141326904296875, -0.06835556030273438, -0.0552978515625, -0.042240142822265625, -0.02918243408203125, -0.016124725341796875, -0.0030670166015625, 0.009990692138671875, 0.02304840087890625, 0.036106109619140625, 0.049163818359375, 0.062221527099609375, 0.07527923583984375, 0.08833694458007812, 0.1013946533203125, 0.11445236206054688, 0.12751007080078125, 0.14056777954101562, 0.15362548828125, 0.16668319702148438, 0.17974090576171875, 0.19279861450195312, 0.2058563232421875, 0.21891403198242188, 0.23197174072265625, 0.24502944946289062, 0.258087158203125, 0.2711448669433594, 0.28420257568359375, 0.2972602844238281, 0.3103179931640625, 0.3233757019042969, 0.33643341064453125, 0.3494911193847656, 0.362548828125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 4.0, 7.0, 7.0, 3.0, 9.0, 11.0, 17.0, 25.0, 43.0, 37.0, 54.0, 53.0, 57.0, 63.0, 65.0, 53.0, 72.0, 80.0, 52.0, 47.0, 51.0, 40.0, 36.0, 27.0, 19.0, 20.0, 18.0, 15.0, 10.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.264404296875, -0.2571239471435547, -0.24984359741210938, -0.24256324768066406, -0.23528289794921875, -0.22800254821777344, -0.22072219848632812, -0.2134418487548828, -0.2061614990234375, -0.1988811492919922, -0.19160079956054688, -0.18432044982910156, -0.17704010009765625, -0.16975975036621094, -0.16247940063476562, -0.1551990509033203, -0.147918701171875, -0.1406383514404297, -0.13335800170898438, -0.12607765197753906, -0.11879730224609375, -0.11151695251464844, -0.10423660278320312, -0.09695625305175781, -0.0896759033203125, -0.08239555358886719, -0.07511520385742188, -0.06783485412597656, -0.06055450439453125, -0.05327415466308594, -0.045993804931640625, -0.03871345520019531, -0.03143310546875, -0.024152755737304688, -0.016872406005859375, -0.009592056274414062, -0.00231170654296875, 0.0049686431884765625, 0.012248992919921875, 0.019529342651367188, 0.0268096923828125, 0.03409004211425781, 0.041370391845703125, 0.04865074157714844, 0.05593109130859375, 0.06321144104003906, 0.07049179077148438, 0.07777214050292969, 0.085052490234375, 0.09233283996582031, 0.09961318969726562, 0.10689353942871094, 0.11417388916015625, 0.12145423889160156, 0.12873458862304688, 0.1360149383544922, 0.1432952880859375, 0.1505756378173828, 0.15785598754882812, 0.16513633728027344, 0.17241668701171875, 0.17969703674316406, 0.18697738647460938, 0.1942577362060547, 0.2015380859375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 7.0, 10.0, 10.0, 17.0, 24.0, 33.0, 55.0, 78.0, 133.0, 247.0, 449.0, 918.0, 2384.0, 7469.0, 42421.0, 621680.0, 336352.0, 26908.0, 5720.0, 1900.0, 809.0, 386.0, 191.0, 112.0, 70.0, 49.0, 40.0, 22.0, 13.0, 9.0, 12.0, 6.0, 1.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0457763671875, -0.044599294662475586, -0.04342222213745117, -0.04224514961242676, -0.041068077087402344, -0.03989100456237793, -0.038713932037353516, -0.0375368595123291, -0.03635978698730469, -0.03518271446228027, -0.03400564193725586, -0.032828569412231445, -0.03165149688720703, -0.030474424362182617, -0.029297351837158203, -0.02812027931213379, -0.026943206787109375, -0.02576613426208496, -0.024589061737060547, -0.023411989212036133, -0.02223491668701172, -0.021057844161987305, -0.01988077163696289, -0.018703699111938477, -0.017526626586914062, -0.01634955406188965, -0.015172481536865234, -0.01399540901184082, -0.012818336486816406, -0.011641263961791992, -0.010464191436767578, -0.009287118911743164, -0.00811004638671875, -0.006932973861694336, -0.005755901336669922, -0.004578828811645508, -0.0034017562866210938, -0.0022246837615966797, -0.0010476112365722656, 0.00012946128845214844, 0.0013065338134765625, 0.0024836063385009766, 0.0036606788635253906, 0.004837751388549805, 0.006014823913574219, 0.007191896438598633, 0.008368968963623047, 0.009546041488647461, 0.010723114013671875, 0.011900186538696289, 0.013077259063720703, 0.014254331588745117, 0.015431404113769531, 0.016608476638793945, 0.01778554916381836, 0.018962621688842773, 0.020139694213867188, 0.0213167667388916, 0.022493839263916016, 0.02367091178894043, 0.024847984313964844, 0.026025056838989258, 0.027202129364013672, 0.028379201889038086, 0.0295562744140625]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 5.0, 14.0, 9.0, 14.0, 22.0, 44.0, 94.0, 115.0, 149.0, 152.0, 150.0, 77.0, 49.0, 43.0, 16.0, 20.0, 6.0, 4.0, 4.0, 8.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.68899917602539e-06, -7.442198693752289e-06, -7.195398211479187e-06, -6.948597729206085e-06, -6.701797246932983e-06, -6.454996764659882e-06, -6.20819628238678e-06, -5.961395800113678e-06, -5.714595317840576e-06, -5.467794835567474e-06, -5.2209943532943726e-06, -4.974193871021271e-06, -4.727393388748169e-06, -4.480592906475067e-06, -4.233792424201965e-06, -3.9869919419288635e-06, -3.7401914596557617e-06, -3.49339097738266e-06, -3.246590495109558e-06, -2.9997900128364563e-06, -2.7529895305633545e-06, -2.5061890482902527e-06, -2.259388566017151e-06, -2.012588083744049e-06, -1.7657876014709473e-06, -1.5189871191978455e-06, -1.2721866369247437e-06, -1.0253861546516418e-06, -7.7858567237854e-07, -5.317851901054382e-07, -2.849847078323364e-07, -3.818422555923462e-08, 2.086162567138672e-07, 4.55416738986969e-07, 7.022172212600708e-07, 9.490177035331726e-07, 1.1958181858062744e-06, 1.4426186680793762e-06, 1.689419150352478e-06, 1.93621963262558e-06, 2.1830201148986816e-06, 2.4298205971717834e-06, 2.6766210794448853e-06, 2.923421561717987e-06, 3.170222043991089e-06, 3.4170225262641907e-06, 3.6638230085372925e-06, 3.910623490810394e-06, 4.157423973083496e-06, 4.404224455356598e-06, 4.6510249376297e-06, 4.8978254199028015e-06, 5.144625902175903e-06, 5.391426384449005e-06, 5.638226866722107e-06, 5.885027348995209e-06, 6.1318278312683105e-06, 6.378628313541412e-06, 6.625428795814514e-06, 6.872229278087616e-06, 7.119029760360718e-06, 7.36583024263382e-06, 7.612630724906921e-06, 7.859431207180023e-06, 8.106231689453125e-06]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 6.0, 10.0, 17.0, 16.0, 28.0, 39.0, 98.0, 156.0, 286.0, 619.0, 1754.0, 6793.0, 67260.0, 905192.0, 56972.0, 6346.0, 1686.0, 645.0, 296.0, 142.0, 75.0, 44.0, 25.0, 19.0, 6.0, 4.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.05230712890625, -0.050253868103027344, -0.04820060729980469, -0.04614734649658203, -0.044094085693359375, -0.04204082489013672, -0.03998756408691406, -0.037934303283691406, -0.03588104248046875, -0.033827781677246094, -0.03177452087402344, -0.02972126007080078, -0.027667999267578125, -0.02561473846435547, -0.023561477661132812, -0.021508216857910156, -0.0194549560546875, -0.017401695251464844, -0.015348434448242188, -0.013295173645019531, -0.011241912841796875, -0.009188652038574219, -0.0071353912353515625, -0.005082130432128906, -0.00302886962890625, -0.0009756088256835938, 0.0010776519775390625, 0.0031309127807617188, 0.005184173583984375, 0.007237434387207031, 0.009290695190429688, 0.011343955993652344, 0.013397216796875, 0.015450477600097656, 0.017503738403320312, 0.01955699920654297, 0.021610260009765625, 0.02366352081298828, 0.025716781616210938, 0.027770042419433594, 0.02982330322265625, 0.031876564025878906, 0.03392982482910156, 0.03598308563232422, 0.038036346435546875, 0.04008960723876953, 0.04214286804199219, 0.044196128845214844, 0.0462493896484375, 0.048302650451660156, 0.05035591125488281, 0.05240917205810547, 0.054462432861328125, 0.05651569366455078, 0.05856895446777344, 0.060622215270996094, 0.06267547607421875, 0.0647287368774414, 0.06678199768066406, 0.06883525848388672, 0.07088851928710938, 0.07294178009033203, 0.07499504089355469, 0.07704830169677734, 0.0791015625]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 1.0, 6.0, 5.0, 6.0, 13.0, 11.0, 9.0, 15.0, 26.0, 30.0, 33.0, 63.0, 83.0, 94.0, 122.0, 100.0, 103.0, 76.0, 46.0, 46.0, 28.0, 20.0, 17.0, 11.0, 8.0, 3.0, 3.0, 5.0, 2.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01136016845703125, -0.01098942756652832, -0.01061868667602539, -0.010247945785522461, -0.009877204895019531, -0.009506464004516602, -0.009135723114013672, -0.008764982223510742, -0.008394241333007812, -0.008023500442504883, -0.007652759552001953, -0.0072820186614990234, -0.006911277770996094, -0.006540536880493164, -0.006169795989990234, -0.005799055099487305, -0.005428314208984375, -0.005057573318481445, -0.004686832427978516, -0.004316091537475586, -0.003945350646972656, -0.0035746097564697266, -0.003203868865966797, -0.002833127975463867, -0.0024623870849609375, -0.002091646194458008, -0.0017209053039550781, -0.0013501644134521484, -0.0009794235229492188, -0.0006086826324462891, -0.00023794174194335938, 0.0001327991485595703, 0.0005035400390625, 0.0008742809295654297, 0.0012450218200683594, 0.001615762710571289, 0.0019865036010742188, 0.0023572444915771484, 0.002727985382080078, 0.003098726272583008, 0.0034694671630859375, 0.003840208053588867, 0.004210948944091797, 0.0045816898345947266, 0.004952430725097656, 0.005323171615600586, 0.005693912506103516, 0.006064653396606445, 0.006435394287109375, 0.006806135177612305, 0.007176876068115234, 0.007547616958618164, 0.007918357849121094, 0.008289098739624023, 0.008659839630126953, 0.009030580520629883, 0.009401321411132812, 0.009772062301635742, 0.010142803192138672, 0.010513544082641602, 0.010884284973144531, 0.011255025863647461, 0.01162576675415039, 0.01199650764465332, 0.01236724853515625]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 7.0, 6.0, 12.0, 27.0, 58.0, 90.0, 126.0, 164.0, 186.0, 114.0, 74.0, 62.0, 33.0, 19.0, 10.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.4505625069141388, -0.43900638818740845, -0.4274502396583557, -0.41589412093162537, -0.404338002204895, -0.3927818536758423, -0.38122573494911194, -0.3696696162223816, -0.35811346769332886, -0.3465573489665985, -0.3350012004375458, -0.32344508171081543, -0.3118889331817627, -0.30033281445503235, -0.288776695728302, -0.27722054719924927, -0.2656644284725189, -0.2541083097457886, -0.24255216121673584, -0.2309960424900055, -0.21943990886211395, -0.2078837752342224, -0.19632765650749207, -0.18477152287960052, -0.17321538925170898, -0.16165925562381744, -0.1501031219959259, -0.13854700326919556, -0.12699086964130402, -0.11543473601341248, -0.10387860983610153, -0.09232248365879059, -0.08076637983322144, -0.0692102462053299, -0.05765412002801895, -0.04609799012541771, -0.03454186022281647, -0.022985730320215225, -0.011429600417613983, 0.00012652575969696045, 0.011682659387588501, 0.023238789290189743, 0.034794919192790985, 0.04635104909539223, 0.05790717899799347, 0.06946331262588501, 0.08101943880319595, 0.0925755649805069, 0.10413169860839844, 0.11568783223628998, 0.12724396586418152, 0.13880008459091187, 0.1503562182188034, 0.16191235184669495, 0.1734684705734253, 0.18502460420131683, 0.19658073782920837, 0.20813687145709991, 0.21969300508499146, 0.2312491238117218, 0.24280525743961334, 0.2543613910675049, 0.26591750979423523, 0.2774736285209656, 0.2890297770500183]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 3.0, 1.0, 4.0, 8.0, 7.0, 9.0, 3.0, 6.0, 9.0, 19.0, 10.0, 14.0, 12.0, 33.0, 26.0, 28.0, 34.0, 23.0, 29.0, 30.0, 40.0, 34.0, 45.0, 40.0, 37.0, 49.0, 43.0, 44.0, 39.0, 42.0, 32.0, 28.0, 26.0, 34.0, 24.0, 23.0, 19.0, 17.0, 18.0, 12.0, 10.0, 8.0, 14.0, 7.0, 4.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.23896682262420654, -0.2311481088399887, -0.22332940995693207, -0.21551069617271423, -0.2076919972896576, -0.19987328350543976, -0.19205456972122192, -0.18423587083816528, -0.17641717195510864, -0.1685984581708908, -0.16077975928783417, -0.15296104550361633, -0.1451423466205597, -0.13732363283634186, -0.12950491905212402, -0.12168622016906738, -0.11386750638484955, -0.10604880005121231, -0.09823009371757507, -0.09041137993335724, -0.0825926810503006, -0.07477396726608276, -0.06695526093244553, -0.05913655459880829, -0.05131784826517105, -0.043499141931533813, -0.035680435597896576, -0.02786172553896904, -0.020043019205331802, -0.012224312871694565, -0.004405602812767029, 0.0034131035208702087, 0.011231809854507446, 0.019050516188144684, 0.02686922438442707, 0.03468793258070946, 0.042506638914346695, 0.05032534524798393, 0.05814405530691147, 0.0659627616405487, 0.07378146797418594, 0.08160017430782318, 0.08941888064146042, 0.09723758697509766, 0.10505630075931549, 0.11287499964237213, 0.12069371342658997, 0.1285124123096466, 0.13633112609386444, 0.14414983987808228, 0.15196853876113892, 0.15978725254535675, 0.1676059514284134, 0.17542466521263123, 0.18324336409568787, 0.1910620778799057, 0.19888079166412354, 0.20669950544834137, 0.214518204331398, 0.22233691811561584, 0.23015561699867249, 0.23797433078289032, 0.24579304456710815, 0.2536117434501648, 0.26143044233322144]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 0.0, 1.0, 1.0, 4.0, 10.0, 4.0, 9.0, 7.0, 21.0, 22.0, 26.0, 41.0, 53.0, 81.0, 99.0, 141.0, 207.0, 293.0, 385.0, 652.0, 950.0, 1511.0, 2585.0, 4842.0, 9592.0, 23540.0, 85643.0, 697571.0, 2606771.0, 633952.0, 81207.0, 22507.0, 9680.0, 4669.0, 2689.0, 1523.0, 953.0, 643.0, 422.0, 262.0, 198.0, 134.0, 100.0, 64.0, 53.0, 41.0, 38.0, 28.0, 14.0, 11.0, 12.0, 5.0, 7.0, 7.0, 5.0, 4.0, 1.0, 3.0], "bins": [-0.120361328125, -0.11687088012695312, -0.11338043212890625, -0.10988998413085938, -0.1063995361328125, -0.10290908813476562, -0.09941864013671875, -0.09592819213867188, -0.092437744140625, -0.08894729614257812, -0.08545684814453125, -0.08196640014648438, -0.0784759521484375, -0.07498550415039062, -0.07149505615234375, -0.06800460815429688, -0.06451416015625, -0.061023712158203125, -0.05753326416015625, -0.054042816162109375, -0.0505523681640625, -0.047061920166015625, -0.04357147216796875, -0.040081024169921875, -0.036590576171875, -0.033100128173828125, -0.02960968017578125, -0.026119232177734375, -0.0226287841796875, -0.019138336181640625, -0.01564788818359375, -0.012157440185546875, -0.0086669921875, -0.005176544189453125, -0.00168609619140625, 0.001804351806640625, 0.0052947998046875, 0.008785247802734375, 0.01227569580078125, 0.015766143798828125, 0.019256591796875, 0.022747039794921875, 0.02623748779296875, 0.029727935791015625, 0.0332183837890625, 0.036708831787109375, 0.04019927978515625, 0.043689727783203125, 0.04718017578125, 0.050670623779296875, 0.05416107177734375, 0.057651519775390625, 0.0611419677734375, 0.06463241577148438, 0.06812286376953125, 0.07161331176757812, 0.075103759765625, 0.07859420776367188, 0.08208465576171875, 0.08557510375976562, 0.0890655517578125, 0.09255599975585938, 0.09604644775390625, 0.09953689575195312, 0.10302734375]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 6.0, 5.0, 9.0, 4.0, 7.0, 19.0, 19.0, 26.0, 34.0, 31.0, 35.0, 42.0, 47.0, 57.0, 57.0, 46.0, 69.0, 68.0, 62.0, 51.0, 46.0, 46.0, 45.0, 26.0, 22.0, 35.0, 20.0, 14.0, 21.0, 15.0, 9.0, 10.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0888671875, -0.08586597442626953, -0.08286476135253906, -0.0798635482788086, -0.07686233520507812, -0.07386112213134766, -0.07085990905761719, -0.06785869598388672, -0.06485748291015625, -0.06185626983642578, -0.05885505676269531, -0.055853843688964844, -0.052852630615234375, -0.049851417541503906, -0.04685020446777344, -0.04384899139404297, -0.0408477783203125, -0.03784656524658203, -0.03484535217285156, -0.031844139099121094, -0.028842926025390625, -0.025841712951660156, -0.022840499877929688, -0.01983928680419922, -0.01683807373046875, -0.013836860656738281, -0.010835647583007812, -0.007834434509277344, -0.004833221435546875, -0.0018320083618164062, 0.0011692047119140625, 0.004170417785644531, 0.007171630859375, 0.010172843933105469, 0.013174057006835938, 0.016175270080566406, 0.019176483154296875, 0.022177696228027344, 0.025178909301757812, 0.02818012237548828, 0.03118133544921875, 0.03418254852294922, 0.03718376159667969, 0.040184974670410156, 0.043186187744140625, 0.046187400817871094, 0.04918861389160156, 0.05218982696533203, 0.0551910400390625, 0.05819225311279297, 0.06119346618652344, 0.0641946792602539, 0.06719589233398438, 0.07019710540771484, 0.07319831848144531, 0.07619953155517578, 0.07920074462890625, 0.08220195770263672, 0.08520317077636719, 0.08820438385009766, 0.09120559692382812, 0.0942068099975586, 0.09720802307128906, 0.10020923614501953, 0.10321044921875]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 8.0, 14.0, 12.0, 24.0, 43.0, 95.0, 208.0, 693.0, 4499.0, 153897.0, 4005177.0, 27040.0, 1826.0, 411.0, 168.0, 74.0, 35.0, 20.0, 12.0, 9.0, 8.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4326171875, -0.4183387756347656, -0.40406036376953125, -0.3897819519042969, -0.3755035400390625, -0.3612251281738281, -0.34694671630859375, -0.3326683044433594, -0.318389892578125, -0.3041114807128906, -0.28983306884765625, -0.2755546569824219, -0.2612762451171875, -0.24699783325195312, -0.23271942138671875, -0.21844100952148438, -0.20416259765625, -0.18988418579101562, -0.17560577392578125, -0.16132736206054688, -0.1470489501953125, -0.13277053833007812, -0.11849212646484375, -0.10421371459960938, -0.089935302734375, -0.07565689086914062, -0.06137847900390625, -0.047100067138671875, -0.0328216552734375, -0.018543243408203125, -0.00426483154296875, 0.010013580322265625, 0.0242919921875, 0.038570404052734375, 0.05284881591796875, 0.06712722778320312, 0.0814056396484375, 0.09568405151367188, 0.10996246337890625, 0.12424087524414062, 0.138519287109375, 0.15279769897460938, 0.16707611083984375, 0.18135452270507812, 0.1956329345703125, 0.20991134643554688, 0.22418975830078125, 0.23846817016601562, 0.25274658203125, 0.2670249938964844, 0.28130340576171875, 0.2955818176269531, 0.3098602294921875, 0.3241386413574219, 0.33841705322265625, 0.3526954650878906, 0.366973876953125, 0.3812522888183594, 0.39553070068359375, 0.4098091125488281, 0.4240875244140625, 0.4383659362792969, 0.45264434814453125, 0.4669227600097656, 0.481201171875]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 7.0, 4.0, 2.0, 8.0, 7.0, 6.0, 20.0, 22.0, 22.0, 30.0, 33.0, 59.0, 88.0, 114.0, 215.0, 336.0, 609.0, 725.0, 625.0, 411.0, 264.0, 149.0, 87.0, 60.0, 39.0, 42.0, 26.0, 15.0, 11.0, 13.0, 4.0, 4.0, 10.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.039306640625, -0.03788423538208008, -0.036461830139160156, -0.035039424896240234, -0.03361701965332031, -0.03219461441040039, -0.03077220916748047, -0.029349803924560547, -0.027927398681640625, -0.026504993438720703, -0.02508258819580078, -0.02366018295288086, -0.022237777709960938, -0.020815372467041016, -0.019392967224121094, -0.017970561981201172, -0.01654815673828125, -0.015125751495361328, -0.013703346252441406, -0.012280941009521484, -0.010858535766601562, -0.00943613052368164, -0.008013725280761719, -0.006591320037841797, -0.005168914794921875, -0.003746509552001953, -0.0023241043090820312, -0.0009016990661621094, 0.0005207061767578125, 0.0019431114196777344, 0.0033655166625976562, 0.004787921905517578, 0.0062103271484375, 0.007632732391357422, 0.009055137634277344, 0.010477542877197266, 0.011899948120117188, 0.01332235336303711, 0.014744758605957031, 0.016167163848876953, 0.017589569091796875, 0.019011974334716797, 0.02043437957763672, 0.02185678482055664, 0.023279190063476562, 0.024701595306396484, 0.026124000549316406, 0.027546405792236328, 0.02896881103515625, 0.030391216278076172, 0.031813621520996094, 0.033236026763916016, 0.03465843200683594, 0.03608083724975586, 0.03750324249267578, 0.0389256477355957, 0.040348052978515625, 0.04177045822143555, 0.04319286346435547, 0.04461526870727539, 0.04603767395019531, 0.047460079193115234, 0.048882484436035156, 0.05030488967895508, 0.051727294921875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 4.0, 10.0, 12.0, 22.0, 32.0, 44.0, 61.0, 73.0, 109.0, 113.0, 97.0, 100.0, 95.0, 78.0, 36.0, 43.0, 25.0, 20.0, 10.0, 12.0, 10.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22854658961296082, -0.22285278141498566, -0.2171589583158493, -0.21146515011787415, -0.205771341919899, -0.20007753372192383, -0.19438371062278748, -0.18868990242481232, -0.18299609422683716, -0.177302286028862, -0.17160846292972565, -0.1659146547317505, -0.16022084653377533, -0.15452703833580017, -0.14883321523666382, -0.14313940703868866, -0.1374455988407135, -0.13175179064273834, -0.126057967543602, -0.12036415934562683, -0.11467035114765167, -0.10897653549909592, -0.10328271985054016, -0.097588911652565, -0.09189508855342865, -0.0862012729048729, -0.08050746470689774, -0.07481364905834198, -0.06911984086036682, -0.06342602521181107, -0.05773221328854561, -0.05203840136528015, -0.04634459316730499, -0.040650781244039536, -0.03495696932077408, -0.029263155534863472, -0.023569343611598015, -0.017875531688332558, -0.012181717902421951, -0.006487905979156494, -0.000794094055891037, 0.0048997183330357075, 0.010593530721962452, 0.016287343576550484, 0.02198115549981594, 0.027674967423081398, 0.033368781208992004, 0.03906259313225746, 0.04475640505552292, 0.050450216978788376, 0.05614402890205383, 0.06183784455060959, 0.06753165274858475, 0.0732254683971405, 0.07891927659511566, 0.08461309224367142, 0.09030690789222717, 0.09600072354078293, 0.10169453173875809, 0.10738834738731384, 0.113082155585289, 0.11877597123384476, 0.12446978688240051, 0.13016359508037567, 0.13585740327835083]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 7.0, 3.0, 6.0, 8.0, 4.0, 6.0, 18.0, 19.0, 19.0, 23.0, 33.0, 22.0, 27.0, 26.0, 45.0, 34.0, 43.0, 47.0, 37.0, 49.0, 53.0, 45.0, 48.0, 41.0, 40.0, 38.0, 34.0, 30.0, 37.0, 30.0, 17.0, 23.0, 21.0, 20.0, 14.0, 8.0, 16.0, 6.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10078470408916473, -0.09767913073301315, -0.09457355737686157, -0.09146799147129059, -0.08836241811513901, -0.08525684475898743, -0.08215127885341644, -0.07904570549726486, -0.07594013214111328, -0.0728345587849617, -0.06972898542881012, -0.06662341952323914, -0.06351784616708755, -0.060412272810935974, -0.05730670318007469, -0.05420113354921341, -0.05109556019306183, -0.04798998683691025, -0.044884417206048965, -0.04177884757518768, -0.0386732742190361, -0.03556770086288452, -0.03246213123202324, -0.029356559738516808, -0.026250988245010376, -0.023145416751503944, -0.020039845257997513, -0.01693427376449108, -0.01382870227098465, -0.010723130777478218, -0.0076175592839717865, -0.004511987790465355, -0.0014064162969589233, 0.0016991551965475082, 0.00480472669005394, 0.007910298183560371, 0.011015869677066803, 0.014121441170573235, 0.017227012664079666, 0.020332584157586098, 0.02343815565109253, 0.02654372714459896, 0.029649298638105392, 0.032754868268966675, 0.035860441625118256, 0.038966014981269836, 0.04207158461213112, 0.0451771542429924, 0.04828272759914398, 0.05138830095529556, 0.054493870586156845, 0.05759944021701813, 0.06070501357316971, 0.06381058692932129, 0.06691615283489227, 0.07002172619104385, 0.07312729954719543, 0.07623287290334702, 0.0793384462594986, 0.08244401216506958, 0.08554958552122116, 0.08865515887737274, 0.09176072478294373, 0.0948662981390953, 0.09797187149524689]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 6.0, 8.0, 7.0, 9.0, 16.0, 24.0, 44.0, 39.0, 72.0, 93.0, 157.0, 248.0, 455.0, 774.0, 1298.0, 2438.0, 4528.0, 9428.0, 20521.0, 60095.0, 279263.0, 498608.0, 112020.0, 31798.0, 12993.0, 6254.0, 3240.0, 1727.0, 939.0, 547.0, 293.0, 214.0, 134.0, 88.0, 58.0, 33.0, 33.0, 20.0, 12.0, 11.0, 9.0, 0.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03985595703125, -0.038619041442871094, -0.03738212585449219, -0.03614521026611328, -0.034908294677734375, -0.03367137908935547, -0.03243446350097656, -0.031197547912597656, -0.02996063232421875, -0.028723716735839844, -0.027486801147460938, -0.02624988555908203, -0.025012969970703125, -0.02377605438232422, -0.022539138793945312, -0.021302223205566406, -0.0200653076171875, -0.018828392028808594, -0.017591476440429688, -0.01635456085205078, -0.015117645263671875, -0.013880729675292969, -0.012643814086914062, -0.011406898498535156, -0.01016998291015625, -0.008933067321777344, -0.0076961517333984375, -0.006459236145019531, -0.005222320556640625, -0.003985404968261719, -0.0027484893798828125, -0.0015115737915039062, -0.000274658203125, 0.0009622573852539062, 0.0021991729736328125, 0.0034360885620117188, 0.004673004150390625, 0.005909919738769531, 0.0071468353271484375, 0.008383750915527344, 0.00962066650390625, 0.010857582092285156, 0.012094497680664062, 0.013331413269042969, 0.014568328857421875, 0.01580524444580078, 0.017042160034179688, 0.018279075622558594, 0.0195159912109375, 0.020752906799316406, 0.021989822387695312, 0.02322673797607422, 0.024463653564453125, 0.02570056915283203, 0.026937484741210938, 0.028174400329589844, 0.02941131591796875, 0.030648231506347656, 0.03188514709472656, 0.03312206268310547, 0.034358978271484375, 0.03559589385986328, 0.03683280944824219, 0.038069725036621094, 0.039306640625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 5.0, 5.0, 4.0, 9.0, 7.0, 9.0, 16.0, 16.0, 17.0, 15.0, 19.0, 33.0, 31.0, 26.0, 30.0, 39.0, 27.0, 49.0, 66.0, 52.0, 47.0, 56.0, 52.0, 32.0, 48.0, 43.0, 32.0, 34.0, 33.0, 28.0, 19.0, 17.0, 25.0, 12.0, 19.0, 9.0, 8.0, 7.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.058837890625, -0.056914329528808594, -0.05499076843261719, -0.05306720733642578, -0.051143646240234375, -0.04922008514404297, -0.04729652404785156, -0.045372962951660156, -0.04344940185546875, -0.041525840759277344, -0.03960227966308594, -0.03767871856689453, -0.035755157470703125, -0.03383159637451172, -0.03190803527832031, -0.029984474182128906, -0.0280609130859375, -0.026137351989746094, -0.024213790893554688, -0.02229022979736328, -0.020366668701171875, -0.01844310760498047, -0.016519546508789062, -0.014595985412597656, -0.01267242431640625, -0.010748863220214844, -0.008825302124023438, -0.006901741027832031, -0.004978179931640625, -0.0030546188354492188, -0.0011310577392578125, 0.0007925033569335938, 0.002716064453125, 0.004639625549316406, 0.0065631866455078125, 0.008486747741699219, 0.010410308837890625, 0.012333869934082031, 0.014257431030273438, 0.016180992126464844, 0.01810455322265625, 0.020028114318847656, 0.021951675415039062, 0.02387523651123047, 0.025798797607421875, 0.02772235870361328, 0.029645919799804688, 0.031569480895996094, 0.0334930419921875, 0.035416603088378906, 0.03734016418457031, 0.03926372528076172, 0.041187286376953125, 0.04311084747314453, 0.04503440856933594, 0.046957969665527344, 0.04888153076171875, 0.050805091857910156, 0.05272865295410156, 0.05465221405029297, 0.056575775146484375, 0.05849933624267578, 0.06042289733886719, 0.062346458435058594, 0.06427001953125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 6.0, 6.0, 4.0, 12.0, 10.0, 17.0, 22.0, 31.0, 40.0, 57.0, 91.0, 209.0, 439.0, 1299.0, 4339.0, 18015.0, 129246.0, 744998.0, 125895.0, 17380.0, 4195.0, 1287.0, 470.0, 188.0, 107.0, 54.0, 34.0, 29.0, 13.0, 10.0, 12.0, 8.0, 4.0, 5.0, 8.0, 3.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046356201171875, -0.04472923278808594, -0.043102264404296875, -0.04147529602050781, -0.03984832763671875, -0.03822135925292969, -0.036594390869140625, -0.03496742248535156, -0.0333404541015625, -0.03171348571777344, -0.030086517333984375, -0.028459548950195312, -0.02683258056640625, -0.025205612182617188, -0.023578643798828125, -0.021951675415039062, -0.02032470703125, -0.018697738647460938, -0.017070770263671875, -0.015443801879882812, -0.01381683349609375, -0.012189865112304688, -0.010562896728515625, -0.008935928344726562, -0.0073089599609375, -0.0056819915771484375, -0.004055023193359375, -0.0024280548095703125, -0.00080108642578125, 0.0008258819580078125, 0.002452850341796875, 0.0040798187255859375, 0.005706787109375, 0.0073337554931640625, 0.008960723876953125, 0.010587692260742188, 0.01221466064453125, 0.013841629028320312, 0.015468597412109375, 0.017095565795898438, 0.0187225341796875, 0.020349502563476562, 0.021976470947265625, 0.023603439331054688, 0.02523040771484375, 0.026857376098632812, 0.028484344482421875, 0.030111312866210938, 0.03173828125, 0.03336524963378906, 0.034992218017578125, 0.03661918640136719, 0.03824615478515625, 0.03987312316894531, 0.041500091552734375, 0.04312705993652344, 0.0447540283203125, 0.04638099670410156, 0.048007965087890625, 0.04963493347167969, 0.05126190185546875, 0.05288887023925781, 0.054515838623046875, 0.05614280700683594, 0.057769775390625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 6.0, 5.0, 13.0, 7.0, 7.0, 13.0, 15.0, 13.0, 12.0, 22.0, 24.0, 18.0, 38.0, 36.0, 44.0, 41.0, 48.0, 58.0, 28.0, 43.0, 46.0, 58.0, 49.0, 46.0, 39.0, 48.0, 35.0, 32.0, 29.0, 23.0, 15.0, 18.0, 19.0, 7.0, 12.0, 10.0, 6.0, 4.0, 8.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.12200927734375, -0.11800289154052734, -0.11399650573730469, -0.10999011993408203, -0.10598373413085938, -0.10197734832763672, -0.09797096252441406, -0.0939645767211914, -0.08995819091796875, -0.0859518051147461, -0.08194541931152344, -0.07793903350830078, -0.07393264770507812, -0.06992626190185547, -0.06591987609863281, -0.061913490295410156, -0.0579071044921875, -0.053900718688964844, -0.04989433288574219, -0.04588794708251953, -0.041881561279296875, -0.03787517547607422, -0.03386878967285156, -0.029862403869628906, -0.02585601806640625, -0.021849632263183594, -0.017843246459960938, -0.013836860656738281, -0.009830474853515625, -0.005824089050292969, -0.0018177032470703125, 0.0021886825561523438, 0.006195068359375, 0.010201454162597656, 0.014207839965820312, 0.01821422576904297, 0.022220611572265625, 0.02622699737548828, 0.030233383178710938, 0.034239768981933594, 0.03824615478515625, 0.042252540588378906, 0.04625892639160156, 0.05026531219482422, 0.054271697998046875, 0.05827808380126953, 0.06228446960449219, 0.06629085540771484, 0.0702972412109375, 0.07430362701416016, 0.07831001281738281, 0.08231639862060547, 0.08632278442382812, 0.09032917022705078, 0.09433555603027344, 0.0983419418334961, 0.10234832763671875, 0.1063547134399414, 0.11036109924316406, 0.11436748504638672, 0.11837387084960938, 0.12238025665283203, 0.1263866424560547, 0.13039302825927734, 0.1343994140625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 6.0, 2.0, 11.0, 8.0, 10.0, 14.0, 9.0, 26.0, 35.0, 49.0, 68.0, 114.0, 142.0, 241.0, 376.0, 622.0, 1032.0, 1910.0, 3602.0, 8001.0, 22183.0, 105460.0, 628460.0, 219045.0, 35580.0, 11047.0, 4774.0, 2402.0, 1274.0, 688.0, 486.0, 270.0, 186.0, 125.0, 85.0, 53.0, 39.0, 17.0, 21.0, 25.0, 10.0, 12.0, 12.0, 11.0, 5.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.016357421875, -0.01588571071624756, -0.015413999557495117, -0.014942288398742676, -0.014470577239990234, -0.013998866081237793, -0.013527154922485352, -0.01305544376373291, -0.012583732604980469, -0.012112021446228027, -0.011640310287475586, -0.011168599128723145, -0.010696887969970703, -0.010225176811218262, -0.00975346565246582, -0.009281754493713379, -0.008810043334960938, -0.008338332176208496, -0.007866621017456055, -0.007394909858703613, -0.006923198699951172, -0.0064514875411987305, -0.005979776382446289, -0.005508065223693848, -0.005036354064941406, -0.004564642906188965, -0.0040929317474365234, -0.003621220588684082, -0.0031495094299316406, -0.0026777982711791992, -0.002206087112426758, -0.0017343759536743164, -0.001262664794921875, -0.0007909536361694336, -0.0003192424774169922, 0.00015246868133544922, 0.0006241798400878906, 0.001095890998840332, 0.0015676021575927734, 0.002039313316345215, 0.0025110244750976562, 0.0029827356338500977, 0.003454446792602539, 0.0039261579513549805, 0.004397869110107422, 0.004869580268859863, 0.005341291427612305, 0.005813002586364746, 0.0062847137451171875, 0.006756424903869629, 0.00722813606262207, 0.007699847221374512, 0.008171558380126953, 0.008643269538879395, 0.009114980697631836, 0.009586691856384277, 0.010058403015136719, 0.01053011417388916, 0.011001825332641602, 0.011473536491394043, 0.011945247650146484, 0.012416958808898926, 0.012888669967651367, 0.013360381126403809, 0.01383209228515625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 4.0, 16.0, 8.0, 19.0, 26.0, 45.0, 43.0, 90.0, 89.0, 124.0, 108.0, 124.0, 90.0, 70.0, 48.0, 33.0, 19.0, 10.0, 12.0, 9.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.510185241699219e-06, -7.243826985359192e-06, -6.977468729019165e-06, -6.711110472679138e-06, -6.444752216339111e-06, -6.1783939599990845e-06, -5.912035703659058e-06, -5.645677447319031e-06, -5.379319190979004e-06, -5.112960934638977e-06, -4.84660267829895e-06, -4.580244421958923e-06, -4.3138861656188965e-06, -4.04752790927887e-06, -3.7811696529388428e-06, -3.514811396598816e-06, -3.248453140258789e-06, -2.982094883918762e-06, -2.7157366275787354e-06, -2.4493783712387085e-06, -2.1830201148986816e-06, -1.9166618585586548e-06, -1.650303602218628e-06, -1.383945345878601e-06, -1.1175870895385742e-06, -8.512288331985474e-07, -5.848705768585205e-07, -3.1851232051849365e-07, -5.21540641784668e-08, 2.1420419216156006e-07, 4.805624485015869e-07, 7.469207048416138e-07, 1.0132789611816406e-06, 1.2796372175216675e-06, 1.5459954738616943e-06, 1.8123537302017212e-06, 2.078711986541748e-06, 2.345070242881775e-06, 2.6114284992218018e-06, 2.8777867555618286e-06, 3.1441450119018555e-06, 3.4105032682418823e-06, 3.676861524581909e-06, 3.943219780921936e-06, 4.209578037261963e-06, 4.47593629360199e-06, 4.742294549942017e-06, 5.0086528062820435e-06, 5.27501106262207e-06, 5.541369318962097e-06, 5.807727575302124e-06, 6.074085831642151e-06, 6.340444087982178e-06, 6.606802344322205e-06, 6.8731606006622314e-06, 7.139518857002258e-06, 7.405877113342285e-06, 7.672235369682312e-06, 7.938593626022339e-06, 8.204951882362366e-06, 8.471310138702393e-06, 8.73766839504242e-06, 9.004026651382446e-06, 9.270384907722473e-06, 9.5367431640625e-06]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 6.0, 7.0, 6.0, 6.0, 14.0, 19.0, 26.0, 51.0, 71.0, 134.0, 218.0, 479.0, 968.0, 2269.0, 5625.0, 19753.0, 169328.0, 739909.0, 88020.0, 13751.0, 4472.0, 1768.0, 777.0, 382.0, 191.0, 112.0, 71.0, 42.0, 28.0, 16.0, 10.0, 5.0, 7.0, 3.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0249481201171875, -0.024126768112182617, -0.023305416107177734, -0.02248406410217285, -0.02166271209716797, -0.020841360092163086, -0.020020008087158203, -0.01919865608215332, -0.018377304077148438, -0.017555952072143555, -0.016734600067138672, -0.01591324806213379, -0.015091896057128906, -0.014270544052124023, -0.01344919204711914, -0.012627840042114258, -0.011806488037109375, -0.010985136032104492, -0.01016378402709961, -0.009342432022094727, -0.008521080017089844, -0.007699728012084961, -0.006878376007080078, -0.006057024002075195, -0.0052356719970703125, -0.00441431999206543, -0.003592967987060547, -0.002771615982055664, -0.0019502639770507812, -0.0011289119720458984, -0.0003075599670410156, 0.0005137920379638672, 0.00133514404296875, 0.002156496047973633, 0.0029778480529785156, 0.0037992000579833984, 0.004620552062988281, 0.005441904067993164, 0.006263256072998047, 0.00708460807800293, 0.007905960083007812, 0.008727312088012695, 0.009548664093017578, 0.010370016098022461, 0.011191368103027344, 0.012012720108032227, 0.01283407211303711, 0.013655424118041992, 0.014476776123046875, 0.015298128128051758, 0.01611948013305664, 0.016940832138061523, 0.017762184143066406, 0.01858353614807129, 0.019404888153076172, 0.020226240158081055, 0.021047592163085938, 0.02186894416809082, 0.022690296173095703, 0.023511648178100586, 0.02433300018310547, 0.02515435218811035, 0.025975704193115234, 0.026797056198120117, 0.027618408203125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 2.0, 8.0, 7.0, 11.0, 16.0, 24.0, 33.0, 72.0, 92.0, 148.0, 185.0, 126.0, 98.0, 62.0, 48.0, 20.0, 15.0, 10.0, 5.0, 2.0, 7.0, 2.0, 4.0, 0.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00662994384765625, -0.0064321160316467285, -0.006234288215637207, -0.0060364603996276855, -0.005838632583618164, -0.005640804767608643, -0.005442976951599121, -0.0052451491355896, -0.005047321319580078, -0.004849493503570557, -0.004651665687561035, -0.004453837871551514, -0.004256010055541992, -0.004058182239532471, -0.0038603544235229492, -0.0036625266075134277, -0.0034646987915039062, -0.0032668709754943848, -0.0030690431594848633, -0.002871215343475342, -0.0026733875274658203, -0.002475559711456299, -0.0022777318954467773, -0.002079904079437256, -0.0018820762634277344, -0.0016842484474182129, -0.0014864206314086914, -0.00128859281539917, -0.0010907649993896484, -0.000892937183380127, -0.0006951093673706055, -0.000497281551361084, -0.0002994537353515625, -0.00010162591934204102, 9.620189666748047e-05, 0.00029402971267700195, 0.0004918575286865234, 0.0006896853446960449, 0.0008875131607055664, 0.0010853409767150879, 0.0012831687927246094, 0.0014809966087341309, 0.0016788244247436523, 0.0018766522407531738, 0.0020744800567626953, 0.002272307872772217, 0.0024701356887817383, 0.0026679635047912598, 0.0028657913208007812, 0.0030636191368103027, 0.0032614469528198242, 0.0034592747688293457, 0.003657102584838867, 0.0038549304008483887, 0.00405275821685791, 0.004250586032867432, 0.004448413848876953, 0.004646241664886475, 0.004844069480895996, 0.005041897296905518, 0.005239725112915039, 0.0054375529289245605, 0.005635380744934082, 0.0058332085609436035, 0.006031036376953125]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 9.0, 10.0, 15.0, 51.0, 60.0, 99.0, 140.0, 152.0, 132.0, 134.0, 74.0, 56.0, 32.0, 18.0, 12.0, 7.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2007479965686798, -0.19636370241641998, -0.19197940826416016, -0.18759509921073914, -0.1832108050584793, -0.17882651090621948, -0.17444221675395966, -0.17005792260169983, -0.16567362844944, -0.16128933429718018, -0.15690504014492035, -0.15252074599266052, -0.1481364369392395, -0.14375214278697968, -0.13936784863471985, -0.13498355448246002, -0.1305992603302002, -0.12621496617794037, -0.12183066457509995, -0.11744637042284012, -0.11306207627058029, -0.10867777466773987, -0.10429348051548004, -0.09990918636322021, -0.0955248773097992, -0.09114058315753937, -0.08675628155469894, -0.08237198740243912, -0.07798769325017929, -0.07360339164733887, -0.06921909749507904, -0.06483480334281921, -0.060450516641139984, -0.05606621876358986, -0.05168192461133003, -0.04729762673377991, -0.04291333258152008, -0.038529034703969955, -0.03414473682641983, -0.029760440811514854, -0.02537614479660988, -0.020991848781704903, -0.016607552766799927, -0.012223254889249802, -0.007838958874344826, -0.00345466285943985, 0.0009296350181102753, 0.005313931033015251, 0.009698227047920227, 0.014082523062825203, 0.01846681907773018, 0.022851116955280304, 0.02723541297018528, 0.031619708985090256, 0.03600400686264038, 0.04038830101490021, 0.04477259889245033, 0.04915689677000046, 0.053541190922260284, 0.05792548879981041, 0.062309786677360535, 0.06669408082962036, 0.07107837498188019, 0.07546267658472061, 0.07984697073698044]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 2.0, 5.0, 2.0, 6.0, 6.0, 9.0, 14.0, 10.0, 21.0, 21.0, 28.0, 24.0, 35.0, 36.0, 40.0, 41.0, 39.0, 49.0, 49.0, 58.0, 61.0, 41.0, 49.0, 44.0, 41.0, 40.0, 30.0, 42.0, 30.0, 23.0, 23.0, 23.0, 14.0, 16.0, 10.0, 10.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06404274702072144, -0.062102433294057846, -0.06016211956739426, -0.05822180584073067, -0.05628149211406708, -0.05434117838740349, -0.0524008646607399, -0.05046054720878601, -0.04852023720741272, -0.04657992348074913, -0.04463960975408554, -0.04269929602742195, -0.04075898230075836, -0.03881866857409477, -0.03687835484743118, -0.034938037395477295, -0.032997723668813705, -0.031057409942150116, -0.029117096215486526, -0.027176782488822937, -0.025236468762159348, -0.023296155035495758, -0.02135583944618702, -0.01941552571952343, -0.01747521199285984, -0.015534898266196251, -0.013594584539532661, -0.011654269881546497, -0.009713956154882908, -0.007773642428219318, -0.005833327770233154, -0.003893014043569565, -0.0019527003169059753, -1.238635741174221e-05, 0.001927927602082491, 0.0038682417944073677, 0.005808555521070957, 0.007748869247734547, 0.00968918390572071, 0.0116294976323843, 0.01356981135904789, 0.01551012508571148, 0.01745043881237507, 0.019390754401683807, 0.021331068128347397, 0.023271381855010986, 0.025211695581674576, 0.027152009308338165, 0.029092323035001755, 0.031032636761665344, 0.032972950488328934, 0.03491326421499252, 0.03685357794165611, 0.0387938916683197, 0.04073420912027359, 0.04267451912164688, 0.04461483657360077, 0.04655515030026436, 0.04849546402692795, 0.05043577775359154, 0.05237609148025513, 0.054316405206918716, 0.056256718933582306, 0.058197036385536194, 0.060137346386909485]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 5.0, 2.0, 6.0, 9.0, 9.0, 17.0, 7.0, 33.0, 45.0, 33.0, 67.0, 73.0, 120.0, 185.0, 272.0, 364.0, 586.0, 874.0, 1475.0, 2388.0, 4032.0, 7352.0, 13613.0, 29518.0, 87082.0, 331149.0, 393576.0, 106481.0, 34402.0, 15107.0, 8017.0, 4457.0, 2571.0, 1554.0, 1006.0, 647.0, 440.0, 296.0, 209.0, 146.0, 91.0, 63.0, 45.0, 37.0, 25.0, 23.0, 25.0, 8.0, 8.0, 5.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05548095703125, -0.05363655090332031, -0.051792144775390625, -0.04994773864746094, -0.04810333251953125, -0.04625892639160156, -0.044414520263671875, -0.04257011413574219, -0.0407257080078125, -0.03888130187988281, -0.037036895751953125, -0.03519248962402344, -0.03334808349609375, -0.03150367736816406, -0.029659271240234375, -0.027814865112304688, -0.025970458984375, -0.024126052856445312, -0.022281646728515625, -0.020437240600585938, -0.01859283447265625, -0.016748428344726562, -0.014904022216796875, -0.013059616088867188, -0.0112152099609375, -0.009370803833007812, -0.007526397705078125, -0.0056819915771484375, -0.00383758544921875, -0.0019931793212890625, -0.000148773193359375, 0.0016956329345703125, 0.0035400390625, 0.0053844451904296875, 0.007228851318359375, 0.009073257446289062, 0.01091766357421875, 0.012762069702148438, 0.014606475830078125, 0.016450881958007812, 0.0182952880859375, 0.020139694213867188, 0.021984100341796875, 0.023828506469726562, 0.02567291259765625, 0.027517318725585938, 0.029361724853515625, 0.031206130981445312, 0.033050537109375, 0.03489494323730469, 0.036739349365234375, 0.03858375549316406, 0.04042816162109375, 0.04227256774902344, 0.044116973876953125, 0.04596138000488281, 0.0478057861328125, 0.04965019226074219, 0.051494598388671875, 0.05333900451660156, 0.05518341064453125, 0.05702781677246094, 0.058872222900390625, 0.06071662902832031, 0.06256103515625]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 5.0, 5.0, 6.0, 4.0, 10.0, 14.0, 14.0, 17.0, 28.0, 24.0, 30.0, 24.0, 42.0, 35.0, 45.0, 44.0, 51.0, 72.0, 45.0, 49.0, 47.0, 47.0, 46.0, 48.0, 30.0, 37.0, 36.0, 26.0, 18.0, 15.0, 32.0, 14.0, 16.0, 9.0, 7.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.15087890625, -0.1466541290283203, -0.14242935180664062, -0.13820457458496094, -0.13397979736328125, -0.12975502014160156, -0.12553024291992188, -0.12130546569824219, -0.1170806884765625, -0.11285591125488281, -0.10863113403320312, -0.10440635681152344, -0.10018157958984375, -0.09595680236816406, -0.09173202514648438, -0.08750724792480469, -0.083282470703125, -0.07905769348144531, -0.07483291625976562, -0.07060813903808594, -0.06638336181640625, -0.06215858459472656, -0.057933807373046875, -0.05370903015136719, -0.0494842529296875, -0.04525947570800781, -0.041034698486328125, -0.03680992126464844, -0.03258514404296875, -0.028360366821289062, -0.024135589599609375, -0.019910812377929688, -0.01568603515625, -0.011461257934570312, -0.007236480712890625, -0.0030117034912109375, 0.00121307373046875, 0.0054378509521484375, 0.009662628173828125, 0.013887405395507812, 0.0181121826171875, 0.022336959838867188, 0.026561737060546875, 0.030786514282226562, 0.03501129150390625, 0.03923606872558594, 0.043460845947265625, 0.04768562316894531, 0.051910400390625, 0.05613517761230469, 0.060359954833984375, 0.06458473205566406, 0.06880950927734375, 0.07303428649902344, 0.07725906372070312, 0.08148384094238281, 0.0857086181640625, 0.08993339538574219, 0.09415817260742188, 0.09838294982910156, 0.10260772705078125, 0.10683250427246094, 0.11105728149414062, 0.11528205871582031, 0.1195068359375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 1.0, 3.0, 4.0, 10.0, 15.0, 12.0, 22.0, 22.0, 29.0, 44.0, 41.0, 97.0, 107.0, 213.0, 441.0, 1249.0, 5551.0, 37811.0, 715767.0, 263285.0, 18900.0, 3208.0, 797.0, 357.0, 173.0, 107.0, 93.0, 53.0, 42.0, 24.0, 22.0, 16.0, 9.0, 4.0, 6.0, 5.0, 4.0, 2.0, 8.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.1610107421875, -0.1562519073486328, -0.15149307250976562, -0.14673423767089844, -0.14197540283203125, -0.13721656799316406, -0.13245773315429688, -0.1276988983154297, -0.1229400634765625, -0.11818122863769531, -0.11342239379882812, -0.10866355895996094, -0.10390472412109375, -0.09914588928222656, -0.09438705444335938, -0.08962821960449219, -0.084869384765625, -0.08011054992675781, -0.07535171508789062, -0.07059288024902344, -0.06583404541015625, -0.06107521057128906, -0.056316375732421875, -0.05155754089355469, -0.0467987060546875, -0.04203987121582031, -0.037281036376953125, -0.03252220153808594, -0.02776336669921875, -0.023004531860351562, -0.018245697021484375, -0.013486862182617188, -0.00872802734375, -0.0039691925048828125, 0.000789642333984375, 0.0055484771728515625, 0.01030731201171875, 0.015066146850585938, 0.019824981689453125, 0.024583816528320312, 0.0293426513671875, 0.03410148620605469, 0.038860321044921875, 0.04361915588378906, 0.04837799072265625, 0.05313682556152344, 0.057895660400390625, 0.06265449523925781, 0.067413330078125, 0.07217216491699219, 0.07693099975585938, 0.08168983459472656, 0.08644866943359375, 0.09120750427246094, 0.09596633911132812, 0.10072517395019531, 0.1054840087890625, 0.11024284362792969, 0.11500167846679688, 0.11976051330566406, 0.12451934814453125, 0.12927818298339844, 0.13403701782226562, 0.1387958526611328, 0.1435546875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 4.0, 7.0, 4.0, 6.0, 9.0, 8.0, 11.0, 15.0, 16.0, 19.0, 33.0, 24.0, 41.0, 32.0, 28.0, 42.0, 35.0, 40.0, 46.0, 55.0, 53.0, 56.0, 43.0, 49.0, 30.0, 44.0, 21.0, 29.0, 27.0, 30.0, 28.0, 23.0, 16.0, 13.0, 14.0, 9.0, 3.0, 9.0, 11.0, 6.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1373291015625, -0.1331806182861328, -0.12903213500976562, -0.12488365173339844, -0.12073516845703125, -0.11658668518066406, -0.11243820190429688, -0.10828971862792969, -0.1041412353515625, -0.09999275207519531, -0.09584426879882812, -0.09169578552246094, -0.08754730224609375, -0.08339881896972656, -0.07925033569335938, -0.07510185241699219, -0.070953369140625, -0.06680488586425781, -0.06265640258789062, -0.05850791931152344, -0.05435943603515625, -0.05021095275878906, -0.046062469482421875, -0.04191398620605469, -0.0377655029296875, -0.03361701965332031, -0.029468536376953125, -0.025320053100585938, -0.02117156982421875, -0.017023086547851562, -0.012874603271484375, -0.008726119995117188, -0.00457763671875, -0.0004291534423828125, 0.003719329833984375, 0.007867813110351562, 0.01201629638671875, 0.016164779663085938, 0.020313262939453125, 0.024461746215820312, 0.0286102294921875, 0.03275871276855469, 0.036907196044921875, 0.04105567932128906, 0.04520416259765625, 0.04935264587402344, 0.053501129150390625, 0.05764961242675781, 0.061798095703125, 0.06594657897949219, 0.07009506225585938, 0.07424354553222656, 0.07839202880859375, 0.08254051208496094, 0.08668899536132812, 0.09083747863769531, 0.0949859619140625, 0.09913444519042969, 0.10328292846679688, 0.10743141174316406, 0.11157989501953125, 0.11572837829589844, 0.11987686157226562, 0.12402534484863281, 0.128173828125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 4.0, 11.0, 12.0, 22.0, 23.0, 33.0, 54.0, 87.0, 228.0, 548.0, 2004.0, 14981.0, 418281.0, 589725.0, 19070.0, 2377.0, 591.0, 227.0, 102.0, 57.0, 43.0, 23.0, 16.0, 11.0, 8.0, 3.0, 6.0, 0.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0438232421875, -0.04236459732055664, -0.04090595245361328, -0.03944730758666992, -0.03798866271972656, -0.0365300178527832, -0.035071372985839844, -0.033612728118896484, -0.032154083251953125, -0.030695438385009766, -0.029236793518066406, -0.027778148651123047, -0.026319503784179688, -0.024860858917236328, -0.02340221405029297, -0.02194356918334961, -0.02048492431640625, -0.01902627944946289, -0.01756763458251953, -0.016108989715576172, -0.014650344848632812, -0.013191699981689453, -0.011733055114746094, -0.010274410247802734, -0.008815765380859375, -0.007357120513916016, -0.005898475646972656, -0.004439830780029297, -0.0029811859130859375, -0.0015225410461425781, -6.389617919921875e-05, 0.0013947486877441406, 0.0028533935546875, 0.004312038421630859, 0.005770683288574219, 0.007229328155517578, 0.008687973022460938, 0.010146617889404297, 0.011605262756347656, 0.013063907623291016, 0.014522552490234375, 0.015981197357177734, 0.017439842224121094, 0.018898487091064453, 0.020357131958007812, 0.021815776824951172, 0.02327442169189453, 0.02473306655883789, 0.02619171142578125, 0.02765035629272461, 0.02910900115966797, 0.030567646026611328, 0.03202629089355469, 0.03348493576049805, 0.034943580627441406, 0.036402225494384766, 0.037860870361328125, 0.039319515228271484, 0.040778160095214844, 0.0422368049621582, 0.04369544982910156, 0.04515409469604492, 0.04661273956298828, 0.04807138442993164, 0.049530029296875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 7.0, 9.0, 7.0, 13.0, 23.0, 9.0, 27.0, 44.0, 36.0, 50.0, 90.0, 79.0, 101.0, 119.0, 78.0, 101.0, 44.0, 41.0, 32.0, 27.0, 17.0, 15.0, 12.0, 8.0, 5.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.516674041748047e-06, -3.3760443329811096e-06, -3.2354146242141724e-06, -3.094784915447235e-06, -2.954155206680298e-06, -2.8135254979133606e-06, -2.6728957891464233e-06, -2.532266080379486e-06, -2.391636371612549e-06, -2.2510066628456116e-06, -2.1103769540786743e-06, -1.969747245311737e-06, -1.8291175365447998e-06, -1.6884878277778625e-06, -1.5478581190109253e-06, -1.407228410243988e-06, -1.2665987014770508e-06, -1.1259689927101135e-06, -9.853392839431763e-07, -8.44709575176239e-07, -7.040798664093018e-07, -5.634501576423645e-07, -4.2282044887542725e-07, -2.8219074010849e-07, -1.4156103134155273e-07, -9.313225746154785e-10, 1.3969838619232178e-07, 2.8032809495925903e-07, 4.209578037261963e-07, 5.615875124931335e-07, 7.022172212600708e-07, 8.428469300270081e-07, 9.834766387939453e-07, 1.1241063475608826e-06, 1.2647360563278198e-06, 1.405365765094757e-06, 1.5459954738616943e-06, 1.6866251826286316e-06, 1.8272548913955688e-06, 1.967884600162506e-06, 2.1085143089294434e-06, 2.2491440176963806e-06, 2.389773726463318e-06, 2.530403435230255e-06, 2.6710331439971924e-06, 2.8116628527641296e-06, 2.952292561531067e-06, 3.092922270298004e-06, 3.2335519790649414e-06, 3.3741816878318787e-06, 3.514811396598816e-06, 3.655441105365753e-06, 3.7960708141326904e-06, 3.936700522899628e-06, 4.077330231666565e-06, 4.217959940433502e-06, 4.3585896492004395e-06, 4.499219357967377e-06, 4.639849066734314e-06, 4.780478775501251e-06, 4.9211084842681885e-06, 5.061738193035126e-06, 5.202367901802063e-06, 5.342997610569e-06, 5.4836273193359375e-06]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 8.0, 6.0, 7.0, 4.0, 13.0, 19.0, 21.0, 17.0, 44.0, 128.0, 275.0, 872.0, 2779.0, 13770.0, 474735.0, 536802.0, 14894.0, 2765.0, 837.0, 297.0, 122.0, 48.0, 29.0, 14.0, 15.0, 10.0, 5.0, 4.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.057586669921875, -0.05572986602783203, -0.05387306213378906, -0.052016258239746094, -0.050159454345703125, -0.048302650451660156, -0.04644584655761719, -0.04458904266357422, -0.04273223876953125, -0.04087543487548828, -0.03901863098144531, -0.037161827087402344, -0.035305023193359375, -0.033448219299316406, -0.03159141540527344, -0.02973461151123047, -0.0278778076171875, -0.02602100372314453, -0.024164199829101562, -0.022307395935058594, -0.020450592041015625, -0.018593788146972656, -0.016736984252929688, -0.014880180358886719, -0.01302337646484375, -0.011166572570800781, -0.009309768676757812, -0.007452964782714844, -0.005596160888671875, -0.0037393569946289062, -0.0018825531005859375, -2.574920654296875e-05, 0.0018310546875, 0.0036878585815429688, 0.0055446624755859375, 0.007401466369628906, 0.009258270263671875, 0.011115074157714844, 0.012971878051757812, 0.014828681945800781, 0.01668548583984375, 0.01854228973388672, 0.020399093627929688, 0.022255897521972656, 0.024112701416015625, 0.025969505310058594, 0.027826309204101562, 0.02968311309814453, 0.0315399169921875, 0.03339672088623047, 0.03525352478027344, 0.037110328674316406, 0.038967132568359375, 0.040823936462402344, 0.04268074035644531, 0.04453754425048828, 0.04639434814453125, 0.04825115203857422, 0.05010795593261719, 0.051964759826660156, 0.053821563720703125, 0.055678367614746094, 0.05753517150878906, 0.05939197540283203, 0.061248779296875]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 6.0, 4.0, 5.0, 13.0, 15.0, 14.0, 27.0, 49.0, 60.0, 72.0, 118.0, 140.0, 143.0, 87.0, 79.0, 51.0, 39.0, 15.0, 17.0, 10.0, 2.0, 1.0, 3.0, 6.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0170440673828125, -0.01652050018310547, -0.015996932983398438, -0.015473365783691406, -0.014949798583984375, -0.014426231384277344, -0.013902664184570312, -0.013379096984863281, -0.01285552978515625, -0.012331962585449219, -0.011808395385742188, -0.011284828186035156, -0.010761260986328125, -0.010237693786621094, -0.009714126586914062, -0.009190559387207031, -0.0086669921875, -0.008143424987792969, -0.0076198577880859375, -0.007096290588378906, -0.006572723388671875, -0.006049156188964844, -0.0055255889892578125, -0.005002021789550781, -0.00447845458984375, -0.003954887390136719, -0.0034313201904296875, -0.0029077529907226562, -0.002384185791015625, -0.0018606185913085938, -0.0013370513916015625, -0.0008134841918945312, -0.0002899169921875, 0.00023365020751953125, 0.0007572174072265625, 0.0012807846069335938, 0.001804351806640625, 0.0023279190063476562, 0.0028514862060546875, 0.0033750534057617188, 0.00389862060546875, 0.004422187805175781, 0.0049457550048828125, 0.005469322204589844, 0.005992889404296875, 0.006516456604003906, 0.0070400238037109375, 0.007563591003417969, 0.008087158203125, 0.008610725402832031, 0.009134292602539062, 0.009657859802246094, 0.010181427001953125, 0.010704994201660156, 0.011228561401367188, 0.011752128601074219, 0.01227569580078125, 0.012799263000488281, 0.013322830200195312, 0.013846397399902344, 0.014369964599609375, 0.014893531799316406, 0.015417098999023438, 0.01594066619873047, 0.0164642333984375]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 27.0, 108.0, 352.0, 328.0, 146.0, 38.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2014520168304443, -1.1774336099624634, -1.1534150838851929, -1.129396677017212, -1.1053781509399414, -1.0813597440719604, -1.0573413372039795, -1.033322811126709, -1.009304404258728, -0.9852859377861023, -0.9612674713134766, -0.9372490644454956, -0.9132305979728699, -0.8892121315002441, -0.8651936650276184, -0.8411751985549927, -0.8171567916870117, -0.793138325214386, -0.7691198587417603, -0.7451014518737793, -0.7210829854011536, -0.6970645189285278, -0.6730460524559021, -0.6490275859832764, -0.6250091195106506, -0.6009906530380249, -0.5769721865653992, -0.5529537796974182, -0.5289353132247925, -0.5049168467521667, -0.480898380279541, -0.45687994360923767, -0.4328615367412567, -0.408843070268631, -0.38482463359832764, -0.3608061671257019, -0.33678773045539856, -0.3127692639827728, -0.2887508273124695, -0.26473236083984375, -0.2407139092683792, -0.21669545769691467, -0.19267700612545013, -0.1686585545539856, -0.14464008808135986, -0.12062164396047592, -0.09660318493843079, -0.07258473336696625, -0.04856628179550171, -0.02454782836139202, -0.0005293749272823334, 0.023489080369472504, 0.04750753194093704, 0.07152598351240158, 0.09554444253444672, 0.11956289410591125, 0.1435813456773758, 0.16759979724884033, 0.19161824882030487, 0.2156367003917694, 0.23965516686439514, 0.2636736035346985, 0.2876920700073242, 0.31171053647994995, 0.3357289731502533]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 5.0, 6.0, 4.0, 5.0, 15.0, 9.0, 14.0, 18.0, 29.0, 22.0, 27.0, 22.0, 30.0, 30.0, 41.0, 53.0, 41.0, 49.0, 42.0, 49.0, 54.0, 48.0, 44.0, 44.0, 42.0, 37.0, 33.0, 24.0, 29.0, 32.0, 27.0, 18.0, 18.0, 10.0, 12.0, 8.0, 7.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.23862014710903168, -0.23129092156887054, -0.2239616960287094, -0.21663247048854828, -0.20930324494838715, -0.20197400450706482, -0.1946447789669037, -0.18731555342674255, -0.17998632788658142, -0.1726571023464203, -0.16532787680625916, -0.15799865126609802, -0.1506694257259369, -0.14334020018577576, -0.13601097464561462, -0.1286817342042923, -0.12135251611471176, -0.11402329057455063, -0.1066940650343895, -0.09936483204364777, -0.09203560650348663, -0.0847063809633255, -0.07737715542316437, -0.07004792988300323, -0.0627187043428421, -0.05538947880268097, -0.04806024953722954, -0.040731023997068405, -0.033401794731616974, -0.02607256919145584, -0.018743343651294708, -0.011414114385843277, -0.004084885120391846, 0.003244341816753149, 0.010573568753898144, 0.01790279522538185, 0.025232022628188133, 0.032561250030994415, 0.03989047557115555, 0.04721970483660698, 0.05454893037676811, 0.061878155916929245, 0.06920738518238068, 0.07653661072254181, 0.08386583626270294, 0.09119506180286407, 0.09852428734302521, 0.10585352033376694, 0.11318274587392807, 0.1205119714140892, 0.12784120440483093, 0.13517042994499207, 0.1424996554851532, 0.14982888102531433, 0.15715810656547546, 0.1644873321056366, 0.17181655764579773, 0.17914578318595886, 0.18647500872612, 0.19380423426628113, 0.20113345980644226, 0.2084626853466034, 0.21579191088676453, 0.22312115132808685, 0.23045037686824799]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 11.0, 9.0, 13.0, 15.0, 23.0, 31.0, 27.0, 60.0, 93.0, 129.0, 245.0, 458.0, 932.0, 2012.0, 4507.0, 12198.0, 54653.0, 1149307.0, 2792097.0, 146474.0, 19365.0, 6480.0, 2542.0, 1209.0, 558.0, 298.0, 167.0, 108.0, 63.0, 49.0, 34.0, 23.0, 19.0, 16.0, 10.0, 8.0, 9.0, 4.0, 4.0, 4.0, 6.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1455078125, -0.1406879425048828, -0.13586807250976562, -0.13104820251464844, -0.12622833251953125, -0.12140846252441406, -0.11658859252929688, -0.11176872253417969, -0.1069488525390625, -0.10212898254394531, -0.09730911254882812, -0.09248924255371094, -0.08766937255859375, -0.08284950256347656, -0.07802963256835938, -0.07320976257324219, -0.068389892578125, -0.06357002258300781, -0.058750152587890625, -0.05393028259277344, -0.04911041259765625, -0.04429054260253906, -0.039470672607421875, -0.03465080261230469, -0.0298309326171875, -0.025011062622070312, -0.020191192626953125, -0.015371322631835938, -0.01055145263671875, -0.0057315826416015625, -0.000911712646484375, 0.0039081573486328125, 0.00872802734375, 0.013547897338867188, 0.018367767333984375, 0.023187637329101562, 0.02800750732421875, 0.03282737731933594, 0.037647247314453125, 0.04246711730957031, 0.0472869873046875, 0.05210685729980469, 0.056926727294921875, 0.06174659729003906, 0.06656646728515625, 0.07138633728027344, 0.07620620727539062, 0.08102607727050781, 0.085845947265625, 0.09066581726074219, 0.09548568725585938, 0.10030555725097656, 0.10512542724609375, 0.10994529724121094, 0.11476516723632812, 0.11958503723144531, 0.1244049072265625, 0.1292247772216797, 0.13404464721679688, 0.13886451721191406, 0.14368438720703125, 0.14850425720214844, 0.15332412719726562, 0.1581439971923828, 0.1629638671875]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 3.0, 7.0, 6.0, 8.0, 8.0, 4.0, 6.0, 14.0, 18.0, 21.0, 22.0, 28.0, 24.0, 20.0, 42.0, 48.0, 36.0, 55.0, 46.0, 52.0, 55.0, 56.0, 44.0, 40.0, 43.0, 43.0, 37.0, 24.0, 30.0, 31.0, 20.0, 23.0, 19.0, 24.0, 13.0, 8.0, 7.0, 9.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06585693359375, -0.06384086608886719, -0.061824798583984375, -0.05980873107910156, -0.05779266357421875, -0.05577659606933594, -0.053760528564453125, -0.05174446105957031, -0.0497283935546875, -0.04771232604980469, -0.045696258544921875, -0.04368019104003906, -0.04166412353515625, -0.03964805603027344, -0.037631988525390625, -0.03561592102050781, -0.033599853515625, -0.03158378601074219, -0.029567718505859375, -0.027551651000976562, -0.02553558349609375, -0.023519515991210938, -0.021503448486328125, -0.019487380981445312, -0.0174713134765625, -0.015455245971679688, -0.013439178466796875, -0.011423110961914062, -0.00940704345703125, -0.0073909759521484375, -0.005374908447265625, -0.0033588409423828125, -0.0013427734375, 0.0006732940673828125, 0.002689361572265625, 0.0047054290771484375, 0.00672149658203125, 0.008737564086914062, 0.010753631591796875, 0.012769699096679688, 0.0147857666015625, 0.016801834106445312, 0.018817901611328125, 0.020833969116210938, 0.02285003662109375, 0.024866104125976562, 0.026882171630859375, 0.028898239135742188, 0.030914306640625, 0.03293037414550781, 0.034946441650390625, 0.03696250915527344, 0.03897857666015625, 0.04099464416503906, 0.043010711669921875, 0.04502677917480469, 0.0470428466796875, 0.04905891418457031, 0.051074981689453125, 0.05309104919433594, 0.05510711669921875, 0.05712318420410156, 0.059139251708984375, 0.06115531921386719, 0.06317138671875]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 8.0, 7.0, 14.0, 18.0, 24.0, 50.0, 59.0, 111.0, 209.0, 498.0, 1689.0, 8866.0, 110193.0, 3951781.0, 109228.0, 8790.0, 1731.0, 505.0, 206.0, 94.0, 65.0, 46.0, 25.0, 21.0, 9.0, 10.0, 4.0, 9.0, 0.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.295166015625, -0.2854881286621094, -0.27581024169921875, -0.2661323547363281, -0.2564544677734375, -0.24677658081054688, -0.23709869384765625, -0.22742080688476562, -0.217742919921875, -0.20806503295898438, -0.19838714599609375, -0.18870925903320312, -0.1790313720703125, -0.16935348510742188, -0.15967559814453125, -0.14999771118164062, -0.14031982421875, -0.13064193725585938, -0.12096405029296875, -0.11128616333007812, -0.1016082763671875, -0.09193038940429688, -0.08225250244140625, -0.07257461547851562, -0.062896728515625, -0.053218841552734375, -0.04354095458984375, -0.033863067626953125, -0.0241851806640625, -0.014507293701171875, -0.00482940673828125, 0.004848480224609375, 0.0145263671875, 0.024204254150390625, 0.03388214111328125, 0.043560028076171875, 0.0532379150390625, 0.06291580200195312, 0.07259368896484375, 0.08227157592773438, 0.091949462890625, 0.10162734985351562, 0.11130523681640625, 0.12098312377929688, 0.1306610107421875, 0.14033889770507812, 0.15001678466796875, 0.15969467163085938, 0.16937255859375, 0.17905044555664062, 0.18872833251953125, 0.19840621948242188, 0.2080841064453125, 0.21776199340820312, 0.22743988037109375, 0.23711776733398438, 0.246795654296875, 0.2564735412597656, 0.26615142822265625, 0.2758293151855469, 0.2855072021484375, 0.2951850891113281, 0.30486297607421875, 0.3145408630371094, 0.32421875]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 6.0, 6.0, 7.0, 8.0, 14.0, 23.0, 15.0, 34.0, 39.0, 48.0, 84.0, 120.0, 198.0, 348.0, 526.0, 732.0, 648.0, 422.0, 275.0, 158.0, 81.0, 77.0, 55.0, 40.0, 27.0, 18.0, 13.0, 13.0, 7.0, 11.0, 7.0, 8.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.052947998046875, -0.05154561996459961, -0.05014324188232422, -0.04874086380004883, -0.04733848571777344, -0.04593610763549805, -0.044533729553222656, -0.043131351470947266, -0.041728973388671875, -0.040326595306396484, -0.038924217224121094, -0.0375218391418457, -0.03611946105957031, -0.03471708297729492, -0.03331470489501953, -0.03191232681274414, -0.03050994873046875, -0.02910757064819336, -0.02770519256591797, -0.026302814483642578, -0.024900436401367188, -0.023498058319091797, -0.022095680236816406, -0.020693302154541016, -0.019290924072265625, -0.017888545989990234, -0.016486167907714844, -0.015083789825439453, -0.013681411743164062, -0.012279033660888672, -0.010876655578613281, -0.00947427749633789, -0.0080718994140625, -0.006669521331787109, -0.005267143249511719, -0.003864765167236328, -0.0024623870849609375, -0.0010600090026855469, 0.00034236907958984375, 0.0017447471618652344, 0.003147125244140625, 0.004549503326416016, 0.005951881408691406, 0.007354259490966797, 0.008756637573242188, 0.010159015655517578, 0.011561393737792969, 0.01296377182006836, 0.01436614990234375, 0.01576852798461914, 0.01717090606689453, 0.018573284149169922, 0.019975662231445312, 0.021378040313720703, 0.022780418395996094, 0.024182796478271484, 0.025585174560546875, 0.026987552642822266, 0.028389930725097656, 0.029792308807373047, 0.031194686889648438, 0.03259706497192383, 0.03399944305419922, 0.03540182113647461, 0.03680419921875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 4.0, 1.0, 5.0, 10.0, 7.0, 9.0, 7.0, 13.0, 15.0, 22.0, 26.0, 32.0, 34.0, 41.0, 50.0, 55.0, 48.0, 56.0, 64.0, 69.0, 51.0, 54.0, 54.0, 43.0, 36.0, 49.0, 27.0, 19.0, 20.0, 17.0, 8.0, 10.0, 8.0, 5.0, 11.0, 5.0, 2.0, 4.0, 2.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.1027679517865181, -0.09981711208820343, -0.09686627238988876, -0.0939154252409935, -0.09096458554267883, -0.08801374584436417, -0.0850629061460495, -0.08211205899715424, -0.07916121929883957, -0.0762103796005249, -0.07325953990221024, -0.07030869275331497, -0.0673578530550003, -0.06440701335668564, -0.06145617365837097, -0.058505330234766006, -0.05555449053645134, -0.05260365083813667, -0.04965280741453171, -0.04670196771621704, -0.043751124292612076, -0.04080028459429741, -0.037849441170692444, -0.03489860147237778, -0.03194776177406311, -0.028996920213103294, -0.02604607865214348, -0.02309523895382881, -0.020144395530223846, -0.01719355583190918, -0.014242714270949364, -0.011291872709989548, -0.008341029286384583, -0.0053901877254247665, -0.002439346630126238, 0.0005114944651722908, 0.0034623360261321068, 0.006413177587091923, 0.009364018216729164, 0.01231485977768898, 0.015265701338648796, 0.018216542899608612, 0.021167384460568428, 0.024118226021528244, 0.02706906571984291, 0.030019909143447876, 0.03297074884176254, 0.03592158854007721, 0.038872431963682175, 0.04182327166199684, 0.04477411508560181, 0.04772495478391647, 0.05067579820752144, 0.053626637905836105, 0.05657748132944107, 0.05952832102775574, 0.062479160726070404, 0.06543000042438507, 0.06838084012269974, 0.071331687271595, 0.07428252696990967, 0.07723336666822433, 0.080184206366539, 0.08313505351543427, 0.08608589321374893]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 4.0, 3.0, 14.0, 7.0, 12.0, 7.0, 17.0, 20.0, 11.0, 26.0, 31.0, 22.0, 26.0, 33.0, 33.0, 38.0, 44.0, 44.0, 54.0, 54.0, 41.0, 44.0, 40.0, 46.0, 46.0, 35.0, 42.0, 27.0, 34.0, 19.0, 20.0, 14.0, 11.0, 19.0, 20.0, 12.0, 10.0, 10.0, 5.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.085527203977108, -0.08281069993972778, -0.08009420335292816, -0.07737770676612854, -0.07466120272874832, -0.0719446986913681, -0.06922820210456848, -0.06651170551776886, -0.06379520148038864, -0.06107870116829872, -0.0583622008562088, -0.05564570054411888, -0.05292920023202896, -0.05021269991993904, -0.04749619960784912, -0.0447796992957592, -0.04206319898366928, -0.03934669867157936, -0.03663019835948944, -0.03391369804739952, -0.0311971977353096, -0.02848069742321968, -0.02576419711112976, -0.02304769679903984, -0.02033119648694992, -0.01761469617486, -0.01489819586277008, -0.01218169555068016, -0.00946519523859024, -0.0067486949265003204, -0.0040321946144104, -0.0013156943023204803, 0.0014008134603500366, 0.004117313772439957, 0.006833814084529877, 0.009550314396619797, 0.012266814708709717, 0.014983315020799637, 0.017699815332889557, 0.020416315644979477, 0.023132815957069397, 0.025849316269159317, 0.028565816581249237, 0.03128231689333916, 0.03399881720542908, 0.036715317517519, 0.03943181782960892, 0.04214831814169884, 0.04486481845378876, 0.04758131876587868, 0.0502978190779686, 0.05301431939005852, 0.05573081970214844, 0.05844732001423836, 0.06116382032632828, 0.0638803243637085, 0.06659682095050812, 0.06931331753730774, 0.07202982157468796, 0.07474632561206818, 0.0774628221988678, 0.08017931878566742, 0.08289582282304764, 0.08561232686042786, 0.08832882344722748]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 10.0, 15.0, 10.0, 23.0, 34.0, 35.0, 61.0, 107.0, 153.0, 246.0, 392.0, 724.0, 1259.0, 2242.0, 4099.0, 8658.0, 23162.0, 127062.0, 655597.0, 176433.0, 28087.0, 9813.0, 4582.0, 2463.0, 1313.0, 757.0, 436.0, 303.0, 173.0, 103.0, 78.0, 43.0, 23.0, 30.0, 10.0, 8.0, 8.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03851318359375, -0.037210941314697266, -0.03590869903564453, -0.0346064567565918, -0.03330421447753906, -0.03200197219848633, -0.030699729919433594, -0.02939748764038086, -0.028095245361328125, -0.02679300308227539, -0.025490760803222656, -0.024188518524169922, -0.022886276245117188, -0.021584033966064453, -0.02028179168701172, -0.018979549407958984, -0.01767730712890625, -0.016375064849853516, -0.015072822570800781, -0.013770580291748047, -0.012468338012695312, -0.011166095733642578, -0.009863853454589844, -0.00856161117553711, -0.007259368896484375, -0.005957126617431641, -0.004654884338378906, -0.003352642059326172, -0.0020503997802734375, -0.0007481575012207031, 0.0005540847778320312, 0.0018563270568847656, 0.0031585693359375, 0.004460811614990234, 0.005763053894042969, 0.007065296173095703, 0.008367538452148438, 0.009669780731201172, 0.010972023010253906, 0.01227426528930664, 0.013576507568359375, 0.01487874984741211, 0.016180992126464844, 0.017483234405517578, 0.018785476684570312, 0.020087718963623047, 0.02138996124267578, 0.022692203521728516, 0.02399444580078125, 0.025296688079833984, 0.02659893035888672, 0.027901172637939453, 0.029203414916992188, 0.030505657196044922, 0.031807899475097656, 0.03311014175415039, 0.034412384033203125, 0.03571462631225586, 0.037016868591308594, 0.03831911087036133, 0.03962135314941406, 0.0409235954284668, 0.04222583770751953, 0.043528079986572266, 0.044830322265625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 6.0, 3.0, 8.0, 2.0, 11.0, 9.0, 17.0, 14.0, 21.0, 29.0, 26.0, 29.0, 40.0, 33.0, 39.0, 54.0, 39.0, 45.0, 62.0, 52.0, 63.0, 45.0, 40.0, 49.0, 41.0, 39.0, 26.0, 23.0, 31.0, 26.0, 13.0, 15.0, 11.0, 16.0, 11.0, 9.0, 6.0, 6.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06646728515625, -0.0644845962524414, -0.06250190734863281, -0.06051921844482422, -0.058536529541015625, -0.05655384063720703, -0.05457115173339844, -0.052588462829589844, -0.05060577392578125, -0.048623085021972656, -0.04664039611816406, -0.04465770721435547, -0.042675018310546875, -0.04069232940673828, -0.03870964050292969, -0.036726951599121094, -0.0347442626953125, -0.032761573791503906, -0.030778884887695312, -0.02879619598388672, -0.026813507080078125, -0.02483081817626953, -0.022848129272460938, -0.020865440368652344, -0.01888275146484375, -0.016900062561035156, -0.014917373657226562, -0.012934684753417969, -0.010951995849609375, -0.008969306945800781, -0.0069866180419921875, -0.005003929138183594, -0.003021240234375, -0.0010385513305664062, 0.0009441375732421875, 0.0029268264770507812, 0.004909515380859375, 0.006892204284667969, 0.008874893188476562, 0.010857582092285156, 0.01284027099609375, 0.014822959899902344, 0.016805648803710938, 0.01878833770751953, 0.020771026611328125, 0.02275371551513672, 0.024736404418945312, 0.026719093322753906, 0.0287017822265625, 0.030684471130371094, 0.03266716003417969, 0.03464984893798828, 0.036632537841796875, 0.03861522674560547, 0.04059791564941406, 0.042580604553222656, 0.04456329345703125, 0.046545982360839844, 0.04852867126464844, 0.05051136016845703, 0.052494049072265625, 0.05447673797607422, 0.05645942687988281, 0.058442115783691406, 0.0604248046875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 4.0, 2.0, 7.0, 7.0, 10.0, 11.0, 14.0, 18.0, 28.0, 33.0, 56.0, 99.0, 198.0, 379.0, 821.0, 2308.0, 7341.0, 33551.0, 333778.0, 594582.0, 59167.0, 10872.0, 3152.0, 1111.0, 464.0, 228.0, 92.0, 74.0, 49.0, 26.0, 20.0, 16.0, 7.0, 7.0, 8.0, 5.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037200927734375, -0.035924434661865234, -0.03464794158935547, -0.0333714485168457, -0.03209495544433594, -0.030818462371826172, -0.029541969299316406, -0.02826547622680664, -0.026988983154296875, -0.02571249008178711, -0.024435997009277344, -0.023159503936767578, -0.021883010864257812, -0.020606517791748047, -0.01933002471923828, -0.018053531646728516, -0.01677703857421875, -0.015500545501708984, -0.014224052429199219, -0.012947559356689453, -0.011671066284179688, -0.010394573211669922, -0.009118080139160156, -0.00784158706665039, -0.006565093994140625, -0.005288600921630859, -0.004012107849121094, -0.002735614776611328, -0.0014591217041015625, -0.00018262863159179688, 0.0010938644409179688, 0.0023703575134277344, 0.0036468505859375, 0.004923343658447266, 0.006199836730957031, 0.007476329803466797, 0.008752822875976562, 0.010029315948486328, 0.011305809020996094, 0.01258230209350586, 0.013858795166015625, 0.01513528823852539, 0.016411781311035156, 0.017688274383544922, 0.018964767456054688, 0.020241260528564453, 0.02151775360107422, 0.022794246673583984, 0.02407073974609375, 0.025347232818603516, 0.02662372589111328, 0.027900218963623047, 0.029176712036132812, 0.030453205108642578, 0.031729698181152344, 0.03300619125366211, 0.034282684326171875, 0.03555917739868164, 0.036835670471191406, 0.03811216354370117, 0.03938865661621094, 0.0406651496887207, 0.04194164276123047, 0.043218135833740234, 0.04449462890625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 3.0, 5.0, 10.0, 7.0, 15.0, 23.0, 15.0, 21.0, 26.0, 26.0, 32.0, 31.0, 39.0, 34.0, 28.0, 47.0, 54.0, 37.0, 45.0, 52.0, 34.0, 50.0, 41.0, 62.0, 31.0, 26.0, 28.0, 28.0, 19.0, 14.0, 27.0, 21.0, 15.0, 9.0, 8.0, 8.0, 4.0, 5.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.137451171875, -0.13332176208496094, -0.12919235229492188, -0.1250629425048828, -0.12093353271484375, -0.11680412292480469, -0.11267471313476562, -0.10854530334472656, -0.1044158935546875, -0.10028648376464844, -0.09615707397460938, -0.09202766418457031, -0.08789825439453125, -0.08376884460449219, -0.07963943481445312, -0.07551002502441406, -0.071380615234375, -0.06725120544433594, -0.06312179565429688, -0.05899238586425781, -0.05486297607421875, -0.05073356628417969, -0.046604156494140625, -0.04247474670410156, -0.0383453369140625, -0.03421592712402344, -0.030086517333984375, -0.025957107543945312, -0.02182769775390625, -0.017698287963867188, -0.013568878173828125, -0.009439468383789062, -0.00531005859375, -0.0011806488037109375, 0.002948760986328125, 0.0070781707763671875, 0.01120758056640625, 0.015336990356445312, 0.019466400146484375, 0.023595809936523438, 0.0277252197265625, 0.03185462951660156, 0.035984039306640625, 0.04011344909667969, 0.04424285888671875, 0.04837226867675781, 0.052501678466796875, 0.05663108825683594, 0.060760498046875, 0.06488990783691406, 0.06901931762695312, 0.07314872741699219, 0.07727813720703125, 0.08140754699707031, 0.08553695678710938, 0.08966636657714844, 0.0937957763671875, 0.09792518615722656, 0.10205459594726562, 0.10618400573730469, 0.11031341552734375, 0.11444282531738281, 0.11857223510742188, 0.12270164489746094, 0.1268310546875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 7.0, 6.0, 7.0, 22.0, 40.0, 50.0, 85.0, 143.0, 368.0, 873.0, 2530.0, 11345.0, 136673.0, 811649.0, 73422.0, 8055.0, 1962.0, 688.0, 295.0, 149.0, 71.0, 45.0, 20.0, 16.0, 9.0, 7.0, 6.0, 2.0, 3.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0173187255859375, -0.01663684844970703, -0.015954971313476562, -0.015273094177246094, -0.014591217041015625, -0.013909339904785156, -0.013227462768554688, -0.012545585632324219, -0.01186370849609375, -0.011181831359863281, -0.010499954223632812, -0.009818077087402344, -0.009136199951171875, -0.008454322814941406, -0.0077724456787109375, -0.007090568542480469, -0.00640869140625, -0.005726814270019531, -0.0050449371337890625, -0.004363059997558594, -0.003681182861328125, -0.0029993057250976562, -0.0023174285888671875, -0.0016355514526367188, -0.00095367431640625, -0.00027179718017578125, 0.0004100799560546875, 0.0010919570922851562, 0.001773834228515625, 0.0024557113647460938, 0.0031375885009765625, 0.0038194656372070312, 0.0045013427734375, 0.005183219909667969, 0.0058650970458984375, 0.006546974182128906, 0.007228851318359375, 0.007910728454589844, 0.008592605590820312, 0.009274482727050781, 0.00995635986328125, 0.010638236999511719, 0.011320114135742188, 0.012001991271972656, 0.012683868408203125, 0.013365745544433594, 0.014047622680664062, 0.014729499816894531, 0.015411376953125, 0.01609325408935547, 0.016775131225585938, 0.017457008361816406, 0.018138885498046875, 0.018820762634277344, 0.019502639770507812, 0.02018451690673828, 0.02086639404296875, 0.02154827117919922, 0.022230148315429688, 0.022912025451660156, 0.023593902587890625, 0.024275779724121094, 0.024957656860351562, 0.02563953399658203, 0.0263214111328125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 6.0, 8.0, 18.0, 22.0, 37.0, 51.0, 71.0, 118.0, 135.0, 145.0, 110.0, 112.0, 67.0, 43.0, 18.0, 14.0, 11.0, 2.0, 5.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.59634780883789e-06, -9.299255907535553e-06, -9.002164006233215e-06, -8.705072104930878e-06, -8.40798020362854e-06, -8.110888302326202e-06, -7.813796401023865e-06, -7.516704499721527e-06, -7.2196125984191895e-06, -6.922520697116852e-06, -6.625428795814514e-06, -6.3283368945121765e-06, -6.031244993209839e-06, -5.734153091907501e-06, -5.4370611906051636e-06, -5.139969289302826e-06, -4.842877388000488e-06, -4.545785486698151e-06, -4.248693585395813e-06, -3.951601684093475e-06, -3.6545097827911377e-06, -3.3574178814888e-06, -3.0603259801864624e-06, -2.7632340788841248e-06, -2.466142177581787e-06, -2.1690502762794495e-06, -1.8719583749771118e-06, -1.5748664736747742e-06, -1.2777745723724365e-06, -9.806826710700989e-07, -6.835907697677612e-07, -3.864988684654236e-07, -8.940696716308594e-08, 2.076849341392517e-07, 5.047768354415894e-07, 8.01868736743927e-07, 1.0989606380462646e-06, 1.3960525393486023e-06, 1.69314444065094e-06, 1.9902363419532776e-06, 2.2873282432556152e-06, 2.584420144557953e-06, 2.8815120458602905e-06, 3.178603947162628e-06, 3.475695848464966e-06, 3.7727877497673035e-06, 4.069879651069641e-06, 4.366971552371979e-06, 4.664063453674316e-06, 4.961155354976654e-06, 5.258247256278992e-06, 5.555339157581329e-06, 5.852431058883667e-06, 6.149522960186005e-06, 6.446614861488342e-06, 6.74370676279068e-06, 7.040798664093018e-06, 7.337890565395355e-06, 7.634982466697693e-06, 7.93207436800003e-06, 8.229166269302368e-06, 8.526258170604706e-06, 8.823350071907043e-06, 9.120441973209381e-06, 9.417533874511719e-06]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 6.0, 3.0, 7.0, 5.0, 13.0, 7.0, 27.0, 26.0, 36.0, 49.0, 68.0, 95.0, 132.0, 197.0, 288.0, 444.0, 621.0, 1023.0, 1838.0, 3003.0, 5599.0, 11208.0, 23930.0, 55666.0, 134985.0, 275806.0, 281411.0, 141066.0, 59268.0, 25609.0, 11906.0, 5947.0, 3194.0, 1860.0, 1099.0, 667.0, 456.0, 296.0, 182.0, 137.0, 102.0, 73.0, 54.0, 40.0, 32.0, 17.0, 20.0, 17.0, 12.0, 6.0, 4.0, 2.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.00681304931640625, -0.0066002607345581055, -0.006387472152709961, -0.006174683570861816, -0.005961894989013672, -0.005749106407165527, -0.005536317825317383, -0.005323529243469238, -0.005110740661621094, -0.004897952079772949, -0.004685163497924805, -0.00447237491607666, -0.004259586334228516, -0.004046797752380371, -0.0038340091705322266, -0.003621220588684082, -0.0034084320068359375, -0.003195643424987793, -0.0029828548431396484, -0.002770066261291504, -0.0025572776794433594, -0.002344489097595215, -0.0021317005157470703, -0.0019189119338989258, -0.0017061233520507812, -0.0014933347702026367, -0.0012805461883544922, -0.0010677576065063477, -0.0008549690246582031, -0.0006421804428100586, -0.00042939186096191406, -0.00021660327911376953, -3.814697265625e-06, 0.00020897388458251953, 0.00042176246643066406, 0.0006345510482788086, 0.0008473396301269531, 0.0010601282119750977, 0.0012729167938232422, 0.0014857053756713867, 0.0016984939575195312, 0.0019112825393676758, 0.0021240711212158203, 0.002336859703063965, 0.0025496482849121094, 0.002762436866760254, 0.0029752254486083984, 0.003188014030456543, 0.0034008026123046875, 0.003613591194152832, 0.0038263797760009766, 0.004039168357849121, 0.004251956939697266, 0.00446474552154541, 0.004677534103393555, 0.004890322685241699, 0.005103111267089844, 0.005315899848937988, 0.005528688430786133, 0.005741477012634277, 0.005954265594482422, 0.006167054176330566, 0.006379842758178711, 0.0065926313400268555, 0.006805419921875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 1.0, 4.0, 1.0, 4.0, 2.0, 2.0, 3.0, 15.0, 6.0, 11.0, 13.0, 16.0, 23.0, 18.0, 27.0, 36.0, 51.0, 58.0, 57.0, 65.0, 50.0, 56.0, 57.0, 60.0, 61.0, 44.0, 43.0, 52.0, 30.0, 19.0, 24.0, 19.0, 16.0, 12.0, 6.0, 12.0, 6.0, 6.0, 8.0, 0.0, 4.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.002399444580078125, -0.002327144145965576, -0.0022548437118530273, -0.0021825432777404785, -0.0021102428436279297, -0.002037942409515381, -0.001965641975402832, -0.0018933415412902832, -0.0018210411071777344, -0.0017487406730651855, -0.0016764402389526367, -0.0016041398048400879, -0.001531839370727539, -0.0014595389366149902, -0.0013872385025024414, -0.0013149380683898926, -0.0012426376342773438, -0.001170337200164795, -0.001098036766052246, -0.0010257363319396973, -0.0009534358978271484, -0.0008811354637145996, -0.0008088350296020508, -0.000736534595489502, -0.0006642341613769531, -0.0005919337272644043, -0.0005196332931518555, -0.00044733285903930664, -0.0003750324249267578, -0.000302731990814209, -0.00023043155670166016, -0.00015813112258911133, -8.58306884765625e-05, -1.3530254364013672e-05, 5.8770179748535156e-05, 0.00013107061386108398, 0.0002033710479736328, 0.00027567148208618164, 0.00034797191619873047, 0.0004202723503112793, 0.0004925727844238281, 0.000564873218536377, 0.0006371736526489258, 0.0007094740867614746, 0.0007817745208740234, 0.0008540749549865723, 0.0009263753890991211, 0.00099867582321167, 0.0010709762573242188, 0.0011432766914367676, 0.0012155771255493164, 0.0012878775596618652, 0.001360177993774414, 0.0014324784278869629, 0.0015047788619995117, 0.0015770792961120605, 0.0016493797302246094, 0.0017216801643371582, 0.001793980598449707, 0.0018662810325622559, 0.0019385814666748047, 0.0020108819007873535, 0.0020831823348999023, 0.002155482769012451, 0.002227783203125]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 3.0, 1.0, 4.0, 5.0, 2.0, 2.0, 5.0, 6.0, 7.0, 5.0, 19.0, 18.0, 23.0, 22.0, 35.0, 29.0, 31.0, 43.0, 56.0, 50.0, 49.0, 63.0, 52.0, 59.0, 50.0, 41.0, 39.0, 46.0, 40.0, 30.0, 33.0, 17.0, 21.0, 13.0, 15.0, 7.0, 4.0, 13.0, 8.0, 8.0, 5.0, 7.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.05102512985467911, -0.04939844086766243, -0.04777175560593605, -0.04614506661891937, -0.044518377631902695, -0.042891692370176315, -0.04126500338315964, -0.03963831812143326, -0.03801162913441658, -0.0363849401473999, -0.03475825488567352, -0.033131565898656845, -0.03150487691164017, -0.029878191649913788, -0.02825150266289711, -0.02662481553852558, -0.024998126551508904, -0.023371439427137375, -0.021744750440120697, -0.02011806331574917, -0.01849137619137764, -0.016864687204360962, -0.015238000079989433, -0.013611312955617905, -0.011984624899923801, -0.010357936844229698, -0.00873124971985817, -0.007104561664164066, -0.00547787407413125, -0.0038511864840984344, -0.002224498428404331, -0.0005978113040328026, 0.0010288767516613007, 0.0026555643416941166, 0.0042822519317269325, 0.005908939987421036, 0.007535627577453852, 0.009162315167486668, 0.010789003223180771, 0.0124156903475523, 0.014042378403246403, 0.015669066458940506, 0.017295753583312035, 0.018922440707683563, 0.02054912969470024, 0.02217581681907177, 0.0238025039434433, 0.025429192930459976, 0.027055880054831505, 0.028682567179203033, 0.03030925616621971, 0.03193594515323639, 0.03356263041496277, 0.035189319401979446, 0.036816008388996124, 0.038442693650722504, 0.04006938263773918, 0.04169607162475586, 0.04332275688648224, 0.04494944587349892, 0.046576134860515594, 0.048202820122241974, 0.04982950910925865, 0.05145619809627533, 0.05308288335800171]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 8.0, 8.0, 6.0, 6.0, 18.0, 11.0, 19.0, 15.0, 30.0, 22.0, 22.0, 37.0, 29.0, 40.0, 45.0, 53.0, 41.0, 61.0, 52.0, 45.0, 42.0, 46.0, 46.0, 45.0, 34.0, 34.0, 36.0, 20.0, 15.0, 19.0, 23.0, 17.0, 13.0, 16.0, 12.0, 6.0, 7.0, 1.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05878680944442749, -0.0570182241499424, -0.055249642580747604, -0.05348105728626251, -0.05171247199177742, -0.04994388669729233, -0.048175305128097534, -0.04640671983361244, -0.04463813453912735, -0.04286954924464226, -0.041100967675447464, -0.03933238238096237, -0.03756379708647728, -0.03579521179199219, -0.034026630222797394, -0.0322580449283123, -0.030489463359117508, -0.028720879927277565, -0.026952294632792473, -0.02518371120095253, -0.023415125906467438, -0.021646542474627495, -0.019877959042787552, -0.01810937374830246, -0.016340790316462517, -0.0145722059533, -0.012803621590137482, -0.011035038158297539, -0.009266453795135021, -0.007497869431972504, -0.005729286000132561, -0.003960701636970043, -0.0021921172738075256, -0.00042353314347565174, 0.0013450509868562222, 0.0031136348843574524, 0.00488221924751997, 0.0066508036106824875, 0.00841938704252243, 0.010187971405684948, 0.011956555768847466, 0.013725140132009983, 0.0154937244951725, 0.017262307927012444, 0.019030891358852386, 0.02079947665333748, 0.02256806008517742, 0.024336643517017365, 0.026105228811502457, 0.0278738122433424, 0.029642397537827492, 0.031410980969667435, 0.03317956626415253, 0.03494814783334732, 0.03671673312783241, 0.038485318422317505, 0.0402538999915123, 0.04202248528599739, 0.043791066855192184, 0.04555965214967728, 0.04732823744416237, 0.04909682273864746, 0.050865404307842255, 0.05263398960232735, 0.05440257489681244]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 8.0, 6.0, 11.0, 12.0, 23.0, 35.0, 61.0, 78.0, 109.0, 227.0, 404.0, 620.0, 1148.0, 2323.0, 4282.0, 8485.0, 19840.0, 54875.0, 206434.0, 473940.0, 188463.0, 51387.0, 18733.0, 8186.0, 4183.0, 1999.0, 1127.0, 644.0, 369.0, 203.0, 126.0, 73.0, 48.0, 31.0, 19.0, 21.0, 12.0, 5.0, 6.0, 1.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09771728515625, -0.09451007843017578, -0.09130287170410156, -0.08809566497802734, -0.08488845825195312, -0.0816812515258789, -0.07847404479980469, -0.07526683807373047, -0.07205963134765625, -0.06885242462158203, -0.06564521789550781, -0.062438011169433594, -0.059230804443359375, -0.056023597717285156, -0.05281639099121094, -0.04960918426513672, -0.0464019775390625, -0.04319477081298828, -0.03998756408691406, -0.036780357360839844, -0.033573150634765625, -0.030365943908691406, -0.027158737182617188, -0.02395153045654297, -0.02074432373046875, -0.01753711700439453, -0.014329910278320312, -0.011122703552246094, -0.007915496826171875, -0.004708290100097656, -0.0015010833740234375, 0.0017061233520507812, 0.004913330078125, 0.008120536804199219, 0.011327743530273438, 0.014534950256347656, 0.017742156982421875, 0.020949363708496094, 0.024156570434570312, 0.02736377716064453, 0.03057098388671875, 0.03377819061279297, 0.03698539733886719, 0.040192604064941406, 0.043399810791015625, 0.046607017517089844, 0.04981422424316406, 0.05302143096923828, 0.0562286376953125, 0.05943584442138672, 0.06264305114746094, 0.06585025787353516, 0.06905746459960938, 0.0722646713256836, 0.07547187805175781, 0.07867908477783203, 0.08188629150390625, 0.08509349822998047, 0.08830070495605469, 0.0915079116821289, 0.09471511840820312, 0.09792232513427734, 0.10112953186035156, 0.10433673858642578, 0.1075439453125]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 5.0, 5.0, 4.0, 3.0, 9.0, 16.0, 14.0, 22.0, 18.0, 28.0, 20.0, 29.0, 33.0, 40.0, 49.0, 38.0, 58.0, 55.0, 63.0, 53.0, 55.0, 48.0, 39.0, 45.0, 34.0, 41.0, 31.0, 27.0, 27.0, 19.0, 11.0, 16.0, 14.0, 13.0, 6.0, 8.0, 5.0, 0.0, 4.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.117431640625, -0.11417102813720703, -0.11091041564941406, -0.1076498031616211, -0.10438919067382812, -0.10112857818603516, -0.09786796569824219, -0.09460735321044922, -0.09134674072265625, -0.08808612823486328, -0.08482551574707031, -0.08156490325927734, -0.07830429077148438, -0.0750436782836914, -0.07178306579589844, -0.06852245330810547, -0.0652618408203125, -0.06200122833251953, -0.05874061584472656, -0.055480003356933594, -0.052219390869140625, -0.048958778381347656, -0.04569816589355469, -0.04243755340576172, -0.03917694091796875, -0.03591632843017578, -0.03265571594238281, -0.029395103454589844, -0.026134490966796875, -0.022873878479003906, -0.019613265991210938, -0.01635265350341797, -0.013092041015625, -0.009831428527832031, -0.0065708160400390625, -0.0033102035522460938, -4.9591064453125e-05, 0.0032110214233398438, 0.0064716339111328125, 0.009732246398925781, 0.01299285888671875, 0.01625347137451172, 0.019514083862304688, 0.022774696350097656, 0.026035308837890625, 0.029295921325683594, 0.03255653381347656, 0.03581714630126953, 0.0390777587890625, 0.04233837127685547, 0.04559898376464844, 0.048859596252441406, 0.052120208740234375, 0.055380821228027344, 0.05864143371582031, 0.06190204620361328, 0.06516265869140625, 0.06842327117919922, 0.07168388366699219, 0.07494449615478516, 0.07820510864257812, 0.0814657211303711, 0.08472633361816406, 0.08798694610595703, 0.09124755859375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 2.0, 6.0, 4.0, 11.0, 15.0, 22.0, 25.0, 37.0, 57.0, 84.0, 120.0, 202.0, 318.0, 634.0, 1332.0, 3177.0, 8166.0, 24798.0, 94689.0, 428919.0, 371525.0, 79452.0, 21892.0, 7447.0, 2932.0, 1221.0, 598.0, 317.0, 186.0, 139.0, 82.0, 39.0, 28.0, 17.0, 21.0, 18.0, 8.0, 8.0, 3.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1328125, -0.12865447998046875, -0.1244964599609375, -0.12033843994140625, -0.116180419921875, -0.11202239990234375, -0.1078643798828125, -0.10370635986328125, -0.09954833984375, -0.09539031982421875, -0.0912322998046875, -0.08707427978515625, -0.082916259765625, -0.07875823974609375, -0.0746002197265625, -0.07044219970703125, -0.0662841796875, -0.06212615966796875, -0.0579681396484375, -0.05381011962890625, -0.049652099609375, -0.04549407958984375, -0.0413360595703125, -0.03717803955078125, -0.03302001953125, -0.02886199951171875, -0.0247039794921875, -0.02054595947265625, -0.016387939453125, -0.01222991943359375, -0.0080718994140625, -0.00391387939453125, 0.000244140625, 0.00440216064453125, 0.0085601806640625, 0.01271820068359375, 0.016876220703125, 0.02103424072265625, 0.0251922607421875, 0.02935028076171875, 0.03350830078125, 0.03766632080078125, 0.0418243408203125, 0.04598236083984375, 0.050140380859375, 0.05429840087890625, 0.0584564208984375, 0.06261444091796875, 0.0667724609375, 0.07093048095703125, 0.0750885009765625, 0.07924652099609375, 0.083404541015625, 0.08756256103515625, 0.0917205810546875, 0.09587860107421875, 0.10003662109375, 0.10419464111328125, 0.1083526611328125, 0.11251068115234375, 0.116668701171875, 0.12082672119140625, 0.1249847412109375, 0.12914276123046875, 0.13330078125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 3.0, 3.0, 5.0, 8.0, 10.0, 21.0, 27.0, 12.0, 16.0, 36.0, 30.0, 30.0, 58.0, 45.0, 49.0, 56.0, 54.0, 67.0, 48.0, 66.0, 58.0, 46.0, 42.0, 42.0, 32.0, 41.0, 21.0, 17.0, 14.0, 3.0, 7.0, 5.0, 9.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1131591796875, -0.10931205749511719, -0.10546493530273438, -0.10161781311035156, -0.09777069091796875, -0.09392356872558594, -0.09007644653320312, -0.08622932434082031, -0.0823822021484375, -0.07853507995605469, -0.07468795776367188, -0.07084083557128906, -0.06699371337890625, -0.06314659118652344, -0.059299468994140625, -0.05545234680175781, -0.051605224609375, -0.04775810241699219, -0.043910980224609375, -0.04006385803222656, -0.03621673583984375, -0.03236961364746094, -0.028522491455078125, -0.024675369262695312, -0.0208282470703125, -0.016981124877929688, -0.013134002685546875, -0.009286880493164062, -0.00543975830078125, -0.0015926361083984375, 0.002254486083984375, 0.0061016082763671875, 0.00994873046875, 0.013795852661132812, 0.017642974853515625, 0.021490097045898438, 0.02533721923828125, 0.029184341430664062, 0.033031463623046875, 0.03687858581542969, 0.0407257080078125, 0.04457283020019531, 0.048419952392578125, 0.05226707458496094, 0.05611419677734375, 0.05996131896972656, 0.06380844116210938, 0.06765556335449219, 0.071502685546875, 0.07534980773925781, 0.07919692993164062, 0.08304405212402344, 0.08689117431640625, 0.09073829650878906, 0.09458541870117188, 0.09843254089355469, 0.1022796630859375, 0.10612678527832031, 0.10997390747070312, 0.11382102966308594, 0.11766815185546875, 0.12151527404785156, 0.12536239624023438, 0.1292095184326172, 0.133056640625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 5.0, 5.0, 5.0, 2.0, 7.0, 7.0, 21.0, 26.0, 33.0, 60.0, 116.0, 165.0, 300.0, 528.0, 887.0, 1702.0, 3426.0, 7415.0, 18074.0, 53113.0, 177722.0, 450940.0, 225855.0, 68437.0, 22479.0, 8723.0, 4045.0, 1962.0, 1071.0, 569.0, 318.0, 201.0, 141.0, 67.0, 49.0, 25.0, 15.0, 15.0, 10.0, 5.0, 7.0, 5.0, 1.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.018463134765625, -0.01789689064025879, -0.017330646514892578, -0.016764402389526367, -0.016198158264160156, -0.015631914138793945, -0.015065670013427734, -0.014499425888061523, -0.013933181762695312, -0.013366937637329102, -0.01280069351196289, -0.01223444938659668, -0.011668205261230469, -0.011101961135864258, -0.010535717010498047, -0.009969472885131836, -0.009403228759765625, -0.008836984634399414, -0.008270740509033203, -0.007704496383666992, -0.007138252258300781, -0.00657200813293457, -0.006005764007568359, -0.0054395198822021484, -0.0048732757568359375, -0.0043070316314697266, -0.0037407875061035156, -0.0031745433807373047, -0.0026082992553710938, -0.002042055130004883, -0.0014758110046386719, -0.0009095668792724609, -0.00034332275390625, 0.00022292137145996094, 0.0007891654968261719, 0.0013554096221923828, 0.0019216537475585938, 0.0024878978729248047, 0.0030541419982910156, 0.0036203861236572266, 0.0041866302490234375, 0.0047528743743896484, 0.005319118499755859, 0.00588536262512207, 0.006451606750488281, 0.007017850875854492, 0.007584095001220703, 0.008150339126586914, 0.008716583251953125, 0.009282827377319336, 0.009849071502685547, 0.010415315628051758, 0.010981559753417969, 0.01154780387878418, 0.01211404800415039, 0.012680292129516602, 0.013246536254882812, 0.013812780380249023, 0.014379024505615234, 0.014945268630981445, 0.015511512756347656, 0.016077756881713867, 0.016644001007080078, 0.01721024513244629, 0.0177764892578125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 7.0, 5.0, 6.0, 9.0, 5.0, 18.0, 19.0, 19.0, 36.0, 46.0, 54.0, 66.0, 76.0, 78.0, 95.0, 100.0, 61.0, 50.0, 57.0, 34.0, 30.0, 29.0, 23.0, 18.0, 17.0, 6.0, 7.0, 10.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6954879760742188e-06, -3.579072654247284e-06, -3.462657332420349e-06, -3.3462420105934143e-06, -3.2298266887664795e-06, -3.1134113669395447e-06, -2.99699604511261e-06, -2.880580723285675e-06, -2.7641654014587402e-06, -2.6477500796318054e-06, -2.5313347578048706e-06, -2.414919435977936e-06, -2.298504114151001e-06, -2.182088792324066e-06, -2.0656734704971313e-06, -1.9492581486701965e-06, -1.8328428268432617e-06, -1.716427505016327e-06, -1.600012183189392e-06, -1.4835968613624573e-06, -1.3671815395355225e-06, -1.2507662177085876e-06, -1.1343508958816528e-06, -1.017935574054718e-06, -9.015202522277832e-07, -7.851049304008484e-07, -6.686896085739136e-07, -5.522742867469788e-07, -4.3585896492004395e-07, -3.1944364309310913e-07, -2.0302832126617432e-07, -8.66129994392395e-08, 2.9802322387695312e-08, 1.4621764421463013e-07, 2.6263296604156494e-07, 3.7904828786849976e-07, 4.954636096954346e-07, 6.118789315223694e-07, 7.282942533493042e-07, 8.44709575176239e-07, 9.611248970031738e-07, 1.0775402188301086e-06, 1.1939555406570435e-06, 1.3103708624839783e-06, 1.426786184310913e-06, 1.543201506137848e-06, 1.6596168279647827e-06, 1.7760321497917175e-06, 1.8924474716186523e-06, 2.008862793445587e-06, 2.125278115272522e-06, 2.2416934370994568e-06, 2.3581087589263916e-06, 2.4745240807533264e-06, 2.5909394025802612e-06, 2.707354724407196e-06, 2.823770046234131e-06, 2.9401853680610657e-06, 3.0566006898880005e-06, 3.1730160117149353e-06, 3.28943133354187e-06, 3.405846655368805e-06, 3.5222619771957397e-06, 3.6386772990226746e-06, 3.7550926208496094e-06]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 9.0, 6.0, 10.0, 16.0, 12.0, 30.0, 46.0, 55.0, 66.0, 113.0, 173.0, 245.0, 355.0, 583.0, 830.0, 1291.0, 2104.0, 3457.0, 5889.0, 10642.0, 21665.0, 48487.0, 127491.0, 373708.0, 267867.0, 102218.0, 40126.0, 18191.0, 9284.0, 5222.0, 2958.0, 1880.0, 1200.0, 807.0, 470.0, 313.0, 227.0, 144.0, 119.0, 61.0, 47.0, 37.0, 28.0, 18.0, 12.0, 6.0, 13.0, 6.0, 10.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.0181732177734375, -0.017603397369384766, -0.01703357696533203, -0.016463756561279297, -0.015893936157226562, -0.015324115753173828, -0.014754295349121094, -0.01418447494506836, -0.013614654541015625, -0.01304483413696289, -0.012475013732910156, -0.011905193328857422, -0.011335372924804688, -0.010765552520751953, -0.010195732116699219, -0.009625911712646484, -0.00905609130859375, -0.008486270904541016, -0.007916450500488281, -0.007346630096435547, -0.0067768096923828125, -0.006206989288330078, -0.005637168884277344, -0.005067348480224609, -0.004497528076171875, -0.003927707672119141, -0.0033578872680664062, -0.002788066864013672, -0.0022182464599609375, -0.0016484260559082031, -0.0010786056518554688, -0.0005087852478027344, 6.103515625e-05, 0.0006308555603027344, 0.0012006759643554688, 0.0017704963684082031, 0.0023403167724609375, 0.002910137176513672, 0.0034799575805664062, 0.004049777984619141, 0.004619598388671875, 0.005189418792724609, 0.005759239196777344, 0.006329059600830078, 0.0068988800048828125, 0.007468700408935547, 0.008038520812988281, 0.008608341217041016, 0.00917816162109375, 0.009747982025146484, 0.010317802429199219, 0.010887622833251953, 0.011457443237304688, 0.012027263641357422, 0.012597084045410156, 0.01316690444946289, 0.013736724853515625, 0.01430654525756836, 0.014876365661621094, 0.015446186065673828, 0.016016006469726562, 0.016585826873779297, 0.01715564727783203, 0.017725467681884766, 0.0182952880859375]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 9.0, 6.0, 11.0, 13.0, 12.0, 22.0, 29.0, 53.0, 56.0, 82.0, 101.0, 206.0, 102.0, 85.0, 64.0, 42.0, 37.0, 25.0, 11.0, 8.0, 6.0, 3.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014404296875, -0.013816356658935547, -0.013228416442871094, -0.01264047622680664, -0.012052536010742188, -0.011464595794677734, -0.010876655578613281, -0.010288715362548828, -0.009700775146484375, -0.009112834930419922, -0.008524894714355469, -0.007936954498291016, -0.0073490142822265625, -0.006761074066162109, -0.006173133850097656, -0.005585193634033203, -0.00499725341796875, -0.004409313201904297, -0.0038213729858398438, -0.0032334327697753906, -0.0026454925537109375, -0.0020575523376464844, -0.0014696121215820312, -0.0008816719055175781, -0.000293731689453125, 0.0002942085266113281, 0.0008821487426757812, 0.0014700889587402344, 0.0020580291748046875, 0.0026459693908691406, 0.0032339096069335938, 0.003821849822998047, 0.0044097900390625, 0.004997730255126953, 0.005585670471191406, 0.006173610687255859, 0.0067615509033203125, 0.007349491119384766, 0.007937431335449219, 0.008525371551513672, 0.009113311767578125, 0.009701251983642578, 0.010289192199707031, 0.010877132415771484, 0.011465072631835938, 0.01205301284790039, 0.012640953063964844, 0.013228893280029297, 0.01381683349609375, 0.014404773712158203, 0.014992713928222656, 0.01558065414428711, 0.016168594360351562, 0.016756534576416016, 0.01734447479248047, 0.017932415008544922, 0.018520355224609375, 0.019108295440673828, 0.01969623565673828, 0.020284175872802734, 0.020872116088867188, 0.02146005630493164, 0.022047996520996094, 0.022635936737060547, 0.023223876953125]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 3.0, 7.0, 9.0, 8.0, 24.0, 33.0, 50.0, 62.0, 119.0, 136.0, 141.0, 119.0, 104.0, 61.0, 53.0, 32.0, 16.0, 7.0, 13.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.36785775423049927, -0.359567791223526, -0.35127779841423035, -0.3429878354072571, -0.3346978425979614, -0.32640787959098816, -0.3181179165840149, -0.30982792377471924, -0.30153796076774597, -0.2932479977607727, -0.28495800495147705, -0.2766680419445038, -0.2683780789375305, -0.26008808612823486, -0.2517981231212616, -0.24350814521312714, -0.23521816730499268, -0.22692818939685822, -0.21863821148872375, -0.2103482484817505, -0.20205827057361603, -0.19376829266548157, -0.1854783296585083, -0.17718835175037384, -0.16889837384223938, -0.16060839593410492, -0.15231841802597046, -0.1440284550189972, -0.13573847711086273, -0.12744849920272827, -0.11915852874517441, -0.11086855828762054, -0.10257861018180847, -0.09428863227367401, -0.08599866181612015, -0.07770869135856628, -0.06941871345043182, -0.06112873926758766, -0.0528387650847435, -0.04454879090189934, -0.036258816719055176, -0.027968842536211014, -0.019678868353366852, -0.01138889417052269, -0.003098919987678528, 0.005191054195165634, 0.013481028378009796, 0.021771002560853958, 0.03006097674369812, 0.03835095092654228, 0.046640925109386444, 0.054930899292230606, 0.06322087347507477, 0.07151085138320923, 0.07980082184076309, 0.08809079229831696, 0.09638077020645142, 0.10467074811458588, 0.11296071857213974, 0.1212506890296936, 0.12954066693782806, 0.13783064484596252, 0.1461206078529358, 0.15441058576107025, 0.1627005636692047]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 5.0, 3.0, 5.0, 9.0, 9.0, 11.0, 15.0, 8.0, 20.0, 27.0, 13.0, 23.0, 37.0, 29.0, 40.0, 38.0, 33.0, 46.0, 47.0, 36.0, 49.0, 39.0, 43.0, 43.0, 64.0, 48.0, 24.0, 42.0, 22.0, 23.0, 28.0, 18.0, 17.0, 17.0, 11.0, 13.0, 14.0, 7.0, 6.0, 4.0, 4.0, 5.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17499539256095886, -0.16934356093406677, -0.16369174420833588, -0.1580399125814438, -0.1523880958557129, -0.1467362642288208, -0.1410844326019287, -0.13543261587619781, -0.12978079915046692, -0.12412897497415543, -0.11847715079784393, -0.11282531917095184, -0.10717350244522095, -0.10152167081832886, -0.09586984664201736, -0.09021802246570587, -0.08456619083881378, -0.07891436666250229, -0.0732625424861908, -0.0676107108592987, -0.06195889040827751, -0.05630706623196602, -0.05065523833036423, -0.045003414154052734, -0.03935158997774124, -0.03369976580142975, -0.028047939762473106, -0.022396113723516464, -0.01674428954720497, -0.011092465370893478, -0.005440637469291687, 0.0002111867070198059, 0.005863025784492493, 0.01151485089212656, 0.017166675999760628, 0.02281850203871727, 0.028470326215028763, 0.034122150391340256, 0.03977397829294205, 0.04542580246925354, 0.05107762664556503, 0.056729450821876526, 0.06238127499818802, 0.06803309917449951, 0.0736849308013916, 0.0793367475271225, 0.08498857915401459, 0.09064040333032608, 0.09629222750663757, 0.10194405168294907, 0.10759587585926056, 0.11324770748615265, 0.11889952421188354, 0.12455135583877563, 0.13020318746566772, 0.13585500419139862, 0.14150682091712952, 0.1471586525440216, 0.1528104692697525, 0.1584623008966446, 0.1641141176223755, 0.16976594924926758, 0.17541778087615967, 0.18106959760189056, 0.18672142922878265]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 2.0, 10.0, 3.0, 6.0, 16.0, 23.0, 23.0, 41.0, 46.0, 65.0, 74.0, 97.0, 135.0, 177.0, 219.0, 327.0, 366.0, 636.0, 946.0, 1544.0, 5191.0, 1035301.0, 1867.0, 960.0, 709.0, 434.0, 356.0, 252.0, 192.0, 160.0, 99.0, 86.0, 55.0, 52.0, 36.0, 22.0, 20.0, 10.0, 15.0, 8.0, 9.0, 2.0, 2.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.23735788464546204, -0.23019158840179443, -0.22302527725696564, -0.21585898101329803, -0.20869266986846924, -0.20152637362480164, -0.19436007738113403, -0.18719376623630524, -0.18002746999263763, -0.17286117374897003, -0.16569486260414124, -0.15852856636047363, -0.15136225521564484, -0.14419595897197723, -0.13702964782714844, -0.12986335158348083, -0.12269704788923264, -0.11553074419498444, -0.10836444050073624, -0.10119813680648804, -0.09403184056282043, -0.08686553686857224, -0.07969923317432404, -0.07253293693065643, -0.06536662578582764, -0.05820032209157944, -0.051034022122621536, -0.04386771842837334, -0.036701418459415436, -0.029535114765167236, -0.022368811070919037, -0.015202511101961136, -0.008036211133003235, -0.0008699088357388973, 0.00629639346152544, 0.013462696224451065, 0.020628998056054115, 0.027795299887657166, 0.034961603581905365, 0.042127903550863266, 0.049294207245111465, 0.056460510939359665, 0.06362681090831757, 0.07079311460256577, 0.07795941829681396, 0.08512571454048157, 0.09229202568531036, 0.09945832192897797, 0.10662462562322617, 0.11379092931747437, 0.12095723301172256, 0.12812353670597076, 0.13528983294963837, 0.14245614409446716, 0.14962244033813477, 0.15678873658180237, 0.16395504772663116, 0.17112134397029877, 0.17828765511512756, 0.18545395135879517, 0.19262026250362396, 0.19978655874729156, 0.20695286989212036, 0.21411916613578796, 0.22128546237945557]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 11.0, 35.0, 81.0, 164.0, 351.0, 715.0, 2182.0, 51463196.0, 2178.0, 719.0, 375.0, 181.0, 77.0, 36.0, 10.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.037178039550781, -14.60129451751709, -14.165410995483398, -13.729527473449707, -13.293643951416016, -12.857759475708008, -12.421875953674316, -11.985992431640625, -11.550108909606934, -11.114225387573242, -10.67834186553955, -10.24245834350586, -9.806573867797852, -9.370691299438477, -8.934806823730469, -8.498923301696777, -8.063039779663086, -7.6271562576293945, -7.191272735595703, -6.7553887367248535, -6.319505214691162, -5.883621692657471, -5.447737693786621, -5.01185417175293, -4.575970649719238, -4.140087127685547, -3.7042033672332764, -3.268319606781006, -2.8324360847473145, -2.396552562713623, -1.9606688022613525, -1.524785041809082, -1.0889015197753906, -0.6530178785324097, -0.2171342372894287, 0.21874940395355225, 0.6546330451965332, 1.0905165672302246, 1.5264003276824951, 1.9622840881347656, 2.398167610168457, 2.8340511322021484, 3.269934892654419, 3.7058186531066895, 4.141702175140381, 4.577585697174072, 5.013469696044922, 5.449353218078613, 5.885236740112305, 6.321120262145996, 6.7570037841796875, 7.192887783050537, 7.6287713050842285, 8.064655303955078, 8.50053882598877, 8.936422348022461, 9.372305870056152, 9.808189392089844, 10.244072914123535, 10.679956436157227, 11.115840911865234, 11.55172348022461, 11.987607955932617, 12.423491477966309, 12.859375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 6.0, 11.0, 17.0, 15.0, 28.0, 23.0, 67.0, 86.0, 124.0, 189.0, 339.0, 450.0, 812.0, 1119.0, 1941.0, 3300.0, 5780.0, 10671.0, 20078.0, 39358.0, 77760.0, 152343.0, 293168.0, 526494.0, 3530526.0, 820511.0, 382079.0, 205652.0, 105403.0, 53032.0, 27279.0, 14125.0, 7610.0, 4362.0, 2522.0, 1457.0, 967.0, 629.0, 357.0, 273.0, 166.0, 95.0, 63.0, 48.0, 29.0, 26.0, 20.0, 11.0, 4.0, 3.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3759765625, -0.3644866943359375, -0.352996826171875, -0.3415069580078125, -0.33001708984375, -0.3185272216796875, -0.307037353515625, -0.2955474853515625, -0.2840576171875, -0.2725677490234375, -0.261077880859375, -0.2495880126953125, -0.23809814453125, -0.2266082763671875, -0.215118408203125, -0.2036285400390625, -0.192138671875, -0.1806488037109375, -0.169158935546875, -0.1576690673828125, -0.14617919921875, -0.1346893310546875, -0.123199462890625, -0.1117095947265625, -0.1002197265625, -0.0887298583984375, -0.077239990234375, -0.0657501220703125, -0.05426025390625, -0.0427703857421875, -0.031280517578125, -0.0197906494140625, -0.00830078125, 0.0031890869140625, 0.014678955078125, 0.0261688232421875, 0.03765869140625, 0.0491485595703125, 0.060638427734375, 0.0721282958984375, 0.0836181640625, 0.0951080322265625, 0.106597900390625, 0.1180877685546875, 0.12957763671875, 0.1410675048828125, 0.152557373046875, 0.1640472412109375, 0.175537109375, 0.1870269775390625, 0.198516845703125, 0.2100067138671875, 0.22149658203125, 0.2329864501953125, 0.244476318359375, 0.2559661865234375, 0.2674560546875, 0.2789459228515625, 0.290435791015625, 0.3019256591796875, 0.31341552734375, 0.3249053955078125, 0.336395263671875, 0.3478851318359375, 0.359375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 4.0, 7.0, 5.0, 12.0, 15.0, 19.0, 17.0, 15.0, 23.0, 22.0, 26.0, 35.0, 33.0, 29.0, 33.0, 33.0, 45.0, 55.0, 142.0, 681.0, 298.0, 55.0, 64.0, 39.0, 46.0, 38.0, 50.0, 23.0, 30.0, 30.0, 11.0, 20.0, 19.0, 7.0, 14.0, 6.0, 7.0, 3.0, 2.0, 5.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.091796875, -2.0279693603515625, -1.964141845703125, -1.9003143310546875, -1.83648681640625, -1.7726593017578125, -1.708831787109375, -1.6450042724609375, -1.5811767578125, -1.5173492431640625, -1.453521728515625, -1.3896942138671875, -1.32586669921875, -1.2620391845703125, -1.198211669921875, -1.1343841552734375, -1.070556640625, -1.0067291259765625, -0.942901611328125, -0.8790740966796875, -0.81524658203125, -0.7514190673828125, -0.687591552734375, -0.6237640380859375, -0.5599365234375, -0.4961090087890625, -0.432281494140625, -0.3684539794921875, -0.30462646484375, -0.2407989501953125, -0.176971435546875, -0.1131439208984375, -0.04931640625, 0.0145111083984375, 0.078338623046875, 0.1421661376953125, 0.20599365234375, 0.2698211669921875, 0.333648681640625, 0.3974761962890625, 0.4613037109375, 0.5251312255859375, 0.588958740234375, 0.6527862548828125, 0.71661376953125, 0.7804412841796875, 0.844268798828125, 0.9080963134765625, 0.971923828125, 1.0357513427734375, 1.099578857421875, 1.1634063720703125, 1.22723388671875, 1.2910614013671875, 1.354888916015625, 1.4187164306640625, 1.4825439453125, 1.5463714599609375, 1.610198974609375, 1.6740264892578125, 1.73785400390625, 1.8016815185546875, 1.865509033203125, 1.9293365478515625, 1.9931640625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 8.0, 5.0, 8.0, 9.0, 24.0, 33.0, 62.0, 94.0, 152.0, 220.0, 407.0, 553.0, 937.0, 1504.0, 2424.0, 3930.0, 6448.0, 10332.0, 17564.0, 29004.0, 48549.0, 78882.0, 125231.0, 195277.0, 285537.0, 386234.0, 2747942.0, 1255965.0, 361722.0, 264218.0, 177348.0, 113117.0, 69998.0, 42484.0, 26041.0, 15348.0, 9438.0, 5562.0, 3427.0, 2020.0, 1271.0, 780.0, 486.0, 310.0, 201.0, 118.0, 92.0, 52.0, 30.0, 15.0, 11.0, 13.0, 6.0, 4.0], "bins": [-0.230224609375, -0.2239837646484375, -0.217742919921875, -0.2115020751953125, -0.20526123046875, -0.1990203857421875, -0.192779541015625, -0.1865386962890625, -0.1802978515625, -0.1740570068359375, -0.167816162109375, -0.1615753173828125, -0.15533447265625, -0.1490936279296875, -0.142852783203125, -0.1366119384765625, -0.13037109375, -0.1241302490234375, -0.117889404296875, -0.1116485595703125, -0.10540771484375, -0.0991668701171875, -0.092926025390625, -0.0866851806640625, -0.0804443359375, -0.0742034912109375, -0.067962646484375, -0.0617218017578125, -0.05548095703125, -0.0492401123046875, -0.042999267578125, -0.0367584228515625, -0.030517578125, -0.0242767333984375, -0.018035888671875, -0.0117950439453125, -0.00555419921875, 0.0006866455078125, 0.006927490234375, 0.0131683349609375, 0.0194091796875, 0.0256500244140625, 0.031890869140625, 0.0381317138671875, 0.04437255859375, 0.0506134033203125, 0.056854248046875, 0.0630950927734375, 0.0693359375, 0.0755767822265625, 0.081817626953125, 0.0880584716796875, 0.09429931640625, 0.1005401611328125, 0.106781005859375, 0.1130218505859375, 0.1192626953125, 0.1255035400390625, 0.131744384765625, 0.1379852294921875, 0.14422607421875, 0.1504669189453125, 0.156707763671875, 0.1629486083984375, 0.169189453125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 6.0, 3.0, 1.0, 1.0, 5.0, 7.0, 10.0, 8.0, 10.0, 11.0, 11.0, 16.0, 13.0, 14.0, 18.0, 16.0, 22.0, 21.0, 20.0, 28.0, 18.0, 31.0, 30.0, 45.0, 33.0, 40.0, 386.0, 635.0, 113.0, 30.0, 42.0, 30.0, 34.0, 33.0, 30.0, 39.0, 24.0, 20.0, 22.0, 22.0, 21.0, 19.0, 15.0, 11.0, 14.0, 10.0, 5.0, 9.0, 10.0, 3.0, 4.0, 5.0, 5.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0], "bins": [-1.5595703125, -1.511199951171875, -1.46282958984375, -1.414459228515625, -1.3660888671875, -1.317718505859375, -1.26934814453125, -1.220977783203125, -1.172607421875, -1.124237060546875, -1.07586669921875, -1.027496337890625, -0.9791259765625, -0.930755615234375, -0.88238525390625, -0.834014892578125, -0.78564453125, -0.737274169921875, -0.68890380859375, -0.640533447265625, -0.5921630859375, -0.543792724609375, -0.49542236328125, -0.447052001953125, -0.398681640625, -0.350311279296875, -0.30194091796875, -0.253570556640625, -0.2052001953125, -0.156829833984375, -0.10845947265625, -0.060089111328125, -0.01171875, 0.036651611328125, 0.08502197265625, 0.133392333984375, 0.1817626953125, 0.230133056640625, 0.27850341796875, 0.326873779296875, 0.375244140625, 0.423614501953125, 0.47198486328125, 0.520355224609375, 0.5687255859375, 0.617095947265625, 0.66546630859375, 0.713836669921875, 0.76220703125, 0.810577392578125, 0.85894775390625, 0.907318115234375, 0.9556884765625, 1.004058837890625, 1.05242919921875, 1.100799560546875, 1.149169921875, 1.197540283203125, 1.24591064453125, 1.294281005859375, 1.3426513671875, 1.391021728515625, 1.43939208984375, 1.487762451171875, 1.5361328125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 4.0, 6.0, 2.0, 4.0, 9.0, 14.0, 14.0, 15.0, 18.0, 29.0, 30.0, 38.0, 45.0, 77.0, 72.0, 115.0, 163.0, 183.0, 263.0, 338.0, 514.0, 726.0, 992.0, 1683.0, 3165.0, 6413.0, 15056.0, 37747.0, 100554.0, 5125828.0, 840043.0, 94186.0, 34932.0, 13846.0, 6075.0, 3041.0, 1633.0, 1030.0, 688.0, 500.0, 361.0, 257.0, 183.0, 118.0, 126.0, 64.0, 48.0, 43.0, 31.0, 27.0, 17.0, 15.0, 25.0, 13.0, 10.0, 8.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0], "bins": [-0.7294921875, -0.7059326171875, -0.682373046875, -0.6588134765625, -0.63525390625, -0.6116943359375, -0.588134765625, -0.5645751953125, -0.541015625, -0.5174560546875, -0.493896484375, -0.4703369140625, -0.44677734375, -0.4232177734375, -0.399658203125, -0.3760986328125, -0.3525390625, -0.3289794921875, -0.305419921875, -0.2818603515625, -0.25830078125, -0.2347412109375, -0.211181640625, -0.1876220703125, -0.1640625, -0.1405029296875, -0.116943359375, -0.0933837890625, -0.06982421875, -0.0462646484375, -0.022705078125, 0.0008544921875, 0.0244140625, 0.0479736328125, 0.071533203125, 0.0950927734375, 0.11865234375, 0.1422119140625, 0.165771484375, 0.1893310546875, 0.212890625, 0.2364501953125, 0.260009765625, 0.2835693359375, 0.30712890625, 0.3306884765625, 0.354248046875, 0.3778076171875, 0.4013671875, 0.4249267578125, 0.448486328125, 0.4720458984375, 0.49560546875, 0.5191650390625, 0.542724609375, 0.5662841796875, 0.58984375, 0.6134033203125, 0.636962890625, 0.6605224609375, 0.68408203125, 0.7076416015625, 0.731201171875, 0.7547607421875, 0.7783203125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 8.0, 5.0, 7.0, 11.0, 11.0, 11.0, 16.0, 23.0, 23.0, 22.0, 27.0, 45.0, 29.0, 38.0, 50.0, 29.0, 47.0, 51.0, 349.0, 737.0, 80.0, 41.0, 34.0, 36.0, 43.0, 32.0, 30.0, 36.0, 34.0, 17.0, 20.0, 17.0, 15.0, 13.0, 4.0, 7.0, 6.0, 10.0, 2.0, 2.0, 6.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.126953125, -2.0609130859375, -1.994873046875, -1.9288330078125, -1.86279296875, -1.7967529296875, -1.730712890625, -1.6646728515625, -1.5986328125, -1.5325927734375, -1.466552734375, -1.4005126953125, -1.33447265625, -1.2684326171875, -1.202392578125, -1.1363525390625, -1.0703125, -1.0042724609375, -0.938232421875, -0.8721923828125, -0.80615234375, -0.7401123046875, -0.674072265625, -0.6080322265625, -0.5419921875, -0.4759521484375, -0.409912109375, -0.3438720703125, -0.27783203125, -0.2117919921875, -0.145751953125, -0.0797119140625, -0.013671875, 0.0523681640625, 0.118408203125, 0.1844482421875, 0.25048828125, 0.3165283203125, 0.382568359375, 0.4486083984375, 0.5146484375, 0.5806884765625, 0.646728515625, 0.7127685546875, 0.77880859375, 0.8448486328125, 0.910888671875, 0.9769287109375, 1.04296875, 1.1090087890625, 1.175048828125, 1.2410888671875, 1.30712890625, 1.3731689453125, 1.439208984375, 1.5052490234375, 1.5712890625, 1.6373291015625, 1.703369140625, 1.7694091796875, 1.83544921875, 1.9014892578125, 1.967529296875, 2.0335693359375, 2.099609375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 1.0, 4.0, 3.0, 5.0, 9.0, 13.0, 14.0, 29.0, 33.0, 38.0, 54.0, 79.0, 158.0, 243.0, 92.0, 69.0, 34.0, 29.0, 27.0, 17.0, 18.0, 10.0, 7.0, 4.0, 1.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.225685119628906, -18.520082473754883, -17.814477920532227, -17.108875274658203, -16.403270721435547, -15.697668075561523, -14.9920654296875, -14.28646183013916, -13.58085823059082, -12.87525463104248, -12.16965103149414, -11.464048385620117, -10.758444786071777, -10.052841186523438, -9.347238540649414, -8.641634941101074, -7.936031341552734, -7.2304277420043945, -6.524824619293213, -5.819221496582031, -5.113617897033691, -4.408014297485352, -3.70241117477417, -2.9968080520629883, -2.2912044525146484, -1.5856010913848877, -0.879997730255127, -0.1743943691253662, 0.5312089920043945, 1.2368123531341553, 1.942415714263916, 2.6480188369750977, 3.3536205291748047, 4.0592241287231445, 4.764827251434326, 5.470430374145508, 6.176033973693848, 6.8816375732421875, 7.587240695953369, 8.29284381866455, 8.99844741821289, 9.70405101776123, 10.40965461730957, 11.115257263183594, 11.820860862731934, 12.526464462280273, 13.232067108154297, 13.937670707702637, 14.643274307250977, 15.348877906799316, 16.054481506347656, 16.76008415222168, 17.465686798095703, 18.17129135131836, 18.876893997192383, 19.582496643066406, 20.288101196289062, 20.993703842163086, 21.699308395385742, 22.404911041259766, 23.110515594482422, 23.816118240356445, 24.52172088623047, 25.227325439453125, 25.93292808532715]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 2.0, 5.0, 6.0, 6.0, 11.0, 8.0, 11.0, 10.0, 22.0, 15.0, 20.0, 22.0, 31.0, 34.0, 42.0, 74.0, 123.0, 155.0, 87.0, 54.0, 37.0, 31.0, 34.0, 28.0, 15.0, 24.0, 15.0, 12.0, 8.0, 13.0, 5.0, 7.0, 5.0, 8.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-44.22477722167969, -42.76165008544922, -41.29852294921875, -39.83539581298828, -38.37226867675781, -36.909141540527344, -35.446014404296875, -33.982887268066406, -32.51976013183594, -31.05663299560547, -29.593505859375, -28.13037872314453, -26.667251586914062, -25.204124450683594, -23.740997314453125, -22.277870178222656, -20.814741134643555, -19.351613998413086, -17.888486862182617, -16.42535972595215, -14.96223258972168, -13.499105453491211, -12.035977363586426, -10.572850227355957, -9.109723091125488, -7.6465959548950195, -6.183468818664551, -4.720341205596924, -3.257214069366455, -1.7940869331359863, -0.3309593200683594, 1.1321678161621094, 2.595294952392578, 4.058422088623047, 5.521549224853516, 6.984676837921143, 8.447803497314453, 9.910930633544922, 11.374058723449707, 12.837185859680176, 14.300312995910645, 15.763440132141113, 17.2265682220459, 18.689695358276367, 20.152822494506836, 21.615949630737305, 23.079076766967773, 24.542203903198242, 26.00533103942871, 27.46845817565918, 28.93158531188965, 30.394712448120117, 31.857839584350586, 33.32096862792969, 34.784095764160156, 36.247222900390625, 37.710350036621094, 39.17347717285156, 40.63660430908203, 42.0997314453125, 43.56285858154297, 45.02598571777344, 46.489112854003906, 47.952239990234375, 49.415367126464844]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 9.0, 8.0, 16.0, 15.0, 18.0, 34.0, 50.0, 61.0, 110.0, 163.0, 269.0, 366.0, 661.0, 1119.0, 2171.0, 4570.0, 11810.0, 46200.0, 3299952.0, 769936.0, 36147.0, 10864.0, 4482.0, 2202.0, 1171.0, 651.0, 425.0, 262.0, 165.0, 111.0, 79.0, 55.0, 42.0, 30.0, 13.0, 20.0, 11.0, 7.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038787841796875, -0.03749227523803711, -0.03619670867919922, -0.03490114212036133, -0.03360557556152344, -0.03231000900268555, -0.031014442443847656, -0.029718875885009766, -0.028423309326171875, -0.027127742767333984, -0.025832176208496094, -0.024536609649658203, -0.023241043090820312, -0.021945476531982422, -0.02064990997314453, -0.01935434341430664, -0.01805877685546875, -0.01676321029663086, -0.015467643737792969, -0.014172077178955078, -0.012876510620117188, -0.011580944061279297, -0.010285377502441406, -0.008989810943603516, -0.007694244384765625, -0.006398677825927734, -0.005103111267089844, -0.003807544708251953, -0.0025119781494140625, -0.0012164115905761719, 7.915496826171875e-05, 0.0013747215270996094, 0.0026702880859375, 0.003965854644775391, 0.005261421203613281, 0.006556987762451172, 0.007852554321289062, 0.009148120880126953, 0.010443687438964844, 0.011739253997802734, 0.013034820556640625, 0.014330387115478516, 0.015625953674316406, 0.016921520233154297, 0.018217086791992188, 0.019512653350830078, 0.02080821990966797, 0.02210378646850586, 0.02339935302734375, 0.02469491958618164, 0.02599048614501953, 0.027286052703857422, 0.028581619262695312, 0.029877185821533203, 0.031172752380371094, 0.032468318939208984, 0.033763885498046875, 0.035059452056884766, 0.036355018615722656, 0.03765058517456055, 0.03894615173339844, 0.04024171829223633, 0.04153728485107422, 0.04283285140991211, 0.04412841796875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 1.0, 4.0, 4.0, 5.0, 6.0, 10.0, 11.0, 15.0, 19.0, 27.0, 32.0, 29.0, 40.0, 57.0, 394.0, 87.0, 55.0, 45.0, 27.0, 19.0, 22.0, 15.0, 15.0, 15.0, 6.0, 8.0, 7.0, 6.0, 2.0, 2.0, 5.0, 3.0, 5.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0204620361328125, -0.019802093505859375, -0.01914215087890625, -0.018482208251953125, -0.017822265625, -0.017162322998046875, -0.01650238037109375, -0.015842437744140625, -0.0151824951171875, -0.014522552490234375, -0.01386260986328125, -0.013202667236328125, -0.012542724609375, -0.011882781982421875, -0.01122283935546875, -0.010562896728515625, -0.0099029541015625, -0.009243011474609375, -0.00858306884765625, -0.007923126220703125, -0.00726318359375, -0.006603240966796875, -0.00594329833984375, -0.005283355712890625, -0.0046234130859375, -0.003963470458984375, -0.00330352783203125, -0.002643585205078125, -0.001983642578125, -0.001323699951171875, -0.00066375732421875, -3.814697265625e-06, 0.0006561279296875, 0.001316070556640625, 0.00197601318359375, 0.002635955810546875, 0.0032958984375, 0.003955841064453125, 0.00461578369140625, 0.005275726318359375, 0.0059356689453125, 0.006595611572265625, 0.00725555419921875, 0.007915496826171875, 0.008575439453125, 0.009235382080078125, 0.00989532470703125, 0.010555267333984375, 0.0112152099609375, 0.011875152587890625, 0.01253509521484375, 0.013195037841796875, 0.01385498046875, 0.014514923095703125, 0.01517486572265625, 0.015834808349609375, 0.0164947509765625, 0.017154693603515625, 0.01781463623046875, 0.018474578857421875, 0.019134521484375, 0.019794464111328125, 0.02045440673828125, 0.021114349365234375, 0.0217742919921875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 7.0, 5.0, 5.0, 10.0, 19.0, 31.0, 48.0, 80.0, 120.0, 214.0, 571.0, 1459.0, 4465.0, 18442.0, 125084.0, 3660554.0, 334354.0, 36554.0, 8262.0, 2415.0, 832.0, 314.0, 174.0, 72.0, 60.0, 36.0, 32.0, 29.0, 12.0, 11.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0594482421875, -0.05773353576660156, -0.056018829345703125, -0.05430412292480469, -0.05258941650390625, -0.05087471008300781, -0.049160003662109375, -0.04744529724121094, -0.0457305908203125, -0.04401588439941406, -0.042301177978515625, -0.04058647155761719, -0.03887176513671875, -0.03715705871582031, -0.035442352294921875, -0.03372764587402344, -0.032012939453125, -0.030298233032226562, -0.028583526611328125, -0.026868820190429688, -0.02515411376953125, -0.023439407348632812, -0.021724700927734375, -0.020009994506835938, -0.0182952880859375, -0.016580581665039062, -0.014865875244140625, -0.013151168823242188, -0.01143646240234375, -0.009721755981445312, -0.008007049560546875, -0.0062923431396484375, -0.00457763671875, -0.0028629302978515625, -0.001148223876953125, 0.0005664825439453125, 0.00228118896484375, 0.0039958953857421875, 0.005710601806640625, 0.0074253082275390625, 0.0091400146484375, 0.010854721069335938, 0.012569427490234375, 0.014284133911132812, 0.01599884033203125, 0.017713546752929688, 0.019428253173828125, 0.021142959594726562, 0.022857666015625, 0.024572372436523438, 0.026287078857421875, 0.028001785278320312, 0.02971649169921875, 0.03143119812011719, 0.033145904541015625, 0.03486061096191406, 0.0365753173828125, 0.03829002380371094, 0.040004730224609375, 0.04171943664550781, 0.04343414306640625, 0.04514884948730469, 0.046863555908203125, 0.04857826232910156, 0.05029296875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 4.0, 3.0, 7.0, 9.0, 7.0, 10.0, 17.0, 25.0, 27.0, 39.0, 68.0, 61.0, 119.0, 216.0, 537.0, 1313.0, 746.0, 312.0, 149.0, 108.0, 61.0, 49.0, 35.0, 20.0, 24.0, 27.0, 13.0, 14.0, 9.0, 15.0, 8.0, 5.0, 4.0, 10.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0191802978515625, -0.018611431121826172, -0.018042564392089844, -0.017473697662353516, -0.016904830932617188, -0.01633596420288086, -0.01576709747314453, -0.015198230743408203, -0.014629364013671875, -0.014060497283935547, -0.013491630554199219, -0.01292276382446289, -0.012353897094726562, -0.011785030364990234, -0.011216163635253906, -0.010647296905517578, -0.01007843017578125, -0.009509563446044922, -0.008940696716308594, -0.008371829986572266, -0.0078029632568359375, -0.007234096527099609, -0.006665229797363281, -0.006096363067626953, -0.005527496337890625, -0.004958629608154297, -0.004389762878417969, -0.0038208961486816406, -0.0032520294189453125, -0.0026831626892089844, -0.0021142959594726562, -0.0015454292297363281, -0.0009765625, -0.0004076957702636719, 0.00016117095947265625, 0.0007300376892089844, 0.0012989044189453125, 0.0018677711486816406, 0.0024366378784179688, 0.003005504608154297, 0.003574371337890625, 0.004143238067626953, 0.004712104797363281, 0.005280971527099609, 0.0058498382568359375, 0.006418704986572266, 0.006987571716308594, 0.007556438446044922, 0.00812530517578125, 0.008694171905517578, 0.009263038635253906, 0.009831905364990234, 0.010400772094726562, 0.01096963882446289, 0.011538505554199219, 0.012107372283935547, 0.012676239013671875, 0.013245105743408203, 0.013813972473144531, 0.01438283920288086, 0.014951705932617188, 0.015520572662353516, 0.016089439392089844, 0.016658306121826172, 0.0172271728515625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 5.0, 40.0, 402.0, 481.0, 61.0, 10.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06465546041727066, -0.05390220135450363, -0.0431489422917366, -0.032395679503679276, -0.021642420440912247, -0.010889161378145218, -0.00013589859008789062, 0.010617360472679138, 0.021370619535446167, 0.032123878598213196, 0.042877137660980225, 0.05363040044903755, 0.06438365578651428, 0.07513691484928131, 0.08589018136262894, 0.09664344042539597, 0.107396699488163, 0.11814995855093002, 0.12890322506427765, 0.13965648412704468, 0.1504097431898117, 0.16116300225257874, 0.17191626131534576, 0.1826695203781128, 0.19342277944087982, 0.20417603850364685, 0.21492929756641388, 0.2256825566291809, 0.23643581569194794, 0.24718907475471497, 0.2579423487186432, 0.268695592880249, 0.27944883704185486, 0.2902021110057831, 0.3009553551673889, 0.31170862913131714, 0.322461873292923, 0.3332151472568512, 0.34396839141845703, 0.35472166538238525, 0.3654749095439911, 0.3762281835079193, 0.38698142766952515, 0.39773470163345337, 0.4084879457950592, 0.4192412197589874, 0.42999446392059326, 0.4407477378845215, 0.4515010118484497, 0.46225428581237793, 0.47300752997398376, 0.483760803937912, 0.4945140480995178, 0.505267322063446, 0.5160205960273743, 0.5267738103866577, 0.5375270843505859, 0.5482803583145142, 0.5590336322784424, 0.5697868466377258, 0.580540120601654, 0.5912933945655823, 0.6020466685295105, 0.612799882888794, 0.6235531568527222]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 0.0, 1.0, 4.0, 11.0, 3.0, 3.0, 9.0, 13.0, 15.0, 12.0, 19.0, 21.0, 30.0, 25.0, 38.0, 41.0, 73.0, 52.0, 55.0, 52.0, 59.0, 51.0, 50.0, 48.0, 50.0, 51.0, 49.0, 31.0, 32.0, 25.0, 22.0, 19.0, 20.0, 5.0, 8.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.09513932466506958, -0.0924723893404007, -0.08980545401573181, -0.08713851869106293, -0.08447158336639404, -0.08180464804172516, -0.07913771271705627, -0.07647077739238739, -0.0738038420677185, -0.07113690674304962, -0.06846997141838074, -0.06580303609371185, -0.06313610076904297, -0.060469165444374084, -0.0578022301197052, -0.055135294795036316, -0.05246835947036743, -0.04980142414569855, -0.04713448882102966, -0.04446755349636078, -0.041800618171691895, -0.03913368284702301, -0.036466747522354126, -0.03379981219768524, -0.031132876873016357, -0.028465941548347473, -0.02579900622367859, -0.023132070899009705, -0.02046513557434082, -0.017798200249671936, -0.015131264925003052, -0.012464329600334167, -0.009797394275665283, -0.007130458950996399, -0.004463523626327515, -0.0017965883016586304, 0.0008703470230102539, 0.003537282347679138, 0.0062042176723480225, 0.008871152997016907, 0.011538088321685791, 0.014205023646354675, 0.01687195897102356, 0.019538894295692444, 0.022205829620361328, 0.024872764945030212, 0.027539700269699097, 0.03020663559436798, 0.032873570919036865, 0.03554050624370575, 0.038207441568374634, 0.04087437689304352, 0.0435413122177124, 0.04620824754238129, 0.04887518286705017, 0.051542118191719055, 0.05420905351638794, 0.056875988841056824, 0.05954292416572571, 0.06220985949039459, 0.06487679481506348, 0.06754373013973236, 0.07021066546440125, 0.07287760078907013, 0.07554453611373901]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 12.0, 13.0, 9.0, 14.0, 27.0, 46.0, 45.0, 75.0, 121.0, 153.0, 244.0, 383.0, 519.0, 765.0, 1279.0, 2027.0, 3212.0, 5691.0, 9989.0, 19980.0, 44920.0, 144195.0, 661855.0, 85401.0, 32294.0, 15261.0, 7942.0, 4417.0, 2774.0, 1731.0, 1101.0, 656.0, 455.0, 349.0, 199.0, 131.0, 86.0, 66.0, 34.0, 26.0, 19.0, 9.0, 8.0, 8.0, 7.0, 1.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0438232421875, -0.04250764846801758, -0.041192054748535156, -0.039876461029052734, -0.03856086730957031, -0.03724527359008789, -0.03592967987060547, -0.03461408615112305, -0.033298492431640625, -0.0319828987121582, -0.03066730499267578, -0.02935171127319336, -0.028036117553710938, -0.026720523834228516, -0.025404930114746094, -0.024089336395263672, -0.02277374267578125, -0.021458148956298828, -0.020142555236816406, -0.018826961517333984, -0.017511367797851562, -0.01619577407836914, -0.014880180358886719, -0.013564586639404297, -0.012248992919921875, -0.010933399200439453, -0.009617805480957031, -0.00830221176147461, -0.0069866180419921875, -0.005671024322509766, -0.004355430603027344, -0.003039836883544922, -0.0017242431640625, -0.0004086494445800781, 0.0009069442749023438, 0.0022225379943847656, 0.0035381317138671875, 0.004853725433349609, 0.006169319152832031, 0.007484912872314453, 0.008800506591796875, 0.010116100311279297, 0.011431694030761719, 0.01274728775024414, 0.014062881469726562, 0.015378475189208984, 0.016694068908691406, 0.018009662628173828, 0.01932525634765625, 0.020640850067138672, 0.021956443786621094, 0.023272037506103516, 0.024587631225585938, 0.02590322494506836, 0.02721881866455078, 0.028534412384033203, 0.029850006103515625, 0.031165599822998047, 0.03248119354248047, 0.03379678726196289, 0.03511238098144531, 0.036427974700927734, 0.037743568420410156, 0.03905916213989258, 0.040374755859375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 4.0, 4.0, 3.0, 2.0, 6.0, 6.0, 6.0, 12.0, 15.0, 22.0, 27.0, 22.0, 33.0, 42.0, 55.0, 252.0, 220.0, 67.0, 41.0, 29.0, 24.0, 18.0, 24.0, 9.0, 19.0, 7.0, 5.0, 9.0, 1.0, 5.0, 3.0, 3.0, 7.0, 4.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020751953125, -0.020085811614990234, -0.01941967010498047, -0.018753528594970703, -0.018087387084960938, -0.017421245574951172, -0.016755104064941406, -0.01608896255493164, -0.015422821044921875, -0.01475667953491211, -0.014090538024902344, -0.013424396514892578, -0.012758255004882812, -0.012092113494873047, -0.011425971984863281, -0.010759830474853516, -0.01009368896484375, -0.009427547454833984, -0.008761405944824219, -0.008095264434814453, -0.0074291229248046875, -0.006762981414794922, -0.006096839904785156, -0.005430698394775391, -0.004764556884765625, -0.004098415374755859, -0.0034322738647460938, -0.002766132354736328, -0.0020999908447265625, -0.0014338493347167969, -0.0007677078247070312, -0.00010156631469726562, 0.0005645751953125, 0.0012307167053222656, 0.0018968582153320312, 0.002562999725341797, 0.0032291412353515625, 0.003895282745361328, 0.004561424255371094, 0.005227565765380859, 0.005893707275390625, 0.006559848785400391, 0.007225990295410156, 0.007892131805419922, 0.008558273315429688, 0.009224414825439453, 0.009890556335449219, 0.010556697845458984, 0.01122283935546875, 0.011888980865478516, 0.012555122375488281, 0.013221263885498047, 0.013887405395507812, 0.014553546905517578, 0.015219688415527344, 0.01588582992553711, 0.016551971435546875, 0.01721811294555664, 0.017884254455566406, 0.018550395965576172, 0.019216537475585938, 0.019882678985595703, 0.02054882049560547, 0.021214962005615234, 0.021881103515625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 1.0, 7.0, 9.0, 12.0, 16.0, 16.0, 24.0, 36.0, 59.0, 89.0, 97.0, 139.0, 231.0, 418.0, 776.0, 1721.0, 5350.0, 22662.0, 150600.0, 694923.0, 141035.0, 21619.0, 5060.0, 1751.0, 759.0, 397.0, 242.0, 137.0, 103.0, 77.0, 49.0, 38.0, 35.0, 21.0, 12.0, 16.0, 9.0, 6.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.057464599609375, -0.05574846267700195, -0.054032325744628906, -0.05231618881225586, -0.05060005187988281, -0.048883914947509766, -0.04716777801513672, -0.04545164108276367, -0.043735504150390625, -0.04201936721801758, -0.04030323028564453, -0.038587093353271484, -0.03687095642089844, -0.03515481948852539, -0.033438682556152344, -0.0317225456237793, -0.03000640869140625, -0.028290271759033203, -0.026574134826660156, -0.02485799789428711, -0.023141860961914062, -0.021425724029541016, -0.01970958709716797, -0.017993450164794922, -0.016277313232421875, -0.014561176300048828, -0.012845039367675781, -0.011128902435302734, -0.009412765502929688, -0.007696628570556641, -0.005980491638183594, -0.004264354705810547, -0.0025482177734375, -0.0008320808410644531, 0.0008840560913085938, 0.0026001930236816406, 0.0043163299560546875, 0.006032466888427734, 0.007748603820800781, 0.009464740753173828, 0.011180877685546875, 0.012897014617919922, 0.014613151550292969, 0.016329288482666016, 0.018045425415039062, 0.01976156234741211, 0.021477699279785156, 0.023193836212158203, 0.02490997314453125, 0.026626110076904297, 0.028342247009277344, 0.03005838394165039, 0.03177452087402344, 0.033490657806396484, 0.03520679473876953, 0.03692293167114258, 0.038639068603515625, 0.04035520553588867, 0.04207134246826172, 0.043787479400634766, 0.04550361633300781, 0.04721975326538086, 0.048935890197753906, 0.05065202713012695, 0.0523681640625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 9.0, 6.0, 10.0, 12.0, 8.0, 16.0, 15.0, 26.0, 25.0, 35.0, 23.0, 41.0, 40.0, 40.0, 48.0, 36.0, 50.0, 56.0, 42.0, 41.0, 57.0, 45.0, 33.0, 32.0, 33.0, 28.0, 29.0, 21.0, 31.0, 21.0, 21.0, 19.0, 13.0, 17.0, 6.0, 8.0, 5.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.08544921875, -0.08315610885620117, -0.08086299896240234, -0.07856988906860352, -0.07627677917480469, -0.07398366928100586, -0.07169055938720703, -0.0693974494934082, -0.06710433959960938, -0.06481122970581055, -0.06251811981201172, -0.06022500991821289, -0.05793190002441406, -0.055638790130615234, -0.053345680236816406, -0.05105257034301758, -0.04875946044921875, -0.04646635055541992, -0.044173240661621094, -0.041880130767822266, -0.03958702087402344, -0.03729391098022461, -0.03500080108642578, -0.03270769119262695, -0.030414581298828125, -0.028121471405029297, -0.02582836151123047, -0.02353525161743164, -0.021242141723632812, -0.018949031829833984, -0.016655921936035156, -0.014362812042236328, -0.0120697021484375, -0.009776592254638672, -0.007483482360839844, -0.005190372467041016, -0.0028972625732421875, -0.0006041526794433594, 0.0016889572143554688, 0.003982067108154297, 0.006275177001953125, 0.008568286895751953, 0.010861396789550781, 0.01315450668334961, 0.015447616577148438, 0.017740726470947266, 0.020033836364746094, 0.022326946258544922, 0.02462005615234375, 0.026913166046142578, 0.029206275939941406, 0.031499385833740234, 0.03379249572753906, 0.03608560562133789, 0.03837871551513672, 0.04067182540893555, 0.042964935302734375, 0.0452580451965332, 0.04755115509033203, 0.04984426498413086, 0.05213737487792969, 0.054430484771728516, 0.056723594665527344, 0.05901670455932617, 0.061309814453125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 9.0, 20.0, 21.0, 25.0, 79.0, 129.0, 239.0, 556.0, 1603.0, 7862.0, 197388.0, 819547.0, 17024.0, 2608.0, 762.0, 308.0, 170.0, 79.0, 46.0, 26.0, 11.0, 13.0, 8.0, 6.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0316162109375, -0.030601978302001953, -0.029587745666503906, -0.02857351303100586, -0.027559280395507812, -0.026545047760009766, -0.02553081512451172, -0.024516582489013672, -0.023502349853515625, -0.022488117218017578, -0.02147388458251953, -0.020459651947021484, -0.019445419311523438, -0.01843118667602539, -0.017416954040527344, -0.016402721405029297, -0.01538848876953125, -0.014374256134033203, -0.013360023498535156, -0.01234579086303711, -0.011331558227539062, -0.010317325592041016, -0.009303092956542969, -0.008288860321044922, -0.007274627685546875, -0.006260395050048828, -0.005246162414550781, -0.004231929779052734, -0.0032176971435546875, -0.0022034645080566406, -0.0011892318725585938, -0.00017499923706054688, 0.0008392333984375, 0.0018534660339355469, 0.0028676986694335938, 0.0038819313049316406, 0.0048961639404296875, 0.005910396575927734, 0.006924629211425781, 0.007938861846923828, 0.008953094482421875, 0.009967327117919922, 0.010981559753417969, 0.011995792388916016, 0.013010025024414062, 0.01402425765991211, 0.015038490295410156, 0.016052722930908203, 0.01706695556640625, 0.018081188201904297, 0.019095420837402344, 0.02010965347290039, 0.021123886108398438, 0.022138118743896484, 0.02315235137939453, 0.024166584014892578, 0.025180816650390625, 0.026195049285888672, 0.02720928192138672, 0.028223514556884766, 0.029237747192382812, 0.03025197982788086, 0.031266212463378906, 0.03228044509887695, 0.033294677734375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 6.0, 8.0, 13.0, 9.0, 13.0, 21.0, 24.0, 25.0, 30.0, 39.0, 55.0, 60.0, 66.0, 45.0, 71.0, 69.0, 66.0, 63.0, 41.0, 53.0, 48.0, 27.0, 28.0, 30.0, 28.0, 32.0, 10.0, 7.0, 6.0, 9.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1563301086425781e-05, -1.1213123798370361e-05, -1.0862946510314941e-05, -1.0512769222259521e-05, -1.0162591934204102e-05, -9.812414646148682e-06, -9.462237358093262e-06, -9.112060070037842e-06, -8.761882781982422e-06, -8.411705493927002e-06, -8.061528205871582e-06, -7.711350917816162e-06, -7.361173629760742e-06, -7.010996341705322e-06, -6.660819053649902e-06, -6.310641765594482e-06, -5.9604644775390625e-06, -5.610287189483643e-06, -5.260109901428223e-06, -4.909932613372803e-06, -4.559755325317383e-06, -4.209578037261963e-06, -3.859400749206543e-06, -3.509223461151123e-06, -3.159046173095703e-06, -2.808868885040283e-06, -2.4586915969848633e-06, -2.1085143089294434e-06, -1.7583370208740234e-06, -1.4081597328186035e-06, -1.0579824447631836e-06, -7.078051567077637e-07, -3.5762786865234375e-07, -7.450580596923828e-09, 3.427267074584961e-07, 6.92903995513916e-07, 1.043081283569336e-06, 1.3932585716247559e-06, 1.7434358596801758e-06, 2.0936131477355957e-06, 2.4437904357910156e-06, 2.7939677238464355e-06, 3.1441450119018555e-06, 3.4943222999572754e-06, 3.844499588012695e-06, 4.194676876068115e-06, 4.544854164123535e-06, 4.895031452178955e-06, 5.245208740234375e-06, 5.595386028289795e-06, 5.945563316345215e-06, 6.295740604400635e-06, 6.645917892456055e-06, 6.996095180511475e-06, 7.3462724685668945e-06, 7.696449756622314e-06, 8.046627044677734e-06, 8.396804332733154e-06, 8.746981620788574e-06, 9.097158908843994e-06, 9.447336196899414e-06, 9.797513484954834e-06, 1.0147690773010254e-05, 1.0497868061065674e-05, 1.0848045349121094e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 3.0, 6.0, 5.0, 6.0, 7.0, 18.0, 26.0, 40.0, 49.0, 89.0, 167.0, 366.0, 780.0, 2370.0, 9471.0, 75666.0, 756400.0, 181316.0, 16377.0, 3431.0, 1056.0, 417.0, 209.0, 113.0, 59.0, 38.0, 24.0, 16.0, 10.0, 6.0, 4.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.02227783203125, -0.021635055541992188, -0.020992279052734375, -0.020349502563476562, -0.01970672607421875, -0.019063949584960938, -0.018421173095703125, -0.017778396606445312, -0.0171356201171875, -0.016492843627929688, -0.015850067138671875, -0.015207290649414062, -0.01456451416015625, -0.013921737670898438, -0.013278961181640625, -0.012636184692382812, -0.011993408203125, -0.011350631713867188, -0.010707855224609375, -0.010065078735351562, -0.00942230224609375, -0.008779525756835938, -0.008136749267578125, -0.0074939727783203125, -0.0068511962890625, -0.0062084197998046875, -0.005565643310546875, -0.0049228668212890625, -0.00428009033203125, -0.0036373138427734375, -0.002994537353515625, -0.0023517608642578125, -0.001708984375, -0.0010662078857421875, -0.000423431396484375, 0.0002193450927734375, 0.00086212158203125, 0.0015048980712890625, 0.002147674560546875, 0.0027904510498046875, 0.0034332275390625, 0.0040760040283203125, 0.004718780517578125, 0.0053615570068359375, 0.00600433349609375, 0.0066471099853515625, 0.007289886474609375, 0.007932662963867188, 0.008575439453125, 0.009218215942382812, 0.009860992431640625, 0.010503768920898438, 0.01114654541015625, 0.011789321899414062, 0.012432098388671875, 0.013074874877929688, 0.0137176513671875, 0.014360427856445312, 0.015003204345703125, 0.015645980834960938, 0.01628875732421875, 0.016931533813476562, 0.017574310302734375, 0.018217086791992188, 0.01885986328125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 3.0, 11.0, 12.0, 11.0, 15.0, 17.0, 34.0, 41.0, 78.0, 73.0, 108.0, 106.0, 97.0, 87.0, 73.0, 66.0, 48.0, 38.0, 30.0, 18.0, 13.0, 6.0, 8.0, 2.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.024169921875, -0.0234830379486084, -0.022796154022216797, -0.022109270095825195, -0.021422386169433594, -0.020735502243041992, -0.02004861831665039, -0.01936173439025879, -0.018674850463867188, -0.017987966537475586, -0.017301082611083984, -0.016614198684692383, -0.01592731475830078, -0.01524043083190918, -0.014553546905517578, -0.013866662979125977, -0.013179779052734375, -0.012492895126342773, -0.011806011199951172, -0.01111912727355957, -0.010432243347167969, -0.009745359420776367, -0.009058475494384766, -0.008371591567993164, -0.0076847076416015625, -0.006997823715209961, -0.006310939788818359, -0.005624055862426758, -0.004937171936035156, -0.004250288009643555, -0.003563404083251953, -0.0028765201568603516, -0.00218963623046875, -0.0015027523040771484, -0.0008158683776855469, -0.0001289844512939453, 0.0005578994750976562, 0.0012447834014892578, 0.0019316673278808594, 0.002618551254272461, 0.0033054351806640625, 0.003992319107055664, 0.004679203033447266, 0.005366086959838867, 0.006052970886230469, 0.00673985481262207, 0.007426738739013672, 0.008113622665405273, 0.008800506591796875, 0.009487390518188477, 0.010174274444580078, 0.01086115837097168, 0.011548042297363281, 0.012234926223754883, 0.012921810150146484, 0.013608694076538086, 0.014295578002929688, 0.014982461929321289, 0.01566934585571289, 0.016356229782104492, 0.017043113708496094, 0.017729997634887695, 0.018416881561279297, 0.0191037654876709, 0.0197906494140625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [2.0, 13.0, 31.0, 395.0, 538.0, 31.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20775380730628967, -0.15670248866081238, -0.10565116256475449, -0.054599836468696594, -0.0035485178232192993, 0.04750281572341919, 0.09855413436889648, 0.14960545301437378, 0.20065677165985107, 0.25170809030532837, 0.30275940895080566, 0.35381072759628296, 0.40486204624176025, 0.45591339468955994, 0.5069646835327148, 0.5580160617828369, 0.6090673208236694, 0.6601186394691467, 0.711169958114624, 0.7622212767601013, 0.8132725954055786, 0.8643239736557007, 0.9153752326965332, 0.9664266109466553, 1.0174779891967773, 1.0685293674468994, 1.119580626487732, 1.170632004737854, 1.2216832637786865, 1.2727346420288086, 1.3237859010696411, 1.3748372793197632, 1.4258884191513062, 1.4769397974014282, 1.5279910564422607, 1.5790424346923828, 1.6300936937332153, 1.6811450719833374, 1.73219633102417, 1.783247709274292, 1.8342989683151245, 1.8853503465652466, 1.936401605606079, 1.9874529838562012, 2.0385043621063232, 2.089555501937866, 2.1406068801879883, 2.1916582584381104, 2.2427096366882324, 2.2937610149383545, 2.3448123931884766, 2.3958635330200195, 2.4469149112701416, 2.4979662895202637, 2.5490176677703857, 2.6000688076019287, 2.651120185852051, 2.702171564102173, 2.753222942352295, 2.804274082183838, 2.85532546043396, 2.906376838684082, 2.957428216934204, 3.008479356765747, 3.059530735015869]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 8.0, 1.0, 4.0, 3.0, 7.0, 9.0, 9.0, 7.0, 8.0, 9.0, 14.0, 32.0, 48.0, 102.0, 110.0, 167.0, 153.0, 127.0, 69.0, 36.0, 18.0, 19.0, 6.0, 5.0, 2.0, 4.0, 3.0, 4.0, 3.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4588866233825684, -1.418999433517456, -1.3791122436523438, -1.3392250537872314, -1.2993378639221191, -1.2594506740570068, -1.2195634841918945, -1.1796762943267822, -1.13978910446167, -1.0999019145965576, -1.0600147247314453, -1.020127534866333, -0.9802403450012207, -0.9403531551361084, -0.9004659652709961, -0.8605787754058838, -0.8206915855407715, -0.7808043956756592, -0.7409172058105469, -0.7010300159454346, -0.6611428260803223, -0.62125563621521, -0.5813684463500977, -0.5414812564849854, -0.501594066619873, -0.46170687675476074, -0.42181968688964844, -0.38193249702453613, -0.34204530715942383, -0.3021581172943115, -0.2622709274291992, -0.22238373756408691, -0.1824965476989746, -0.1426093578338623, -0.10272216796875, -0.0628349781036377, -0.02294778823852539, 0.016939401626586914, 0.05682659149169922, 0.09671378135681152, 0.13660097122192383, 0.17648816108703613, 0.21637535095214844, 0.25626254081726074, 0.29614973068237305, 0.33603692054748535, 0.37592411041259766, 0.41581130027770996, 0.45569849014282227, 0.49558568000793457, 0.5354728698730469, 0.5753600597381592, 0.6152472496032715, 0.6551344394683838, 0.6950216293334961, 0.7349088191986084, 0.7747960090637207, 0.814683198928833, 0.8545703887939453, 0.8944575786590576, 0.9343447685241699, 0.9742319583892822, 1.0141191482543945, 1.0540063381195068, 1.0938935279846191]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 8.0, 9.0, 19.0, 21.0, 25.0, 40.0, 46.0, 85.0, 103.0, 184.0, 236.0, 368.0, 568.0, 887.0, 1470.0, 2372.0, 4193.0, 7981.0, 16318.0, 43379.0, 255070.0, 3706340.0, 100439.0, 27748.0, 11918.0, 6051.0, 3261.0, 1913.0, 1148.0, 662.0, 508.0, 324.0, 195.0, 125.0, 67.0, 64.0, 40.0, 32.0, 25.0, 13.0, 10.0, 7.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.098388671875, -0.09534263610839844, -0.09229660034179688, -0.08925056457519531, -0.08620452880859375, -0.08315849304199219, -0.08011245727539062, -0.07706642150878906, -0.0740203857421875, -0.07097434997558594, -0.06792831420898438, -0.06488227844238281, -0.06183624267578125, -0.05879020690917969, -0.055744171142578125, -0.05269813537597656, -0.049652099609375, -0.04660606384277344, -0.043560028076171875, -0.04051399230957031, -0.03746795654296875, -0.03442192077636719, -0.031375885009765625, -0.028329849243164062, -0.0252838134765625, -0.022237777709960938, -0.019191741943359375, -0.016145706176757812, -0.01309967041015625, -0.010053634643554688, -0.007007598876953125, -0.0039615631103515625, -0.00091552734375, 0.0021305084228515625, 0.005176544189453125, 0.008222579956054688, 0.01126861572265625, 0.014314651489257812, 0.017360687255859375, 0.020406723022460938, 0.0234527587890625, 0.026498794555664062, 0.029544830322265625, 0.03259086608886719, 0.03563690185546875, 0.03868293762207031, 0.041728973388671875, 0.04477500915527344, 0.047821044921875, 0.05086708068847656, 0.053913116455078125, 0.05695915222167969, 0.06000518798828125, 0.06305122375488281, 0.06609725952148438, 0.06914329528808594, 0.0721893310546875, 0.07523536682128906, 0.07828140258789062, 0.08132743835449219, 0.08437347412109375, 0.08741950988769531, 0.09046554565429688, 0.09351158142089844, 0.0965576171875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 7.0, 5.0, 6.0, 7.0, 15.0, 13.0, 15.0, 27.0, 22.0, 25.0, 36.0, 43.0, 81.0, 182.0, 191.0, 96.0, 41.0, 34.0, 33.0, 17.0, 18.0, 17.0, 12.0, 17.0, 5.0, 8.0, 6.0, 8.0, 4.0, 2.0, 1.0, 2.0, 0.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0208587646484375, -0.0203096866607666, -0.019760608673095703, -0.019211530685424805, -0.018662452697753906, -0.018113374710083008, -0.01756429672241211, -0.01701521873474121, -0.016466140747070312, -0.015917062759399414, -0.015367984771728516, -0.014818906784057617, -0.014269828796386719, -0.01372075080871582, -0.013171672821044922, -0.012622594833374023, -0.012073516845703125, -0.011524438858032227, -0.010975360870361328, -0.01042628288269043, -0.009877204895019531, -0.009328126907348633, -0.008779048919677734, -0.008229970932006836, -0.0076808929443359375, -0.007131814956665039, -0.006582736968994141, -0.006033658981323242, -0.005484580993652344, -0.004935503005981445, -0.004386425018310547, -0.0038373470306396484, -0.00328826904296875, -0.0027391910552978516, -0.002190113067626953, -0.0016410350799560547, -0.0010919570922851562, -0.0005428791046142578, 6.198883056640625e-06, 0.0005552768707275391, 0.0011043548583984375, 0.001653432846069336, 0.0022025108337402344, 0.002751588821411133, 0.0033006668090820312, 0.0038497447967529297, 0.004398822784423828, 0.0049479007720947266, 0.005496978759765625, 0.0060460567474365234, 0.006595134735107422, 0.00714421272277832, 0.007693290710449219, 0.008242368698120117, 0.008791446685791016, 0.009340524673461914, 0.009889602661132812, 0.010438680648803711, 0.01098775863647461, 0.011536836624145508, 0.012085914611816406, 0.012634992599487305, 0.013184070587158203, 0.013733148574829102, 0.0142822265625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 5.0, 1.0, 3.0, 4.0, 5.0, 8.0, 16.0, 13.0, 13.0, 22.0, 40.0, 48.0, 78.0, 125.0, 220.0, 389.0, 668.0, 1433.0, 3366.0, 8682.0, 26489.0, 111000.0, 3259480.0, 680511.0, 70604.0, 19197.0, 6634.0, 2682.0, 1128.0, 593.0, 290.0, 204.0, 115.0, 65.0, 51.0, 33.0, 22.0, 12.0, 10.0, 7.0, 3.0, 8.0, 4.0, 0.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09619140625, -0.09317207336425781, -0.09015274047851562, -0.08713340759277344, -0.08411407470703125, -0.08109474182128906, -0.07807540893554688, -0.07505607604980469, -0.0720367431640625, -0.06901741027832031, -0.06599807739257812, -0.06297874450683594, -0.05995941162109375, -0.05694007873535156, -0.053920745849609375, -0.05090141296386719, -0.047882080078125, -0.04486274719238281, -0.041843414306640625, -0.03882408142089844, -0.03580474853515625, -0.03278541564941406, -0.029766082763671875, -0.026746749877929688, -0.0237274169921875, -0.020708084106445312, -0.017688751220703125, -0.014669418334960938, -0.01165008544921875, -0.008630752563476562, -0.005611419677734375, -0.0025920867919921875, 0.00042724609375, 0.0034465789794921875, 0.006465911865234375, 0.009485244750976562, 0.01250457763671875, 0.015523910522460938, 0.018543243408203125, 0.021562576293945312, 0.0245819091796875, 0.027601242065429688, 0.030620574951171875, 0.03363990783691406, 0.03665924072265625, 0.03967857360839844, 0.042697906494140625, 0.04571723937988281, 0.048736572265625, 0.05175590515136719, 0.054775238037109375, 0.05779457092285156, 0.06081390380859375, 0.06383323669433594, 0.06685256958007812, 0.06987190246582031, 0.0728912353515625, 0.07591056823730469, 0.07892990112304688, 0.08194923400878906, 0.08496856689453125, 0.08798789978027344, 0.09100723266601562, 0.09402656555175781, 0.0970458984375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 5.0, 2.0, 14.0, 9.0, 13.0, 15.0, 16.0, 28.0, 53.0, 58.0, 82.0, 136.0, 251.0, 629.0, 1837.0, 365.0, 172.0, 107.0, 65.0, 52.0, 37.0, 25.0, 21.0, 17.0, 14.0, 10.0, 8.0, 4.0, 3.0, 6.0, 7.0, 2.0, 0.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0224151611328125, -0.021828889846801758, -0.021242618560791016, -0.020656347274780273, -0.02007007598876953, -0.01948380470275879, -0.018897533416748047, -0.018311262130737305, -0.017724990844726562, -0.01713871955871582, -0.016552448272705078, -0.015966176986694336, -0.015379905700683594, -0.014793634414672852, -0.01420736312866211, -0.013621091842651367, -0.013034820556640625, -0.012448549270629883, -0.01186227798461914, -0.011276006698608398, -0.010689735412597656, -0.010103464126586914, -0.009517192840576172, -0.00893092155456543, -0.008344650268554688, -0.007758378982543945, -0.007172107696533203, -0.006585836410522461, -0.005999565124511719, -0.0054132938385009766, -0.004827022552490234, -0.004240751266479492, -0.00365447998046875, -0.003068208694458008, -0.0024819374084472656, -0.0018956661224365234, -0.0013093948364257812, -0.0007231235504150391, -0.00013685226440429688, 0.0004494190216064453, 0.0010356903076171875, 0.0016219615936279297, 0.002208232879638672, 0.002794504165649414, 0.0033807754516601562, 0.0039670467376708984, 0.004553318023681641, 0.005139589309692383, 0.005725860595703125, 0.006312131881713867, 0.006898403167724609, 0.0074846744537353516, 0.008070945739746094, 0.008657217025756836, 0.009243488311767578, 0.00982975959777832, 0.010416030883789062, 0.011002302169799805, 0.011588573455810547, 0.012174844741821289, 0.012761116027832031, 0.013347387313842773, 0.013933658599853516, 0.014519929885864258, 0.015106201171875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 32.0, 142.0, 435.0, 303.0, 68.0, 19.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08249970525503159, -0.07544651627540588, -0.06839332729578018, -0.06134013831615448, -0.05428694933652878, -0.047233764082193375, -0.04018057510256767, -0.03312738612294197, -0.02607419714331627, -0.019021008163690567, -0.01196782011538744, -0.0049146320670843124, 0.0021385569125413895, 0.009191744029521942, 0.016244933009147644, 0.023298121988773346, 0.030351310968399048, 0.03740449994802475, 0.04445768892765045, 0.051510877907276154, 0.058564066886901855, 0.06561724841594696, 0.07267044484615326, 0.07972362637519836, 0.08677682280540466, 0.09383001178503036, 0.10088320076465607, 0.10793638974428177, 0.11498957872390747, 0.12204276025295258, 0.12909595668315887, 0.13614913821220398, 0.14320231974124908, 0.1502555012702942, 0.1573086977005005, 0.1643618792295456, 0.1714150756597519, 0.178468257188797, 0.1855214536190033, 0.1925746351480484, 0.1996278315782547, 0.2066810131072998, 0.2137342095375061, 0.2207873910665512, 0.2278405874967575, 0.2348937690258026, 0.2419469654560089, 0.24900014698505402, 0.2560533285140991, 0.2631065249443054, 0.27015969157218933, 0.27721288800239563, 0.28426608443260193, 0.2913192808628082, 0.29837244749069214, 0.30542564392089844, 0.31247884035110474, 0.31953203678131104, 0.32658520340919495, 0.33363839983940125, 0.34069159626960754, 0.34774479269981384, 0.35479795932769775, 0.36185115575790405, 0.36890435218811035]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 10.0, 6.0, 9.0, 16.0, 13.0, 19.0, 25.0, 35.0, 51.0, 49.0, 75.0, 57.0, 77.0, 86.0, 77.0, 76.0, 59.0, 53.0, 33.0, 35.0, 28.0, 25.0, 10.0, 21.0, 11.0, 4.0, 8.0, 6.0, 5.0, 4.0, 4.0, 2.0, 0.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.08272719383239746, -0.08022410422563553, -0.0777210146188736, -0.07521792501211166, -0.07271483540534973, -0.0702117532491684, -0.06770866364240646, -0.06520557403564453, -0.0627024844288826, -0.060199394822120667, -0.057696305215358734, -0.0551932193338871, -0.05269012972712517, -0.050187040120363235, -0.0476839542388916, -0.04518086463212967, -0.04267777502536774, -0.040174685418605804, -0.03767159581184387, -0.03516850993037224, -0.032665420323610306, -0.030162330716848373, -0.02765924297273159, -0.025156155228614807, -0.022653065621852875, -0.020149976015090942, -0.01764688827097416, -0.015143799595534801, -0.012640710920095444, -0.010137622244656086, -0.007634533569216728, -0.005131445825099945, -0.0026283562183380127, -0.00012526754289865494, 0.002377821132540703, 0.004880909807980061, 0.007383998483419418, 0.009887087158858776, 0.012390175834298134, 0.014893263578414917, 0.01739635318517685, 0.019899442791938782, 0.022402530536055565, 0.024905618280172348, 0.02740870788693428, 0.029911797493696213, 0.03241488337516785, 0.03491797298192978, 0.03742106258869171, 0.039924152195453644, 0.042427241802215576, 0.04493032768368721, 0.04743341729044914, 0.049936506897211075, 0.05243959277868271, 0.05494268238544464, 0.057445771992206573, 0.059948861598968506, 0.06245195120573044, 0.06495504081249237, 0.0674581229686737, 0.06996121257543564, 0.07246430218219757, 0.0749673917889595, 0.07747048139572144]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 5.0, 2.0, 3.0, 10.0, 8.0, 17.0, 13.0, 24.0, 43.0, 44.0, 78.0, 126.0, 204.0, 336.0, 537.0, 997.0, 1892.0, 3656.0, 8401.0, 21395.0, 73443.0, 622629.0, 240371.0, 46349.0, 15355.0, 6187.0, 2935.0, 1409.0, 781.0, 499.0, 287.0, 186.0, 108.0, 70.0, 48.0, 40.0, 13.0, 13.0, 16.0, 14.0, 9.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11676025390625, -0.11350154876708984, -0.11024284362792969, -0.10698413848876953, -0.10372543334960938, -0.10046672821044922, -0.09720802307128906, -0.0939493179321289, -0.09069061279296875, -0.0874319076538086, -0.08417320251464844, -0.08091449737548828, -0.07765579223632812, -0.07439708709716797, -0.07113838195800781, -0.06787967681884766, -0.0646209716796875, -0.061362266540527344, -0.05810356140136719, -0.05484485626220703, -0.051586151123046875, -0.04832744598388672, -0.04506874084472656, -0.041810035705566406, -0.03855133056640625, -0.035292625427246094, -0.03203392028808594, -0.02877521514892578, -0.025516510009765625, -0.02225780487060547, -0.018999099731445312, -0.015740394592285156, -0.012481689453125, -0.009222984313964844, -0.0059642791748046875, -0.0027055740356445312, 0.000553131103515625, 0.0038118362426757812, 0.0070705413818359375, 0.010329246520996094, 0.01358795166015625, 0.016846656799316406, 0.020105361938476562, 0.02336406707763672, 0.026622772216796875, 0.02988147735595703, 0.03314018249511719, 0.036398887634277344, 0.0396575927734375, 0.042916297912597656, 0.04617500305175781, 0.04943370819091797, 0.052692413330078125, 0.05595111846923828, 0.05920982360839844, 0.062468528747558594, 0.06572723388671875, 0.0689859390258789, 0.07224464416503906, 0.07550334930419922, 0.07876205444335938, 0.08202075958251953, 0.08527946472167969, 0.08853816986083984, 0.091796875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 2.0, 4.0, 7.0, 5.0, 7.0, 14.0, 17.0, 11.0, 24.0, 26.0, 39.0, 26.0, 55.0, 113.0, 176.0, 151.0, 84.0, 44.0, 36.0, 32.0, 26.0, 13.0, 19.0, 8.0, 18.0, 12.0, 2.0, 9.0, 3.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.0210418701171875, -0.020514369010925293, -0.019986867904663086, -0.01945936679840088, -0.018931865692138672, -0.018404364585876465, -0.017876863479614258, -0.01734936237335205, -0.016821861267089844, -0.016294360160827637, -0.01576685905456543, -0.015239357948303223, -0.014711856842041016, -0.014184355735778809, -0.013656854629516602, -0.013129353523254395, -0.012601852416992188, -0.01207435131072998, -0.011546850204467773, -0.011019349098205566, -0.01049184799194336, -0.009964346885681152, -0.009436845779418945, -0.008909344673156738, -0.008381843566894531, -0.007854342460632324, -0.007326841354370117, -0.00679934024810791, -0.006271839141845703, -0.005744338035583496, -0.005216836929321289, -0.004689335823059082, -0.004161834716796875, -0.003634333610534668, -0.003106832504272461, -0.002579331398010254, -0.002051830291748047, -0.0015243291854858398, -0.0009968280792236328, -0.0004693269729614258, 5.817413330078125e-05, 0.0005856752395629883, 0.0011131763458251953, 0.0016406774520874023, 0.0021681785583496094, 0.0026956796646118164, 0.0032231807708740234, 0.0037506818771362305, 0.0042781829833984375, 0.0048056840896606445, 0.0053331851959228516, 0.005860686302185059, 0.006388187408447266, 0.006915688514709473, 0.00744318962097168, 0.007970690727233887, 0.008498191833496094, 0.0090256929397583, 0.009553194046020508, 0.010080695152282715, 0.010608196258544922, 0.011135697364807129, 0.011663198471069336, 0.012190699577331543, 0.01271820068359375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 9.0, 2.0, 7.0, 13.0, 22.0, 21.0, 36.0, 66.0, 88.0, 196.0, 501.0, 2216.0, 15803.0, 485391.0, 525182.0, 15805.0, 2199.0, 526.0, 197.0, 82.0, 64.0, 28.0, 28.0, 16.0, 5.0, 8.0, 8.0, 3.0, 2.0, 5.0, 4.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.1575927734375, -0.1530914306640625, -0.148590087890625, -0.1440887451171875, -0.13958740234375, -0.1350860595703125, -0.130584716796875, -0.1260833740234375, -0.12158203125, -0.1170806884765625, -0.112579345703125, -0.1080780029296875, -0.10357666015625, -0.0990753173828125, -0.094573974609375, -0.0900726318359375, -0.0855712890625, -0.0810699462890625, -0.076568603515625, -0.0720672607421875, -0.06756591796875, -0.0630645751953125, -0.058563232421875, -0.0540618896484375, -0.049560546875, -0.0450592041015625, -0.040557861328125, -0.0360565185546875, -0.03155517578125, -0.0270538330078125, -0.022552490234375, -0.0180511474609375, -0.0135498046875, -0.0090484619140625, -0.004547119140625, -4.57763671875e-05, 0.00445556640625, 0.0089569091796875, 0.013458251953125, 0.0179595947265625, 0.0224609375, 0.0269622802734375, 0.031463623046875, 0.0359649658203125, 0.04046630859375, 0.0449676513671875, 0.049468994140625, 0.0539703369140625, 0.0584716796875, 0.0629730224609375, 0.067474365234375, 0.0719757080078125, 0.07647705078125, 0.0809783935546875, 0.085479736328125, 0.0899810791015625, 0.094482421875, 0.0989837646484375, 0.103485107421875, 0.1079864501953125, 0.11248779296875, 0.1169891357421875, 0.121490478515625, 0.1259918212890625, 0.1304931640625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 10.0, 6.0, 7.0, 5.0, 8.0, 18.0, 19.0, 14.0, 23.0, 21.0, 28.0, 32.0, 40.0, 42.0, 56.0, 46.0, 49.0, 46.0, 55.0, 44.0, 35.0, 49.0, 57.0, 38.0, 34.0, 42.0, 25.0, 31.0, 25.0, 16.0, 19.0, 12.0, 10.0, 12.0, 4.0, 7.0, 7.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.05364990234375, -0.052046775817871094, -0.05044364929199219, -0.04884052276611328, -0.047237396240234375, -0.04563426971435547, -0.04403114318847656, -0.042428016662597656, -0.04082489013671875, -0.039221763610839844, -0.03761863708496094, -0.03601551055908203, -0.034412384033203125, -0.03280925750732422, -0.031206130981445312, -0.029603004455566406, -0.0279998779296875, -0.026396751403808594, -0.024793624877929688, -0.02319049835205078, -0.021587371826171875, -0.01998424530029297, -0.018381118774414062, -0.016777992248535156, -0.01517486572265625, -0.013571739196777344, -0.011968612670898438, -0.010365486145019531, -0.008762359619140625, -0.007159233093261719, -0.0055561065673828125, -0.003952980041503906, -0.002349853515625, -0.0007467269897460938, 0.0008563995361328125, 0.0024595260620117188, 0.004062652587890625, 0.005665779113769531, 0.0072689056396484375, 0.008872032165527344, 0.01047515869140625, 0.012078285217285156, 0.013681411743164062, 0.015284538269042969, 0.016887664794921875, 0.01849079132080078, 0.020093917846679688, 0.021697044372558594, 0.0233001708984375, 0.024903297424316406, 0.026506423950195312, 0.02810955047607422, 0.029712677001953125, 0.03131580352783203, 0.03291893005371094, 0.034522056579589844, 0.03612518310546875, 0.037728309631347656, 0.03933143615722656, 0.04093456268310547, 0.042537689208984375, 0.04414081573486328, 0.04574394226074219, 0.047347068786621094, 0.0489501953125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 7.0, 13.0, 25.0, 78.0, 554.0, 616227.0, 430949.0, 562.0, 82.0, 33.0, 15.0, 3.0, 3.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4658203125, -0.4538726806640625, -0.441925048828125, -0.4299774169921875, -0.41802978515625, -0.4060821533203125, -0.394134521484375, -0.3821868896484375, -0.3702392578125, -0.3582916259765625, -0.346343994140625, -0.3343963623046875, -0.32244873046875, -0.3105010986328125, -0.298553466796875, -0.2866058349609375, -0.274658203125, -0.2627105712890625, -0.250762939453125, -0.2388153076171875, -0.22686767578125, -0.2149200439453125, -0.202972412109375, -0.1910247802734375, -0.1790771484375, -0.1671295166015625, -0.155181884765625, -0.1432342529296875, -0.13128662109375, -0.1193389892578125, -0.107391357421875, -0.0954437255859375, -0.08349609375, -0.0715484619140625, -0.059600830078125, -0.0476531982421875, -0.03570556640625, -0.0237579345703125, -0.011810302734375, 0.0001373291015625, 0.0120849609375, 0.0240325927734375, 0.035980224609375, 0.0479278564453125, 0.05987548828125, 0.0718231201171875, 0.083770751953125, 0.0957183837890625, 0.107666015625, 0.1196136474609375, 0.131561279296875, 0.1435089111328125, 0.15545654296875, 0.1674041748046875, 0.179351806640625, 0.1912994384765625, 0.2032470703125, 0.2151947021484375, 0.227142333984375, 0.2390899658203125, 0.25103759765625, 0.2629852294921875, 0.274932861328125, 0.2868804931640625, 0.298828125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 2.0, 5.0, 5.0, 9.0, 17.0, 14.0, 23.0, 34.0, 45.0, 62.0, 70.0, 99.0, 106.0, 121.0, 83.0, 79.0, 57.0, 34.0, 29.0, 25.0, 9.0, 7.0, 10.0, 7.0, 9.0, 6.0, 8.0, 3.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.9981136322021484e-05, -2.8857029974460602e-05, -2.773292362689972e-05, -2.6608817279338837e-05, -2.5484710931777954e-05, -2.436060458421707e-05, -2.323649823665619e-05, -2.2112391889095306e-05, -2.0988285541534424e-05, -1.986417919397354e-05, -1.874007284641266e-05, -1.7615966498851776e-05, -1.6491860151290894e-05, -1.536775380373001e-05, -1.4243647456169128e-05, -1.3119541108608246e-05, -1.1995434761047363e-05, -1.087132841348648e-05, -9.747222065925598e-06, -8.623115718364716e-06, -7.499009370803833e-06, -6.3749030232429504e-06, -5.250796675682068e-06, -4.126690328121185e-06, -3.0025839805603027e-06, -1.8784776329994202e-06, -7.543712854385376e-07, 3.6973506212234497e-07, 1.4938414096832275e-06, 2.61794775724411e-06, 3.7420541048049927e-06, 4.866160452365875e-06, 5.990266799926758e-06, 7.11437314748764e-06, 8.238479495048523e-06, 9.362585842609406e-06, 1.0486692190170288e-05, 1.161079853773117e-05, 1.2734904885292053e-05, 1.3859011232852936e-05, 1.4983117580413818e-05, 1.61072239279747e-05, 1.7231330275535583e-05, 1.8355436623096466e-05, 1.947954297065735e-05, 2.060364931821823e-05, 2.1727755665779114e-05, 2.2851862013339996e-05, 2.397596836090088e-05, 2.510007470846176e-05, 2.6224181056022644e-05, 2.7348287403583527e-05, 2.847239375114441e-05, 2.9596500098705292e-05, 3.0720606446266174e-05, 3.184471279382706e-05, 3.296881914138794e-05, 3.409292548894882e-05, 3.5217031836509705e-05, 3.634113818407059e-05, 3.746524453163147e-05, 3.858935087919235e-05, 3.9713457226753235e-05, 4.083756357431412e-05, 4.1961669921875e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 10.0, 12.0, 28.0, 34.0, 50.0, 107.0, 208.0, 500.0, 1401.0, 5130.0, 38540.0, 842549.0, 145093.0, 10940.0, 2487.0, 795.0, 344.0, 126.0, 69.0, 42.0, 16.0, 15.0, 14.0, 8.0, 9.0, 5.0, 6.0, 2.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09271240234375, -0.08987712860107422, -0.08704185485839844, -0.08420658111572266, -0.08137130737304688, -0.0785360336303711, -0.07570075988769531, -0.07286548614501953, -0.07003021240234375, -0.06719493865966797, -0.06435966491699219, -0.061524391174316406, -0.058689117431640625, -0.055853843688964844, -0.05301856994628906, -0.05018329620361328, -0.0473480224609375, -0.04451274871826172, -0.04167747497558594, -0.038842201232910156, -0.036006927490234375, -0.033171653747558594, -0.030336380004882812, -0.02750110626220703, -0.02466583251953125, -0.02183055877685547, -0.018995285034179688, -0.016160011291503906, -0.013324737548828125, -0.010489463806152344, -0.0076541900634765625, -0.004818916320800781, -0.001983642578125, 0.0008516311645507812, 0.0036869049072265625, 0.006522178649902344, 0.009357452392578125, 0.012192726135253906, 0.015027999877929688, 0.01786327362060547, 0.02069854736328125, 0.02353382110595703, 0.026369094848632812, 0.029204368591308594, 0.032039642333984375, 0.034874916076660156, 0.03771018981933594, 0.04054546356201172, 0.0433807373046875, 0.04621601104736328, 0.04905128479003906, 0.051886558532714844, 0.054721832275390625, 0.057557106018066406, 0.06039237976074219, 0.06322765350341797, 0.06606292724609375, 0.06889820098876953, 0.07173347473144531, 0.0745687484741211, 0.07740402221679688, 0.08023929595947266, 0.08307456970214844, 0.08590984344482422, 0.0887451171875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 8.0, 6.0, 10.0, 16.0, 25.0, 41.0, 67.0, 124.0, 133.0, 173.0, 160.0, 93.0, 51.0, 26.0, 16.0, 12.0, 8.0, 8.0, 4.0, 1.0, 2.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.057373046875, -0.05559873580932617, -0.053824424743652344, -0.052050113677978516, -0.05027580261230469, -0.04850149154663086, -0.04672718048095703, -0.0449528694152832, -0.043178558349609375, -0.04140424728393555, -0.03962993621826172, -0.03785562515258789, -0.03608131408691406, -0.034307003021240234, -0.032532691955566406, -0.030758380889892578, -0.02898406982421875, -0.027209758758544922, -0.025435447692871094, -0.023661136627197266, -0.021886825561523438, -0.02011251449584961, -0.01833820343017578, -0.016563892364501953, -0.014789581298828125, -0.013015270233154297, -0.011240959167480469, -0.00946664810180664, -0.0076923370361328125, -0.005918025970458984, -0.004143714904785156, -0.002369403839111328, -0.0005950927734375, 0.0011792182922363281, 0.0029535293579101562, 0.004727840423583984, 0.0065021514892578125, 0.00827646255493164, 0.010050773620605469, 0.011825084686279297, 0.013599395751953125, 0.015373706817626953, 0.01714801788330078, 0.01892232894897461, 0.020696640014648438, 0.022470951080322266, 0.024245262145996094, 0.026019573211669922, 0.02779388427734375, 0.029568195343017578, 0.031342506408691406, 0.033116817474365234, 0.03489112854003906, 0.03666543960571289, 0.03843975067138672, 0.04021406173706055, 0.041988372802734375, 0.0437626838684082, 0.04553699493408203, 0.04731130599975586, 0.04908561706542969, 0.050859928131103516, 0.052634239196777344, 0.05440855026245117, 0.056182861328125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 7.0, 16.0, 218.0, 732.0, 32.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35238611698150635, -0.2851608991622925, -0.21793566644191742, -0.15071043372154236, -0.08348521590232849, -0.016259998083114624, 0.05096524953842163, 0.1181904673576355, 0.18541568517684937, 0.25264090299606323, 0.3198661208152771, 0.38709136843681335, 0.4543165862560272, 0.5215418338775635, 0.5887670516967773, 0.6559922695159912, 0.7232174873352051, 0.790442705154419, 0.8576679229736328, 0.9248931407928467, 0.9921183586120605, 1.0593435764312744, 1.1265687942504883, 1.1937940120697021, 1.261019229888916, 1.3282444477081299, 1.3954696655273438, 1.4626948833465576, 1.5299201011657715, 1.5971453189849854, 1.6643705368041992, 1.731595754623413, 1.798821210861206, 1.86604642868042, 1.9332716464996338, 2.0004968643188477, 2.0677220821380615, 2.1349472999572754, 2.2021725177764893, 2.269397735595703, 2.336622953414917, 2.403848171234131, 2.4710733890533447, 2.5382986068725586, 2.6055238246917725, 2.6727490425109863, 2.7399742603302, 2.807199478149414, 2.874424934387207, 2.941650152206421, 3.0088753700256348, 3.0761005878448486, 3.1433258056640625, 3.2105510234832764, 3.2777762413024902, 3.345001459121704, 3.412226676940918, 3.479451894760132, 3.5466771125793457, 3.6139023303985596, 3.6811275482177734, 3.7483527660369873, 3.815577983856201, 3.882803201675415, 3.950028419494629]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 1.0, 8.0, 10.0, 12.0, 8.0, 8.0, 9.0, 14.0, 15.0, 27.0, 33.0, 42.0, 52.0, 51.0, 66.0, 54.0, 72.0, 65.0, 71.0, 65.0, 46.0, 46.0, 40.0, 26.0, 38.0, 22.0, 18.0, 15.0, 20.0, 8.0, 4.0, 8.0, 4.0, 3.0, 3.0, 6.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4513883590698242, -0.4379616677761078, -0.42453497648239136, -0.41110825538635254, -0.3976815640926361, -0.3842548727989197, -0.37082818150520325, -0.3574014902114868, -0.343974769115448, -0.33054807782173157, -0.31712138652801514, -0.3036946654319763, -0.2902679741382599, -0.27684128284454346, -0.263414591550827, -0.2499879002571106, -0.23656120896339417, -0.22313451766967773, -0.2097078114748001, -0.19628112018108368, -0.18285441398620605, -0.16942772269248962, -0.1560010313987732, -0.14257434010505676, -0.12914763391017914, -0.11572093516588211, -0.10229423642158508, -0.08886754512786865, -0.07544084638357162, -0.0620141476392746, -0.048587456345558167, -0.03516075760126114, -0.02173405885696411, -0.008307361975312233, 0.005119334906339645, 0.018546029925346375, 0.0319727286696434, 0.04539942741394043, 0.05882611870765686, 0.07225281745195389, 0.08567951619625092, 0.09910621494054794, 0.11253291368484497, 0.1259596049785614, 0.13938629627227783, 0.15281300246715546, 0.1662396937608719, 0.1796663999557495, 0.19309309124946594, 0.20651978254318237, 0.21994648873806, 0.23337318003177643, 0.24679988622665405, 0.2602265775203705, 0.2736532688140869, 0.28707996010780334, 0.3005066514015198, 0.3139333426952362, 0.32736003398895264, 0.34078675508499146, 0.3542134463787079, 0.3676401376724243, 0.38106682896614075, 0.3944935202598572, 0.407920241355896]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 4.0, 7.0, 3.0, 5.0, 16.0, 8.0, 10.0, 21.0, 20.0, 32.0, 27.0, 32.0, 54.0, 68.0, 98.0, 127.0, 183.0, 271.0, 384.0, 625.0, 812.0, 1244.0, 1796.0, 2898.0, 4701.0, 9240.0, 24348.0, 138289.0, 3877231.0, 90253.0, 20420.0, 8250.0, 4348.0, 2699.0, 1789.0, 1113.0, 819.0, 584.0, 411.0, 331.0, 211.0, 144.0, 113.0, 72.0, 63.0, 37.0, 29.0, 20.0, 13.0, 6.0, 6.0, 2.0, 2.0, 1.0], "bins": [-0.177734375, -0.17310714721679688, -0.16847991943359375, -0.16385269165039062, -0.1592254638671875, -0.15459823608398438, -0.14997100830078125, -0.14534378051757812, -0.140716552734375, -0.13608932495117188, -0.13146209716796875, -0.12683486938476562, -0.1222076416015625, -0.11758041381835938, -0.11295318603515625, -0.10832595825195312, -0.10369873046875, -0.09907150268554688, -0.09444427490234375, -0.08981704711914062, -0.0851898193359375, -0.08056259155273438, -0.07593536376953125, -0.07130813598632812, -0.066680908203125, -0.062053680419921875, -0.05742645263671875, -0.052799224853515625, -0.0481719970703125, -0.043544769287109375, -0.03891754150390625, -0.034290313720703125, -0.0296630859375, -0.025035858154296875, -0.02040863037109375, -0.015781402587890625, -0.0111541748046875, -0.006526947021484375, -0.00189971923828125, 0.002727508544921875, 0.007354736328125, 0.011981964111328125, 0.01660919189453125, 0.021236419677734375, 0.0258636474609375, 0.030490875244140625, 0.03511810302734375, 0.039745330810546875, 0.04437255859375, 0.048999786376953125, 0.05362701416015625, 0.058254241943359375, 0.0628814697265625, 0.06750869750976562, 0.07213592529296875, 0.07676315307617188, 0.081390380859375, 0.08601760864257812, 0.09064483642578125, 0.09527206420898438, 0.0998992919921875, 0.10452651977539062, 0.10915374755859375, 0.11378097534179688, 0.118408203125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 3.0, 6.0, 12.0, 11.0, 17.0, 19.0, 13.0, 18.0, 32.0, 39.0, 66.0, 82.0, 137.0, 142.0, 121.0, 63.0, 51.0, 42.0, 15.0, 20.0, 17.0, 13.0, 19.0, 5.0, 8.0, 5.0, 6.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0], "bins": [-0.0209197998046875, -0.020386576652526855, -0.01985335350036621, -0.019320130348205566, -0.018786907196044922, -0.018253684043884277, -0.017720460891723633, -0.01718723773956299, -0.016654014587402344, -0.0161207914352417, -0.015587568283081055, -0.01505434513092041, -0.014521121978759766, -0.013987898826599121, -0.013454675674438477, -0.012921452522277832, -0.012388229370117188, -0.011855006217956543, -0.011321783065795898, -0.010788559913635254, -0.01025533676147461, -0.009722113609313965, -0.00918889045715332, -0.008655667304992676, -0.008122444152832031, -0.007589221000671387, -0.007055997848510742, -0.006522774696350098, -0.005989551544189453, -0.005456328392028809, -0.004923105239868164, -0.0043898820877075195, -0.003856658935546875, -0.0033234357833862305, -0.002790212631225586, -0.0022569894790649414, -0.0017237663269042969, -0.0011905431747436523, -0.0006573200225830078, -0.00012409687042236328, 0.00040912628173828125, 0.0009423494338989258, 0.0014755725860595703, 0.002008795738220215, 0.0025420188903808594, 0.003075242042541504, 0.0036084651947021484, 0.004141688346862793, 0.0046749114990234375, 0.005208134651184082, 0.0057413578033447266, 0.006274580955505371, 0.006807804107666016, 0.00734102725982666, 0.007874250411987305, 0.00840747356414795, 0.008940696716308594, 0.009473919868469238, 0.010007143020629883, 0.010540366172790527, 0.011073589324951172, 0.011606812477111816, 0.012140035629272461, 0.012673258781433105, 0.01320648193359375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 5.0, 12.0, 12.0, 14.0, 15.0, 40.0, 53.0, 90.0, 164.0, 324.0, 812.0, 2214.0, 6765.0, 23959.0, 154203.0, 3821972.0, 149177.0, 23828.0, 6628.0, 2308.0, 871.0, 334.0, 181.0, 85.0, 62.0, 40.0, 27.0, 20.0, 14.0, 12.0, 11.0, 5.0, 10.0, 2.0, 5.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1544189453125, -0.1493549346923828, -0.14429092407226562, -0.13922691345214844, -0.13416290283203125, -0.12909889221191406, -0.12403488159179688, -0.11897087097167969, -0.1139068603515625, -0.10884284973144531, -0.10377883911132812, -0.09871482849121094, -0.09365081787109375, -0.08858680725097656, -0.08352279663085938, -0.07845878601074219, -0.073394775390625, -0.06833076477050781, -0.06326675415039062, -0.05820274353027344, -0.05313873291015625, -0.04807472229003906, -0.043010711669921875, -0.03794670104980469, -0.0328826904296875, -0.027818679809570312, -0.022754669189453125, -0.017690658569335938, -0.01262664794921875, -0.0075626373291015625, -0.002498626708984375, 0.0025653839111328125, 0.00762939453125, 0.012693405151367188, 0.017757415771484375, 0.022821426391601562, 0.02788543701171875, 0.03294944763183594, 0.038013458251953125, 0.04307746887207031, 0.0481414794921875, 0.05320549011230469, 0.058269500732421875, 0.06333351135253906, 0.06839752197265625, 0.07346153259277344, 0.07852554321289062, 0.08358955383300781, 0.088653564453125, 0.09371757507324219, 0.09878158569335938, 0.10384559631347656, 0.10890960693359375, 0.11397361755371094, 0.11903762817382812, 0.12410163879394531, 0.1291656494140625, 0.1342296600341797, 0.13929367065429688, 0.14435768127441406, 0.14942169189453125, 0.15448570251464844, 0.15954971313476562, 0.1646137237548828, 0.169677734375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 4.0, 4.0, 3.0, 6.0, 7.0, 4.0, 9.0, 14.0, 10.0, 19.0, 33.0, 33.0, 45.0, 71.0, 105.0, 177.0, 409.0, 1784.0, 655.0, 231.0, 126.0, 98.0, 52.0, 33.0, 28.0, 24.0, 15.0, 19.0, 12.0, 7.0, 8.0, 4.0, 8.0, 2.0, 0.0, 3.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0160675048828125, -0.015443563461303711, -0.014819622039794922, -0.014195680618286133, -0.013571739196777344, -0.012947797775268555, -0.012323856353759766, -0.011699914932250977, -0.011075973510742188, -0.010452032089233398, -0.00982809066772461, -0.00920414924621582, -0.008580207824707031, -0.007956266403198242, -0.007332324981689453, -0.006708383560180664, -0.006084442138671875, -0.005460500717163086, -0.004836559295654297, -0.004212617874145508, -0.0035886764526367188, -0.0029647350311279297, -0.0023407936096191406, -0.0017168521881103516, -0.0010929107666015625, -0.00046896934509277344, 0.00015497207641601562, 0.0007789134979248047, 0.0014028549194335938, 0.002026796340942383, 0.002650737762451172, 0.003274679183959961, 0.00389862060546875, 0.004522562026977539, 0.005146503448486328, 0.005770444869995117, 0.006394386291503906, 0.007018327713012695, 0.007642269134521484, 0.008266210556030273, 0.008890151977539062, 0.009514093399047852, 0.01013803482055664, 0.01076197624206543, 0.011385917663574219, 0.012009859085083008, 0.012633800506591797, 0.013257741928100586, 0.013881683349609375, 0.014505624771118164, 0.015129566192626953, 0.015753507614135742, 0.01637744903564453, 0.01700139045715332, 0.01762533187866211, 0.0182492733001709, 0.018873214721679688, 0.019497156143188477, 0.020121097564697266, 0.020745038986206055, 0.021368980407714844, 0.021992921829223633, 0.022616863250732422, 0.02324080467224121, 0.02386474609375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 10.0, 34.0, 172.0, 427.0, 293.0, 55.0, 15.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16836299002170563, -0.1582910716533661, -0.14821913838386536, -0.13814722001552582, -0.12807530164718628, -0.11800337582826614, -0.10793145000934601, -0.09785953164100647, -0.08778760582208633, -0.0777156800031662, -0.06764376163482666, -0.057571835815906525, -0.04749991372227669, -0.03742799162864685, -0.027356065809726715, -0.017284147441387177, -0.007212221622467041, 0.0028597014024853706, 0.012931624427437782, 0.02300354838371277, 0.033075470477342606, 0.04314739257097244, 0.05321931838989258, 0.06329123675823212, 0.07336316257715225, 0.08343508839607239, 0.09350700676441193, 0.10357893258333206, 0.1136508584022522, 0.12372277677059174, 0.13379469513893127, 0.143866628408432, 0.15393856167793274, 0.16401048004627228, 0.174082413315773, 0.18415433168411255, 0.1942262500524521, 0.20429816842079163, 0.21437010169029236, 0.2244420200586319, 0.23451393842697144, 0.24458585679531097, 0.2546577751636505, 0.26472970843315125, 0.274801641702652, 0.2848735451698303, 0.29494547843933105, 0.3050174117088318, 0.3150893449783325, 0.32516127824783325, 0.3352331817150116, 0.34530511498451233, 0.35537704825401306, 0.3654489517211914, 0.37552088499069214, 0.38559281826019287, 0.3956647217273712, 0.40573665499687195, 0.4158085584640503, 0.425880491733551, 0.43595242500305176, 0.4460243284702301, 0.45609626173973083, 0.4661681652069092, 0.4762400984764099]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 4.0, 3.0, 7.0, 7.0, 13.0, 18.0, 21.0, 22.0, 31.0, 39.0, 51.0, 63.0, 65.0, 58.0, 73.0, 63.0, 56.0, 56.0, 49.0, 64.0, 50.0, 46.0, 32.0, 34.0, 20.0, 18.0, 14.0, 7.0, 7.0, 6.0, 7.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09539002180099487, -0.0922093614935875, -0.08902870118618011, -0.08584803342819214, -0.08266737312078476, -0.07948671281337738, -0.0763060450553894, -0.07312538474798203, -0.06994472444057465, -0.06676406413316727, -0.06358340382575989, -0.06040273606777191, -0.05722207576036453, -0.05404141545295715, -0.050860751420259476, -0.0476800873875618, -0.04449942708015442, -0.04131876677274704, -0.03813810274004936, -0.034957438707351685, -0.031776778399944305, -0.028596116229891777, -0.02541545405983925, -0.02223479188978672, -0.019054129719734192, -0.015873467549681664, -0.012692805379629135, -0.009512143209576607, -0.006331481039524078, -0.00315081886947155, 2.9843300580978394e-05, 0.0032105054706335068, 0.006391167640686035, 0.009571829810738564, 0.012752491980791092, 0.01593315415084362, 0.01911381632089615, 0.022294478490948677, 0.025475140661001205, 0.028655802831053734, 0.03183646500110626, 0.03501712530851364, 0.03819778934121132, 0.041378453373909, 0.044559113681316376, 0.047739773988723755, 0.05092043802142143, 0.05410110205411911, 0.05728176236152649, 0.06046242266893387, 0.06364308297634125, 0.06682375073432922, 0.0700044110417366, 0.07318507134914398, 0.07636573910713196, 0.07954639941453934, 0.08272705972194672, 0.0859077200293541, 0.08908838033676147, 0.09226904809474945, 0.09544970840215683, 0.09863036870956421, 0.10181103646755219, 0.10499169677495956, 0.10817235708236694]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 10.0, 7.0, 14.0, 10.0, 24.0, 31.0, 44.0, 100.0, 136.0, 260.0, 431.0, 825.0, 1566.0, 3212.0, 7147.0, 16761.0, 49290.0, 237241.0, 586675.0, 96747.0, 27796.0, 10757.0, 4669.0, 2228.0, 1197.0, 585.0, 298.0, 184.0, 101.0, 78.0, 46.0, 22.0, 23.0, 18.0, 10.0, 4.0, 7.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1180419921875, -0.11413955688476562, -0.11023712158203125, -0.10633468627929688, -0.1024322509765625, -0.09852981567382812, -0.09462738037109375, -0.09072494506835938, -0.086822509765625, -0.08292007446289062, -0.07901763916015625, -0.07511520385742188, -0.0712127685546875, -0.06731033325195312, -0.06340789794921875, -0.059505462646484375, -0.05560302734375, -0.051700592041015625, -0.04779815673828125, -0.043895721435546875, -0.0399932861328125, -0.036090850830078125, -0.03218841552734375, -0.028285980224609375, -0.024383544921875, -0.020481109619140625, -0.01657867431640625, -0.012676239013671875, -0.0087738037109375, -0.004871368408203125, -0.00096893310546875, 0.002933502197265625, 0.0068359375, 0.010738372802734375, 0.01464080810546875, 0.018543243408203125, 0.0224456787109375, 0.026348114013671875, 0.03025054931640625, 0.034152984619140625, 0.038055419921875, 0.041957855224609375, 0.04586029052734375, 0.049762725830078125, 0.0536651611328125, 0.057567596435546875, 0.06147003173828125, 0.06537246704101562, 0.06927490234375, 0.07317733764648438, 0.07707977294921875, 0.08098220825195312, 0.0848846435546875, 0.08878707885742188, 0.09268951416015625, 0.09659194946289062, 0.100494384765625, 0.10439682006835938, 0.10829925537109375, 0.11220169067382812, 0.1161041259765625, 0.12000656127929688, 0.12390899658203125, 0.12781143188476562, 0.1317138671875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 3.0, 0.0, 10.0, 9.0, 3.0, 13.0, 14.0, 20.0, 15.0, 27.0, 23.0, 50.0, 71.0, 94.0, 134.0, 139.0, 105.0, 61.0, 55.0, 35.0, 25.0, 17.0, 16.0, 15.0, 9.0, 8.0, 5.0, 1.0, 7.0, 6.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 1.0], "bins": [-0.020599365234375, -0.02008509635925293, -0.01957082748413086, -0.01905655860900879, -0.01854228973388672, -0.01802802085876465, -0.017513751983642578, -0.016999483108520508, -0.016485214233398438, -0.015970945358276367, -0.015456676483154297, -0.014942407608032227, -0.014428138732910156, -0.013913869857788086, -0.013399600982666016, -0.012885332107543945, -0.012371063232421875, -0.011856794357299805, -0.011342525482177734, -0.010828256607055664, -0.010313987731933594, -0.009799718856811523, -0.009285449981689453, -0.008771181106567383, -0.008256912231445312, -0.007742643356323242, -0.007228374481201172, -0.0067141056060791016, -0.006199836730957031, -0.005685567855834961, -0.005171298980712891, -0.00465703010559082, -0.00414276123046875, -0.0036284923553466797, -0.0031142234802246094, -0.002599954605102539, -0.0020856857299804688, -0.0015714168548583984, -0.0010571479797363281, -0.0005428791046142578, -2.86102294921875e-05, 0.0004856586456298828, 0.0009999275207519531, 0.0015141963958740234, 0.0020284652709960938, 0.002542734146118164, 0.0030570030212402344, 0.0035712718963623047, 0.004085540771484375, 0.004599809646606445, 0.005114078521728516, 0.005628347396850586, 0.006142616271972656, 0.0066568851470947266, 0.007171154022216797, 0.007685422897338867, 0.008199691772460938, 0.008713960647583008, 0.009228229522705078, 0.009742498397827148, 0.010256767272949219, 0.010771036148071289, 0.01128530502319336, 0.01179957389831543, 0.0123138427734375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 4.0, 5.0, 9.0, 8.0, 14.0, 16.0, 27.0, 32.0, 40.0, 62.0, 93.0, 131.0, 194.0, 302.0, 507.0, 1090.0, 2809.0, 10933.0, 65724.0, 488951.0, 411494.0, 52188.0, 9158.0, 2410.0, 992.0, 501.0, 289.0, 177.0, 118.0, 82.0, 54.0, 36.0, 31.0, 23.0, 16.0, 6.0, 8.0, 6.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.15234375, -0.1478557586669922, -0.14336776733398438, -0.13887977600097656, -0.13439178466796875, -0.12990379333496094, -0.12541580200195312, -0.12092781066894531, -0.1164398193359375, -0.11195182800292969, -0.10746383666992188, -0.10297584533691406, -0.09848785400390625, -0.09399986267089844, -0.08951187133789062, -0.08502388000488281, -0.080535888671875, -0.07604789733886719, -0.07155990600585938, -0.06707191467285156, -0.06258392333984375, -0.05809593200683594, -0.053607940673828125, -0.04911994934082031, -0.0446319580078125, -0.04014396667480469, -0.035655975341796875, -0.031167984008789062, -0.02667999267578125, -0.022192001342773438, -0.017704010009765625, -0.013216018676757812, -0.00872802734375, -0.0042400360107421875, 0.000247955322265625, 0.0047359466552734375, 0.00922393798828125, 0.013711929321289062, 0.018199920654296875, 0.022687911987304688, 0.0271759033203125, 0.03166389465332031, 0.036151885986328125, 0.04063987731933594, 0.04512786865234375, 0.04961585998535156, 0.054103851318359375, 0.05859184265136719, 0.063079833984375, 0.06756782531738281, 0.07205581665039062, 0.07654380798339844, 0.08103179931640625, 0.08551979064941406, 0.09000778198242188, 0.09449577331542969, 0.0989837646484375, 0.10347175598144531, 0.10795974731445312, 0.11244773864746094, 0.11693572998046875, 0.12142372131347656, 0.12591171264648438, 0.1303997039794922, 0.1348876953125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 3.0, 6.0, 5.0, 11.0, 8.0, 22.0, 19.0, 14.0, 20.0, 23.0, 23.0, 30.0, 24.0, 36.0, 33.0, 32.0, 49.0, 42.0, 52.0, 54.0, 46.0, 46.0, 51.0, 42.0, 37.0, 40.0, 38.0, 28.0, 23.0, 20.0, 30.0, 13.0, 15.0, 16.0, 13.0, 11.0, 8.0, 2.0, 6.0, 3.0, 4.0, 1.0, 4.0, 2.0, 0.0, 2.0, 3.0], "bins": [-0.07135009765625, -0.06942319869995117, -0.06749629974365234, -0.06556940078735352, -0.06364250183105469, -0.06171560287475586, -0.05978870391845703, -0.0578618049621582, -0.055934906005859375, -0.05400800704956055, -0.05208110809326172, -0.05015420913696289, -0.04822731018066406, -0.046300411224365234, -0.044373512268066406, -0.04244661331176758, -0.04051971435546875, -0.03859281539916992, -0.036665916442871094, -0.034739017486572266, -0.03281211853027344, -0.03088521957397461, -0.02895832061767578, -0.027031421661376953, -0.025104522705078125, -0.023177623748779297, -0.02125072479248047, -0.01932382583618164, -0.017396926879882812, -0.015470027923583984, -0.013543128967285156, -0.011616230010986328, -0.0096893310546875, -0.007762432098388672, -0.005835533142089844, -0.003908634185791016, -0.0019817352294921875, -5.4836273193359375e-05, 0.0018720626831054688, 0.003798961639404297, 0.005725860595703125, 0.007652759552001953, 0.009579658508300781, 0.01150655746459961, 0.013433456420898438, 0.015360355377197266, 0.017287254333496094, 0.019214153289794922, 0.02114105224609375, 0.023067951202392578, 0.024994850158691406, 0.026921749114990234, 0.028848648071289062, 0.03077554702758789, 0.03270244598388672, 0.03462934494018555, 0.036556243896484375, 0.0384831428527832, 0.04041004180908203, 0.04233694076538086, 0.04426383972167969, 0.046190738677978516, 0.048117637634277344, 0.05004453659057617, 0.051971435546875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 7.0, 7.0, 11.0, 16.0, 17.0, 47.0, 58.0, 105.0, 189.0, 293.0, 572.0, 1078.0, 2560.0, 6471.0, 19806.0, 83520.0, 416245.0, 405727.0, 81352.0, 19358.0, 6170.0, 2419.0, 1159.0, 622.0, 289.0, 172.0, 103.0, 67.0, 40.0, 34.0, 16.0, 13.0, 7.0, 3.0, 5.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.053375244140625, -0.05165290832519531, -0.049930572509765625, -0.04820823669433594, -0.04648590087890625, -0.04476356506347656, -0.043041229248046875, -0.04131889343261719, -0.0395965576171875, -0.03787422180175781, -0.036151885986328125, -0.03442955017089844, -0.03270721435546875, -0.030984878540039062, -0.029262542724609375, -0.027540206909179688, -0.02581787109375, -0.024095535278320312, -0.022373199462890625, -0.020650863647460938, -0.01892852783203125, -0.017206192016601562, -0.015483856201171875, -0.013761520385742188, -0.0120391845703125, -0.010316848754882812, -0.008594512939453125, -0.0068721771240234375, -0.00514984130859375, -0.0034275054931640625, -0.001705169677734375, 1.71661376953125e-05, 0.001739501953125, 0.0034618377685546875, 0.005184173583984375, 0.0069065093994140625, 0.00862884521484375, 0.010351181030273438, 0.012073516845703125, 0.013795852661132812, 0.0155181884765625, 0.017240524291992188, 0.018962860107421875, 0.020685195922851562, 0.02240753173828125, 0.024129867553710938, 0.025852203369140625, 0.027574539184570312, 0.029296875, 0.031019210815429688, 0.032741546630859375, 0.03446388244628906, 0.03618621826171875, 0.03790855407714844, 0.039630889892578125, 0.04135322570800781, 0.0430755615234375, 0.04479789733886719, 0.046520233154296875, 0.04824256896972656, 0.04996490478515625, 0.05168724060058594, 0.053409576416015625, 0.05513191223144531, 0.056854248046875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 1.0, 8.0, 11.0, 6.0, 8.0, 14.0, 14.0, 21.0, 33.0, 31.0, 31.0, 58.0, 51.0, 67.0, 83.0, 92.0, 70.0, 63.0, 61.0, 59.0, 43.0, 31.0, 22.0, 21.0, 29.0, 10.0, 16.0, 13.0, 10.0, 5.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.695487976074219e-05, -3.566499799489975e-05, -3.437511622905731e-05, -3.3085234463214874e-05, -3.1795352697372437e-05, -3.050547093153e-05, -2.921558916568756e-05, -2.7925707399845123e-05, -2.6635825634002686e-05, -2.5345943868160248e-05, -2.405606210231781e-05, -2.2766180336475372e-05, -2.1476298570632935e-05, -2.0186416804790497e-05, -1.889653503894806e-05, -1.760665327310562e-05, -1.6316771507263184e-05, -1.5026889741420746e-05, -1.3737007975578308e-05, -1.244712620973587e-05, -1.1157244443893433e-05, -9.867362678050995e-06, -8.577480912208557e-06, -7.287599146366119e-06, -5.997717380523682e-06, -4.707835614681244e-06, -3.417953848838806e-06, -2.1280720829963684e-06, -8.381903171539307e-07, 4.516914486885071e-07, 1.7415732145309448e-06, 3.0314549803733826e-06, 4.32133674621582e-06, 5.611218512058258e-06, 6.901100277900696e-06, 8.190982043743134e-06, 9.480863809585571e-06, 1.0770745575428009e-05, 1.2060627341270447e-05, 1.3350509107112885e-05, 1.4640390872955322e-05, 1.593027263879776e-05, 1.7220154404640198e-05, 1.8510036170482635e-05, 1.9799917936325073e-05, 2.108979970216751e-05, 2.237968146800995e-05, 2.3669563233852386e-05, 2.4959444999694824e-05, 2.6249326765537262e-05, 2.75392085313797e-05, 2.8829090297222137e-05, 3.0118972063064575e-05, 3.140885382890701e-05, 3.269873559474945e-05, 3.398861736059189e-05, 3.5278499126434326e-05, 3.6568380892276764e-05, 3.78582626581192e-05, 3.914814442396164e-05, 4.043802618980408e-05, 4.1727907955646515e-05, 4.301778972148895e-05, 4.430767148733139e-05, 4.559755325317383e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 6.0, 10.0, 9.0, 5.0, 11.0, 7.0, 16.0, 15.0, 27.0, 40.0, 42.0, 63.0, 104.0, 171.0, 309.0, 561.0, 1307.0, 3230.0, 10499.0, 53923.0, 452268.0, 454746.0, 54635.0, 10617.0, 3308.0, 1267.0, 543.0, 276.0, 169.0, 103.0, 60.0, 66.0, 28.0, 29.0, 28.0, 14.0, 12.0, 9.0, 3.0, 7.0, 4.0, 0.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.07867431640625, -0.07648897171020508, -0.07430362701416016, -0.07211828231811523, -0.06993293762207031, -0.06774759292602539, -0.06556224822998047, -0.06337690353393555, -0.061191558837890625, -0.0590062141418457, -0.05682086944580078, -0.05463552474975586, -0.05245018005371094, -0.050264835357666016, -0.048079490661621094, -0.04589414596557617, -0.04370880126953125, -0.04152345657348633, -0.039338111877441406, -0.037152767181396484, -0.03496742248535156, -0.03278207778930664, -0.03059673309326172, -0.028411388397216797, -0.026226043701171875, -0.024040699005126953, -0.02185535430908203, -0.01967000961303711, -0.017484664916992188, -0.015299320220947266, -0.013113975524902344, -0.010928630828857422, -0.0087432861328125, -0.006557941436767578, -0.004372596740722656, -0.0021872520446777344, -1.9073486328125e-06, 0.0021834373474121094, 0.004368782043457031, 0.006554126739501953, 0.008739471435546875, 0.010924816131591797, 0.013110160827636719, 0.01529550552368164, 0.017480850219726562, 0.019666194915771484, 0.021851539611816406, 0.024036884307861328, 0.02622222900390625, 0.028407573699951172, 0.030592918395996094, 0.032778263092041016, 0.03496360778808594, 0.03714895248413086, 0.03933429718017578, 0.0415196418762207, 0.043704986572265625, 0.04589033126831055, 0.04807567596435547, 0.05026102066040039, 0.05244636535644531, 0.054631710052490234, 0.056817054748535156, 0.05900239944458008, 0.061187744140625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 4.0, 4.0, 3.0, 9.0, 11.0, 10.0, 17.0, 23.0, 16.0, 29.0, 31.0, 44.0, 55.0, 60.0, 52.0, 79.0, 77.0, 69.0, 67.0, 62.0, 42.0, 44.0, 40.0, 31.0, 22.0, 20.0, 18.0, 12.0, 8.0, 12.0, 7.0, 6.0, 5.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03155517578125, -0.030637025833129883, -0.029718875885009766, -0.02880072593688965, -0.02788257598876953, -0.026964426040649414, -0.026046276092529297, -0.02512812614440918, -0.024209976196289062, -0.023291826248168945, -0.022373676300048828, -0.02145552635192871, -0.020537376403808594, -0.019619226455688477, -0.01870107650756836, -0.017782926559448242, -0.016864776611328125, -0.015946626663208008, -0.01502847671508789, -0.014110326766967773, -0.013192176818847656, -0.012274026870727539, -0.011355876922607422, -0.010437726974487305, -0.009519577026367188, -0.00860142707824707, -0.007683277130126953, -0.006765127182006836, -0.005846977233886719, -0.0049288272857666016, -0.004010677337646484, -0.003092527389526367, -0.00217437744140625, -0.0012562274932861328, -0.0003380775451660156, 0.0005800724029541016, 0.0014982223510742188, 0.002416372299194336, 0.003334522247314453, 0.00425267219543457, 0.0051708221435546875, 0.006088972091674805, 0.007007122039794922, 0.007925271987915039, 0.008843421936035156, 0.009761571884155273, 0.01067972183227539, 0.011597871780395508, 0.012516021728515625, 0.013434171676635742, 0.01435232162475586, 0.015270471572875977, 0.016188621520996094, 0.01710677146911621, 0.018024921417236328, 0.018943071365356445, 0.019861221313476562, 0.02077937126159668, 0.021697521209716797, 0.022615671157836914, 0.02353382110595703, 0.02445197105407715, 0.025370121002197266, 0.026288270950317383, 0.0272064208984375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 5.0, 4.0, 13.0, 30.0, 63.0, 119.0, 228.0, 246.0, 147.0, 82.0, 33.0, 17.0, 12.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0117350816726685, -0.9838110208511353, -0.955886960029602, -0.9279628396034241, -0.9000387787818909, -0.8721147179603577, -0.8441905975341797, -0.8162665367126465, -0.7883424758911133, -0.7604184150695801, -0.7324943542480469, -0.7045702338218689, -0.6766461730003357, -0.6487221121788025, -0.6207979917526245, -0.5928739309310913, -0.5649498701095581, -0.5370258092880249, -0.5091017484664917, -0.4811776280403137, -0.4532535672187805, -0.4253295063972473, -0.3974054157733917, -0.36948132514953613, -0.34155726432800293, -0.3136332035064697, -0.28570911288261414, -0.25778502225875854, -0.22986096143722534, -0.20193688571453094, -0.17401280999183655, -0.14608873426914215, -0.11816471815109253, -0.09024064242839813, -0.062316566705703735, -0.03439249098300934, -0.006468415260314941, 0.021455660462379456, 0.04937973618507385, 0.07730381190776825, 0.10522788763046265, 0.13315196335315704, 0.16107603907585144, 0.18900011479854584, 0.21692419052124023, 0.24484826624393463, 0.27277234196662903, 0.3006964325904846, 0.3286204934120178, 0.356544554233551, 0.3844686448574066, 0.4123927354812622, 0.4403167963027954, 0.4682408571243286, 0.4961649477481842, 0.5240890383720398, 0.552013099193573, 0.5799371600151062, 0.6078612804412842, 0.6357853412628174, 0.6637094020843506, 0.6916334629058838, 0.719557523727417, 0.747481644153595, 0.7754057049751282]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 7.0, 5.0, 8.0, 7.0, 16.0, 11.0, 25.0, 28.0, 32.0, 33.0, 36.0, 53.0, 48.0, 46.0, 57.0, 59.0, 67.0, 60.0, 60.0, 48.0, 53.0, 39.0, 41.0, 36.0, 24.0, 23.0, 24.0, 16.0, 11.0, 13.0, 9.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5634295344352722, -0.5459505319595337, -0.5284714698791504, -0.5109924674034119, -0.49351343512535095, -0.47603440284729004, -0.4585554003715515, -0.4410763680934906, -0.4235973358154297, -0.4061183035373688, -0.38863930106163025, -0.37116026878356934, -0.3536812365055084, -0.3362022042274475, -0.318723201751709, -0.30124416947364807, -0.28376516699790955, -0.26628613471984863, -0.2488071173429489, -0.2313280999660492, -0.21384906768798828, -0.19637005031108856, -0.17889103293418884, -0.16141200065612793, -0.1439329832792282, -0.1264539659023285, -0.10897493362426758, -0.09149591624736786, -0.07401689141988754, -0.05653786659240723, -0.03905884921550751, -0.02157982438802719, -0.004100799560546875, 0.013378223404288292, 0.03085724636912346, 0.04833626747131348, 0.06581529229879379, 0.08329431712627411, 0.10077333450317383, 0.11825235933065414, 0.13573138415813446, 0.15321040153503418, 0.1706894338130951, 0.1881684511899948, 0.20564746856689453, 0.22312650084495544, 0.24060551822185516, 0.2580845355987549, 0.2755635678768158, 0.2930426001548767, 0.31052160263061523, 0.32800063490867615, 0.34547966718673706, 0.3629586696624756, 0.3804377019405365, 0.3979167342185974, 0.41539573669433594, 0.43287476897239685, 0.4503537714481354, 0.4678328037261963, 0.4853118360042572, 0.5027908682823181, 0.5202698707580566, 0.5377488732337952, 0.5552279353141785]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 8.0, 10.0, 10.0, 16.0, 30.0, 28.0, 46.0, 87.0, 173.0, 345.0, 730.0, 2176.0, 9538.0, 133125.0, 4005801.0, 34736.0, 4867.0, 1424.0, 525.0, 241.0, 145.0, 75.0, 45.0, 27.0, 25.0, 7.0, 5.0, 11.0, 6.0, 1.0, 1.0, 4.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.417236328125, -0.406341552734375, -0.39544677734375, -0.384552001953125, -0.3736572265625, -0.362762451171875, -0.35186767578125, -0.340972900390625, -0.330078125, -0.319183349609375, -0.30828857421875, -0.297393798828125, -0.2864990234375, -0.275604248046875, -0.26470947265625, -0.253814697265625, -0.242919921875, -0.232025146484375, -0.22113037109375, -0.210235595703125, -0.1993408203125, -0.188446044921875, -0.17755126953125, -0.166656494140625, -0.15576171875, -0.144866943359375, -0.13397216796875, -0.123077392578125, -0.1121826171875, -0.101287841796875, -0.09039306640625, -0.079498291015625, -0.068603515625, -0.057708740234375, -0.04681396484375, -0.035919189453125, -0.0250244140625, -0.014129638671875, -0.00323486328125, 0.007659912109375, 0.0185546875, 0.029449462890625, 0.04034423828125, 0.051239013671875, 0.0621337890625, 0.073028564453125, 0.08392333984375, 0.094818115234375, 0.105712890625, 0.116607666015625, 0.12750244140625, 0.138397216796875, 0.1492919921875, 0.160186767578125, 0.17108154296875, 0.181976318359375, 0.19287109375, 0.203765869140625, 0.21466064453125, 0.225555419921875, 0.2364501953125, 0.247344970703125, 0.25823974609375, 0.269134521484375, 0.280029296875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 4.0, 5.0, 11.0, 7.0, 9.0, 21.0, 16.0, 21.0, 36.0, 32.0, 51.0, 60.0, 96.0, 77.0, 113.0, 91.0, 76.0, 75.0, 49.0, 25.0, 21.0, 22.0, 18.0, 18.0, 9.0, 3.0, 7.0, 5.0, 7.0, 3.0, 1.0, 0.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.0220184326171875, -0.021444082260131836, -0.020869731903076172, -0.020295381546020508, -0.019721031188964844, -0.01914668083190918, -0.018572330474853516, -0.01799798011779785, -0.017423629760742188, -0.016849279403686523, -0.01627492904663086, -0.015700578689575195, -0.015126228332519531, -0.014551877975463867, -0.013977527618408203, -0.013403177261352539, -0.012828826904296875, -0.012254476547241211, -0.011680126190185547, -0.011105775833129883, -0.010531425476074219, -0.009957075119018555, -0.00938272476196289, -0.008808374404907227, -0.008234024047851562, -0.0076596736907958984, -0.007085323333740234, -0.00651097297668457, -0.005936622619628906, -0.005362272262573242, -0.004787921905517578, -0.004213571548461914, -0.00363922119140625, -0.003064870834350586, -0.002490520477294922, -0.0019161701202392578, -0.0013418197631835938, -0.0007674694061279297, -0.00019311904907226562, 0.00038123130798339844, 0.0009555816650390625, 0.0015299320220947266, 0.0021042823791503906, 0.0026786327362060547, 0.0032529830932617188, 0.003827333450317383, 0.004401683807373047, 0.004976034164428711, 0.005550384521484375, 0.006124734878540039, 0.006699085235595703, 0.007273435592651367, 0.007847785949707031, 0.008422136306762695, 0.00899648666381836, 0.009570837020874023, 0.010145187377929688, 0.010719537734985352, 0.011293888092041016, 0.01186823844909668, 0.012442588806152344, 0.013016939163208008, 0.013591289520263672, 0.014165639877319336, 0.014739990234375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 6.0, 9.0, 15.0, 25.0, 34.0, 45.0, 122.0, 268.0, 700.0, 2117.0, 8458.0, 50179.0, 3128000.0, 955022.0, 39467.0, 7076.0, 1798.0, 491.0, 221.0, 96.0, 65.0, 32.0, 15.0, 7.0, 6.0, 8.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.280029296875, -0.27301788330078125, -0.2660064697265625, -0.25899505615234375, -0.251983642578125, -0.24497222900390625, -0.2379608154296875, -0.23094940185546875, -0.22393798828125, -0.21692657470703125, -0.2099151611328125, -0.20290374755859375, -0.195892333984375, -0.18888092041015625, -0.1818695068359375, -0.17485809326171875, -0.1678466796875, -0.16083526611328125, -0.1538238525390625, -0.14681243896484375, -0.139801025390625, -0.13278961181640625, -0.1257781982421875, -0.11876678466796875, -0.11175537109375, -0.10474395751953125, -0.0977325439453125, -0.09072113037109375, -0.083709716796875, -0.07669830322265625, -0.0696868896484375, -0.06267547607421875, -0.0556640625, -0.04865264892578125, -0.0416412353515625, -0.03462982177734375, -0.027618408203125, -0.02060699462890625, -0.0135955810546875, -0.00658416748046875, 0.00042724609375, 0.00743865966796875, 0.0144500732421875, 0.02146148681640625, 0.028472900390625, 0.03548431396484375, 0.0424957275390625, 0.04950714111328125, 0.0565185546875, 0.06352996826171875, 0.0705413818359375, 0.07755279541015625, 0.084564208984375, 0.09157562255859375, 0.0985870361328125, 0.10559844970703125, 0.11260986328125, 0.11962127685546875, 0.1266326904296875, 0.13364410400390625, 0.140655517578125, 0.14766693115234375, 0.1546783447265625, 0.16168975830078125, 0.168701171875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 3.0, 2.0, 3.0, 8.0, 11.0, 14.0, 9.0, 17.0, 20.0, 26.0, 41.0, 59.0, 81.0, 122.0, 261.0, 479.0, 1800.0, 469.0, 207.0, 126.0, 82.0, 67.0, 40.0, 22.0, 19.0, 22.0, 8.0, 16.0, 9.0, 5.0, 9.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.025177001953125, -0.02429342269897461, -0.02340984344482422, -0.022526264190673828, -0.021642684936523438, -0.020759105682373047, -0.019875526428222656, -0.018991947174072266, -0.018108367919921875, -0.017224788665771484, -0.016341209411621094, -0.015457630157470703, -0.014574050903320312, -0.013690471649169922, -0.012806892395019531, -0.01192331314086914, -0.01103973388671875, -0.01015615463256836, -0.009272575378417969, -0.008388996124267578, -0.0075054168701171875, -0.006621837615966797, -0.005738258361816406, -0.004854679107666016, -0.003971099853515625, -0.0030875205993652344, -0.0022039413452148438, -0.0013203620910644531, -0.0004367828369140625, 0.0004467964172363281, 0.0013303756713867188, 0.0022139549255371094, 0.0030975341796875, 0.003981113433837891, 0.004864692687988281, 0.005748271942138672, 0.0066318511962890625, 0.007515430450439453, 0.008399009704589844, 0.009282588958740234, 0.010166168212890625, 0.011049747467041016, 0.011933326721191406, 0.012816905975341797, 0.013700485229492188, 0.014584064483642578, 0.015467643737792969, 0.01635122299194336, 0.01723480224609375, 0.01811838150024414, 0.01900196075439453, 0.019885540008544922, 0.020769119262695312, 0.021652698516845703, 0.022536277770996094, 0.023419857025146484, 0.024303436279296875, 0.025187015533447266, 0.026070594787597656, 0.026954174041748047, 0.027837753295898438, 0.028721332550048828, 0.02960491180419922, 0.03048849105834961, 0.0313720703125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 8.0, 20.0, 44.0, 81.0, 179.0, 270.0, 203.0, 108.0, 49.0, 22.0, 13.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3423707187175751, -0.3335146903991699, -0.3246586322784424, -0.31580260396003723, -0.3069465756416321, -0.29809054732322693, -0.2892345190048218, -0.28037846088409424, -0.2715224325656891, -0.26266640424728394, -0.2538103461265564, -0.24495431780815125, -0.2360982894897461, -0.22724226117134094, -0.2183862179517746, -0.20953017473220825, -0.2006741464138031, -0.19181811809539795, -0.1829620748758316, -0.17410603165626526, -0.1652500033378601, -0.15639397501945496, -0.1475379317998886, -0.13868188858032227, -0.12982586026191711, -0.12096982449293137, -0.11211378872394562, -0.10325775295495987, -0.09440171718597412, -0.08554568141698837, -0.07668964564800262, -0.06783360987901688, -0.05897757411003113, -0.05012153834104538, -0.04126550257205963, -0.03240946680307388, -0.023553431034088135, -0.014697395265102386, -0.005841359496116638, 0.00301467627286911, 0.011870712041854858, 0.020726747810840607, 0.029582783579826355, 0.0384388193488121, 0.04729485511779785, 0.0561508908867836, 0.06500692665576935, 0.0738629624247551, 0.08271899819374084, 0.09157503396272659, 0.10043106973171234, 0.10928710550069809, 0.11814314126968384, 0.126999169588089, 0.13585521280765533, 0.14471125602722168, 0.15356728434562683, 0.16242331266403198, 0.17127935588359833, 0.18013539910316467, 0.18899142742156982, 0.19784745573997498, 0.20670349895954132, 0.21555954217910767, 0.22441557049751282]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 4.0, 2.0, 9.0, 5.0, 11.0, 11.0, 15.0, 16.0, 22.0, 25.0, 26.0, 34.0, 37.0, 51.0, 33.0, 56.0, 53.0, 44.0, 53.0, 57.0, 44.0, 47.0, 43.0, 45.0, 36.0, 36.0, 30.0, 37.0, 21.0, 26.0, 17.0, 14.0, 14.0, 11.0, 7.0, 7.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11070460081100464, -0.10726530849933624, -0.10382600873708725, -0.10038671642541885, -0.09694741666316986, -0.09350812435150146, -0.09006883203983307, -0.08662953972816467, -0.08319023996591568, -0.07975094765424728, -0.07631164789199829, -0.0728723555803299, -0.0694330632686615, -0.0659937635064125, -0.06255447119474411, -0.059115175157785416, -0.05567587912082672, -0.05223658308386803, -0.04879728704690933, -0.045357994735240936, -0.04191869869828224, -0.03847940266132355, -0.03504011034965515, -0.03160081431269646, -0.028161518275737762, -0.024722222238779068, -0.021282928064465523, -0.017843633890151978, -0.014404337853193283, -0.010965041816234589, -0.007525747641921043, -0.004086453467607498, -0.0006471574306488037, 0.002792137674987316, 0.006231432780623436, 0.009670727886259556, 0.013110022991895676, 0.01654931902885437, 0.019988613203167915, 0.02342790737748146, 0.026867203414440155, 0.03030649945139885, 0.033745795488357544, 0.03718508780002594, 0.040624383836984634, 0.04406367987394333, 0.047502972185611725, 0.05094226822257042, 0.054381564259529114, 0.05782086029648781, 0.0612601563334465, 0.0646994486451149, 0.06813874840736389, 0.07157804071903229, 0.07501733303070068, 0.07845662534236908, 0.08189592510461807, 0.08533521741628647, 0.08877451717853546, 0.09221380949020386, 0.09565310180187225, 0.09909240156412125, 0.10253169387578964, 0.10597099363803864, 0.10941028594970703]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 7.0, 10.0, 24.0, 22.0, 21.0, 69.0, 95.0, 136.0, 228.0, 341.0, 645.0, 1177.0, 2397.0, 5065.0, 11219.0, 29827.0, 94999.0, 371507.0, 380403.0, 98179.0, 30169.0, 11645.0, 5056.0, 2413.0, 1277.0, 647.0, 366.0, 197.0, 144.0, 88.0, 59.0, 27.0, 27.0, 20.0, 17.0, 12.0, 6.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1146240234375, -0.11135005950927734, -0.10807609558105469, -0.10480213165283203, -0.10152816772460938, -0.09825420379638672, -0.09498023986816406, -0.0917062759399414, -0.08843231201171875, -0.0851583480834961, -0.08188438415527344, -0.07861042022705078, -0.07533645629882812, -0.07206249237060547, -0.06878852844238281, -0.06551456451416016, -0.0622406005859375, -0.058966636657714844, -0.05569267272949219, -0.05241870880126953, -0.049144744873046875, -0.04587078094482422, -0.04259681701660156, -0.039322853088378906, -0.03604888916015625, -0.032774925231933594, -0.029500961303710938, -0.02622699737548828, -0.022953033447265625, -0.01967906951904297, -0.016405105590820312, -0.013131141662597656, -0.009857177734375, -0.006583213806152344, -0.0033092498779296875, -3.528594970703125e-05, 0.003238677978515625, 0.006512641906738281, 0.009786605834960938, 0.013060569763183594, 0.01633453369140625, 0.019608497619628906, 0.022882461547851562, 0.02615642547607422, 0.029430389404296875, 0.03270435333251953, 0.03597831726074219, 0.039252281188964844, 0.0425262451171875, 0.045800209045410156, 0.04907417297363281, 0.05234813690185547, 0.055622100830078125, 0.05889606475830078, 0.06217002868652344, 0.0654439926147461, 0.06871795654296875, 0.0719919204711914, 0.07526588439941406, 0.07853984832763672, 0.08181381225585938, 0.08508777618408203, 0.08836174011230469, 0.09163570404052734, 0.09490966796875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 5.0, 10.0, 6.0, 15.0, 23.0, 15.0, 35.0, 44.0, 48.0, 64.0, 81.0, 84.0, 103.0, 72.0, 77.0, 70.0, 55.0, 34.0, 35.0, 22.0, 18.0, 14.0, 9.0, 11.0, 11.0, 6.0, 3.0, 3.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.021331787109375, -0.020779967308044434, -0.020228147506713867, -0.0196763277053833, -0.019124507904052734, -0.018572688102722168, -0.0180208683013916, -0.017469048500061035, -0.01691722869873047, -0.016365408897399902, -0.015813589096069336, -0.01526176929473877, -0.014709949493408203, -0.014158129692077637, -0.01360630989074707, -0.013054490089416504, -0.012502670288085938, -0.011950850486755371, -0.011399030685424805, -0.010847210884094238, -0.010295391082763672, -0.009743571281433105, -0.009191751480102539, -0.008639931678771973, -0.008088111877441406, -0.00753629207611084, -0.0069844722747802734, -0.006432652473449707, -0.005880832672119141, -0.005329012870788574, -0.004777193069458008, -0.004225373268127441, -0.003673553466796875, -0.0031217336654663086, -0.002569913864135742, -0.0020180940628051758, -0.0014662742614746094, -0.000914454460144043, -0.00036263465881347656, 0.00018918514251708984, 0.0007410049438476562, 0.0012928247451782227, 0.001844644546508789, 0.0023964643478393555, 0.002948284149169922, 0.0035001039505004883, 0.004051923751831055, 0.004603743553161621, 0.0051555633544921875, 0.005707383155822754, 0.00625920295715332, 0.006811022758483887, 0.007362842559814453, 0.00791466236114502, 0.008466482162475586, 0.009018301963806152, 0.009570121765136719, 0.010121941566467285, 0.010673761367797852, 0.011225581169128418, 0.011777400970458984, 0.01232922077178955, 0.012881040573120117, 0.013432860374450684, 0.01398468017578125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 8.0, 10.0, 12.0, 15.0, 28.0, 32.0, 56.0, 65.0, 86.0, 138.0, 197.0, 293.0, 441.0, 858.0, 1857.0, 5087.0, 16709.0, 67086.0, 313689.0, 486508.0, 115530.0, 26844.0, 7593.0, 2650.0, 1098.0, 578.0, 344.0, 220.0, 160.0, 95.0, 65.0, 58.0, 31.0, 25.0, 23.0, 19.0, 7.0, 9.0, 11.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1171875, -0.11342906951904297, -0.10967063903808594, -0.1059122085571289, -0.10215377807617188, -0.09839534759521484, -0.09463691711425781, -0.09087848663330078, -0.08712005615234375, -0.08336162567138672, -0.07960319519042969, -0.07584476470947266, -0.07208633422851562, -0.0683279037475586, -0.06456947326660156, -0.06081104278564453, -0.0570526123046875, -0.05329418182373047, -0.04953575134277344, -0.045777320861816406, -0.042018890380859375, -0.038260459899902344, -0.03450202941894531, -0.03074359893798828, -0.02698516845703125, -0.02322673797607422, -0.019468307495117188, -0.015709877014160156, -0.011951446533203125, -0.008193016052246094, -0.0044345855712890625, -0.0006761550903320312, 0.003082275390625, 0.006840705871582031, 0.010599136352539062, 0.014357566833496094, 0.018115997314453125, 0.021874427795410156, 0.025632858276367188, 0.02939128875732422, 0.03314971923828125, 0.03690814971923828, 0.04066658020019531, 0.044425010681152344, 0.048183441162109375, 0.051941871643066406, 0.05570030212402344, 0.05945873260498047, 0.0632171630859375, 0.06697559356689453, 0.07073402404785156, 0.0744924545288086, 0.07825088500976562, 0.08200931549072266, 0.08576774597167969, 0.08952617645263672, 0.09328460693359375, 0.09704303741455078, 0.10080146789550781, 0.10455989837646484, 0.10831832885742188, 0.1120767593383789, 0.11583518981933594, 0.11959362030029297, 0.12335205078125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 1.0, 3.0, 6.0, 4.0, 9.0, 3.0, 12.0, 11.0, 10.0, 20.0, 19.0, 15.0, 32.0, 33.0, 29.0, 28.0, 31.0, 35.0, 45.0, 46.0, 40.0, 48.0, 41.0, 48.0, 45.0, 38.0, 40.0, 35.0, 38.0, 44.0, 34.0, 23.0, 27.0, 12.0, 17.0, 14.0, 8.0, 13.0, 6.0, 9.0, 5.0, 10.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.072021484375, -0.06980514526367188, -0.06758880615234375, -0.06537246704101562, -0.0631561279296875, -0.060939788818359375, -0.05872344970703125, -0.056507110595703125, -0.054290771484375, -0.052074432373046875, -0.04985809326171875, -0.047641754150390625, -0.0454254150390625, -0.043209075927734375, -0.04099273681640625, -0.038776397705078125, -0.03656005859375, -0.034343719482421875, -0.03212738037109375, -0.029911041259765625, -0.0276947021484375, -0.025478363037109375, -0.02326202392578125, -0.021045684814453125, -0.018829345703125, -0.016613006591796875, -0.01439666748046875, -0.012180328369140625, -0.0099639892578125, -0.007747650146484375, -0.00553131103515625, -0.003314971923828125, -0.0010986328125, 0.001117706298828125, 0.00333404541015625, 0.005550384521484375, 0.0077667236328125, 0.009983062744140625, 0.01219940185546875, 0.014415740966796875, 0.016632080078125, 0.018848419189453125, 0.02106475830078125, 0.023281097412109375, 0.0254974365234375, 0.027713775634765625, 0.02993011474609375, 0.032146453857421875, 0.03436279296875, 0.036579132080078125, 0.03879547119140625, 0.041011810302734375, 0.0432281494140625, 0.045444488525390625, 0.04766082763671875, 0.049877166748046875, 0.052093505859375, 0.054309844970703125, 0.05652618408203125, 0.058742523193359375, 0.0609588623046875, 0.06317520141601562, 0.06539154052734375, 0.06760787963867188, 0.06982421875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 9.0, 11.0, 13.0, 18.0, 27.0, 52.0, 106.0, 102.0, 143.0, 239.0, 345.0, 517.0, 755.0, 1333.0, 2212.0, 4008.0, 8235.0, 21451.0, 71233.0, 295663.0, 459488.0, 124802.0, 33349.0, 12019.0, 5275.0, 2812.0, 1589.0, 906.0, 606.0, 392.0, 256.0, 181.0, 120.0, 91.0, 61.0, 53.0, 22.0, 18.0, 12.0, 8.0, 10.0, 2.0, 8.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.054534912109375, -0.05294036865234375, -0.0513458251953125, -0.04975128173828125, -0.04815673828125, -0.04656219482421875, -0.0449676513671875, -0.04337310791015625, -0.041778564453125, -0.04018402099609375, -0.0385894775390625, -0.03699493408203125, -0.035400390625, -0.03380584716796875, -0.0322113037109375, -0.03061676025390625, -0.029022216796875, -0.02742767333984375, -0.0258331298828125, -0.02423858642578125, -0.02264404296875, -0.02104949951171875, -0.0194549560546875, -0.01786041259765625, -0.016265869140625, -0.01467132568359375, -0.0130767822265625, -0.01148223876953125, -0.0098876953125, -0.00829315185546875, -0.0066986083984375, -0.00510406494140625, -0.003509521484375, -0.00191497802734375, -0.0003204345703125, 0.00127410888671875, 0.00286865234375, 0.00446319580078125, 0.0060577392578125, 0.00765228271484375, 0.009246826171875, 0.01084136962890625, 0.0124359130859375, 0.01403045654296875, 0.015625, 0.01721954345703125, 0.0188140869140625, 0.02040863037109375, 0.022003173828125, 0.02359771728515625, 0.0251922607421875, 0.02678680419921875, 0.02838134765625, 0.02997589111328125, 0.0315704345703125, 0.03316497802734375, 0.034759521484375, 0.03635406494140625, 0.0379486083984375, 0.03954315185546875, 0.0411376953125, 0.04273223876953125, 0.0443267822265625, 0.04592132568359375, 0.047515869140625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 6.0, 15.0, 21.0, 20.0, 32.0, 79.0, 90.0, 142.0, 187.0, 149.0, 103.0, 57.0, 39.0, 26.0, 19.0, 11.0, 3.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.594989776611328e-05, -8.409842848777771e-05, -8.224695920944214e-05, -8.039548993110657e-05, -7.8544020652771e-05, -7.669255137443542e-05, -7.484108209609985e-05, -7.298961281776428e-05, -7.113814353942871e-05, -6.928667426109314e-05, -6.743520498275757e-05, -6.5583735704422e-05, -6.373226642608643e-05, -6.188079714775085e-05, -6.002932786941528e-05, -5.817785859107971e-05, -5.632638931274414e-05, -5.447492003440857e-05, -5.2623450756073e-05, -5.077198147773743e-05, -4.8920512199401855e-05, -4.7069042921066284e-05, -4.521757364273071e-05, -4.336610436439514e-05, -4.151463508605957e-05, -3.9663165807724e-05, -3.781169652938843e-05, -3.5960227251052856e-05, -3.4108757972717285e-05, -3.2257288694381714e-05, -3.0405819416046143e-05, -2.855435013771057e-05, -2.6702880859375e-05, -2.485141158103943e-05, -2.2999942302703857e-05, -2.1148473024368286e-05, -1.9297003746032715e-05, -1.7445534467697144e-05, -1.5594065189361572e-05, -1.3742595911026001e-05, -1.189112663269043e-05, -1.0039657354354858e-05, -8.188188076019287e-06, -6.336718797683716e-06, -4.4852495193481445e-06, -2.6337802410125732e-06, -7.82310962677002e-07, 1.0691583156585693e-06, 2.9206275939941406e-06, 4.772096872329712e-06, 6.623566150665283e-06, 8.475035429000854e-06, 1.0326504707336426e-05, 1.2177973985671997e-05, 1.4029443264007568e-05, 1.588091254234314e-05, 1.773238182067871e-05, 1.9583851099014282e-05, 2.1435320377349854e-05, 2.3286789655685425e-05, 2.5138258934020996e-05, 2.6989728212356567e-05, 2.884119749069214e-05, 3.069266676902771e-05, 3.254413604736328e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 8.0, 6.0, 12.0, 17.0, 20.0, 42.0, 72.0, 124.0, 249.0, 667.0, 2197.0, 10833.0, 222616.0, 782098.0, 24187.0, 3671.0, 964.0, 367.0, 165.0, 71.0, 56.0, 28.0, 17.0, 15.0, 11.0, 11.0, 8.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10650634765625, -0.10147762298583984, -0.09644889831542969, -0.09142017364501953, -0.08639144897460938, -0.08136272430419922, -0.07633399963378906, -0.0713052749633789, -0.06627655029296875, -0.061247825622558594, -0.05621910095214844, -0.05119037628173828, -0.046161651611328125, -0.04113292694091797, -0.03610420227050781, -0.031075477600097656, -0.0260467529296875, -0.021018028259277344, -0.015989303588867188, -0.010960578918457031, -0.005931854248046875, -0.0009031295776367188, 0.0041255950927734375, 0.009154319763183594, 0.01418304443359375, 0.019211769104003906, 0.024240493774414062, 0.02926921844482422, 0.034297943115234375, 0.03932666778564453, 0.04435539245605469, 0.049384117126464844, 0.054412841796875, 0.059441566467285156, 0.06447029113769531, 0.06949901580810547, 0.07452774047851562, 0.07955646514892578, 0.08458518981933594, 0.0896139144897461, 0.09464263916015625, 0.0996713638305664, 0.10470008850097656, 0.10972881317138672, 0.11475753784179688, 0.11978626251220703, 0.12481498718261719, 0.12984371185302734, 0.1348724365234375, 0.13990116119384766, 0.1449298858642578, 0.14995861053466797, 0.15498733520507812, 0.16001605987548828, 0.16504478454589844, 0.1700735092163086, 0.17510223388671875, 0.1801309585571289, 0.18515968322753906, 0.19018840789794922, 0.19521713256835938, 0.20024585723876953, 0.2052745819091797, 0.21030330657958984, 0.21533203125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 9.0, 7.0, 20.0, 22.0, 45.0, 80.0, 124.0, 163.0, 143.0, 151.0, 68.0, 54.0, 36.0, 25.0, 13.0, 7.0, 5.0, 5.0, 2.0, 1.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.050506591796875, -0.048220157623291016, -0.04593372344970703, -0.04364728927612305, -0.04136085510253906, -0.03907442092895508, -0.036787986755371094, -0.03450155258178711, -0.032215118408203125, -0.02992868423461914, -0.027642250061035156, -0.025355815887451172, -0.023069381713867188, -0.020782947540283203, -0.01849651336669922, -0.016210079193115234, -0.01392364501953125, -0.011637210845947266, -0.009350776672363281, -0.007064342498779297, -0.0047779083251953125, -0.002491474151611328, -0.00020503997802734375, 0.0020813941955566406, 0.004367828369140625, 0.006654262542724609, 0.008940696716308594, 0.011227130889892578, 0.013513565063476562, 0.015799999237060547, 0.01808643341064453, 0.020372867584228516, 0.0226593017578125, 0.024945735931396484, 0.02723217010498047, 0.029518604278564453, 0.03180503845214844, 0.03409147262573242, 0.036377906799316406, 0.03866434097290039, 0.040950775146484375, 0.04323720932006836, 0.045523643493652344, 0.04781007766723633, 0.05009651184082031, 0.0523829460144043, 0.05466938018798828, 0.056955814361572266, 0.05924224853515625, 0.061528682708740234, 0.06381511688232422, 0.0661015510559082, 0.06838798522949219, 0.07067441940307617, 0.07296085357666016, 0.07524728775024414, 0.07753372192382812, 0.07982015609741211, 0.0821065902709961, 0.08439302444458008, 0.08667945861816406, 0.08896589279174805, 0.09125232696533203, 0.09353876113891602, 0.0958251953125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 6.0, 8.0, 16.0, 16.0, 43.0, 77.0, 106.0, 158.0, 158.0, 148.0, 118.0, 58.0, 43.0, 19.0, 10.0, 11.0, 9.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5261595845222473, -0.5014950037002563, -0.47683045268058777, -0.4521659016609192, -0.4275013208389282, -0.40283676981925964, -0.37817221879959106, -0.3535076379776001, -0.3288430869579315, -0.30417853593826294, -0.279513955116272, -0.2548494040966034, -0.23018483817577362, -0.20552027225494385, -0.18085572123527527, -0.1561911553144455, -0.13152658939361572, -0.10686202347278595, -0.08219746500253677, -0.0575329065322876, -0.032868340611457825, -0.008203774690628052, 0.016460776329040527, 0.0411253422498703, 0.06578990817070007, 0.09045447409152985, 0.11511903256177902, 0.1397835910320282, 0.16444815695285797, 0.18911272287368774, 0.21377727389335632, 0.2384418398141861, 0.2631063461303711, 0.2877708971500397, 0.31243547797203064, 0.3371000289916992, 0.3617646098136902, 0.38642916083335876, 0.41109371185302734, 0.4357582926750183, 0.4604228436946869, 0.48508739471435547, 0.5097519755363464, 0.5344165563583374, 0.5590810775756836, 0.5837456583976746, 0.6084102392196655, 0.6330747604370117, 0.6577393412590027, 0.6824039220809937, 0.7070684432983398, 0.7317330241203308, 0.7563976049423218, 0.781062126159668, 0.8057267069816589, 0.8303912878036499, 0.8550558090209961, 0.8797203898429871, 0.9043849110603333, 0.9290494918823242, 0.9537140727043152, 0.9783786535263062, 1.0030431747436523, 1.0277076959609985, 1.0523723363876343]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 6.0, 6.0, 7.0, 9.0, 9.0, 10.0, 17.0, 16.0, 23.0, 27.0, 25.0, 20.0, 31.0, 42.0, 30.0, 30.0, 36.0, 46.0, 40.0, 51.0, 38.0, 37.0, 38.0, 45.0, 46.0, 43.0, 40.0, 37.0, 35.0, 18.0, 30.0, 18.0, 14.0, 15.0, 18.0, 3.0, 10.0, 13.0, 2.0, 9.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.49666398763656616, -0.48125702142715454, -0.46585002541542053, -0.4504430294036865, -0.4350360631942749, -0.4196290969848633, -0.4042221009731293, -0.38881510496139526, -0.37340813875198364, -0.358001172542572, -0.342594176530838, -0.327187180519104, -0.3117802143096924, -0.29637324810028076, -0.28096625208854675, -0.26555925607681274, -0.2501522898674011, -0.2347453087568283, -0.2193383276462555, -0.20393134653568268, -0.18852436542510986, -0.17311738431453705, -0.15771040320396423, -0.14230342209339142, -0.1268964409828186, -0.11148945987224579, -0.09608247876167297, -0.08067549765110016, -0.06526851654052734, -0.04986153542995453, -0.034454554319381714, -0.0190475732088089, -0.003640592098236084, 0.011766389012336731, 0.027173370122909546, 0.04258035123348236, 0.057987332344055176, 0.07339431345462799, 0.0888012945652008, 0.10420827567577362, 0.11961525678634644, 0.13502223789691925, 0.15042921900749207, 0.16583620011806488, 0.1812431812286377, 0.1966501623392105, 0.21205714344978333, 0.22746412456035614, 0.24287110567092896, 0.2582780718803406, 0.2736850678920746, 0.2890920639038086, 0.3044990301132202, 0.31990599632263184, 0.33531299233436584, 0.35071998834609985, 0.3661269545555115, 0.3815339207649231, 0.3969409167766571, 0.4123479127883911, 0.42775487899780273, 0.44316184520721436, 0.45856884121894836, 0.4739758372306824, 0.489382803440094]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 9.0, 12.0, 10.0, 11.0, 15.0, 40.0, 42.0, 63.0, 92.0, 138.0, 206.0, 336.0, 541.0, 1004.0, 2046.0, 5136.0, 16182.0, 77559.0, 3638498.0, 396478.0, 38505.0, 9941.0, 3622.0, 1595.0, 798.0, 463.0, 298.0, 189.0, 122.0, 86.0, 63.0, 45.0, 39.0, 34.0, 12.0, 17.0, 11.0, 8.0, 6.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.12841796875, -0.12410926818847656, -0.11980056762695312, -0.11549186706542969, -0.11118316650390625, -0.10687446594238281, -0.10256576538085938, -0.09825706481933594, -0.0939483642578125, -0.08963966369628906, -0.08533096313476562, -0.08102226257324219, -0.07671356201171875, -0.07240486145019531, -0.06809616088867188, -0.06378746032714844, -0.059478759765625, -0.05517005920410156, -0.050861358642578125, -0.04655265808105469, -0.04224395751953125, -0.03793525695800781, -0.033626556396484375, -0.029317855834960938, -0.0250091552734375, -0.020700454711914062, -0.016391754150390625, -0.012083053588867188, -0.00777435302734375, -0.0034656524658203125, 0.000843048095703125, 0.0051517486572265625, 0.00946044921875, 0.013769149780273438, 0.018077850341796875, 0.022386550903320312, 0.02669525146484375, 0.031003952026367188, 0.035312652587890625, 0.03962135314941406, 0.0439300537109375, 0.04823875427246094, 0.052547454833984375, 0.05685615539550781, 0.06116485595703125, 0.06547355651855469, 0.06978225708007812, 0.07409095764160156, 0.078399658203125, 0.08270835876464844, 0.08701705932617188, 0.09132575988769531, 0.09563446044921875, 0.09994316101074219, 0.10425186157226562, 0.10856056213378906, 0.1128692626953125, 0.11717796325683594, 0.12148666381835938, 0.1257953643798828, 0.13010406494140625, 0.1344127655029297, 0.13872146606445312, 0.14303016662597656, 0.1473388671875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 6.0, 6.0, 6.0, 6.0, 11.0, 8.0, 16.0, 12.0, 22.0, 25.0, 42.0, 46.0, 53.0, 47.0, 69.0, 80.0, 71.0, 84.0, 73.0, 73.0, 39.0, 45.0, 32.0, 25.0, 24.0, 18.0, 15.0, 10.0, 8.0, 8.0, 7.0, 4.0, 2.0, 4.0, 5.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0196685791015625, -0.019065380096435547, -0.018462181091308594, -0.01785898208618164, -0.017255783081054688, -0.016652584075927734, -0.01604938507080078, -0.015446186065673828, -0.014842987060546875, -0.014239788055419922, -0.013636589050292969, -0.013033390045166016, -0.012430191040039062, -0.01182699203491211, -0.011223793029785156, -0.010620594024658203, -0.01001739501953125, -0.009414196014404297, -0.008810997009277344, -0.00820779800415039, -0.0076045989990234375, -0.007001399993896484, -0.006398200988769531, -0.005795001983642578, -0.005191802978515625, -0.004588603973388672, -0.003985404968261719, -0.0033822059631347656, -0.0027790069580078125, -0.0021758079528808594, -0.0015726089477539062, -0.0009694099426269531, -0.0003662109375, 0.00023698806762695312, 0.0008401870727539062, 0.0014433860778808594, 0.0020465850830078125, 0.0026497840881347656, 0.0032529830932617188, 0.003856182098388672, 0.004459381103515625, 0.005062580108642578, 0.005665779113769531, 0.006268978118896484, 0.0068721771240234375, 0.007475376129150391, 0.008078575134277344, 0.008681774139404297, 0.00928497314453125, 0.009888172149658203, 0.010491371154785156, 0.01109457015991211, 0.011697769165039062, 0.012300968170166016, 0.012904167175292969, 0.013507366180419922, 0.014110565185546875, 0.014713764190673828, 0.015316963195800781, 0.015920162200927734, 0.016523361206054688, 0.01712656021118164, 0.017729759216308594, 0.018332958221435547, 0.0189361572265625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 6.0, 8.0, 16.0, 35.0, 72.0, 103.0, 175.0, 366.0, 908.0, 1973.0, 5086.0, 15355.0, 59749.0, 555866.0, 3391310.0, 124937.0, 25298.0, 7843.0, 2825.0, 1165.0, 610.0, 280.0, 138.0, 63.0, 40.0, 27.0, 15.0, 7.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13427734375, -0.1305685043334961, -0.1268596649169922, -0.12315082550048828, -0.11944198608398438, -0.11573314666748047, -0.11202430725097656, -0.10831546783447266, -0.10460662841796875, -0.10089778900146484, -0.09718894958496094, -0.09348011016845703, -0.08977127075195312, -0.08606243133544922, -0.08235359191894531, -0.0786447525024414, -0.0749359130859375, -0.0712270736694336, -0.06751823425292969, -0.06380939483642578, -0.060100555419921875, -0.05639171600341797, -0.05268287658691406, -0.048974037170410156, -0.04526519775390625, -0.041556358337402344, -0.03784751892089844, -0.03413867950439453, -0.030429840087890625, -0.02672100067138672, -0.023012161254882812, -0.019303321838378906, -0.015594482421875, -0.011885643005371094, -0.008176803588867188, -0.004467964172363281, -0.000759124755859375, 0.0029497146606445312, 0.0066585540771484375, 0.010367393493652344, 0.01407623291015625, 0.017785072326660156, 0.021493911743164062, 0.02520275115966797, 0.028911590576171875, 0.03262042999267578, 0.03632926940917969, 0.040038108825683594, 0.0437469482421875, 0.047455787658691406, 0.05116462707519531, 0.05487346649169922, 0.058582305908203125, 0.06229114532470703, 0.06599998474121094, 0.06970882415771484, 0.07341766357421875, 0.07712650299072266, 0.08083534240722656, 0.08454418182373047, 0.08825302124023438, 0.09196186065673828, 0.09567070007324219, 0.0993795394897461, 0.10308837890625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 1.0, 1.0, 4.0, 2.0, 7.0, 6.0, 10.0, 12.0, 15.0, 20.0, 21.0, 26.0, 61.0, 90.0, 147.0, 235.0, 717.0, 1767.0, 419.0, 193.0, 101.0, 60.0, 43.0, 28.0, 28.0, 20.0, 7.0, 12.0, 8.0, 7.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0295257568359375, -0.028580665588378906, -0.027635574340820312, -0.02669048309326172, -0.025745391845703125, -0.02480030059814453, -0.023855209350585938, -0.022910118103027344, -0.02196502685546875, -0.021019935607910156, -0.020074844360351562, -0.01912975311279297, -0.018184661865234375, -0.01723957061767578, -0.016294479370117188, -0.015349388122558594, -0.014404296875, -0.013459205627441406, -0.012514114379882812, -0.011569023132324219, -0.010623931884765625, -0.009678840637207031, -0.008733749389648438, -0.007788658142089844, -0.00684356689453125, -0.005898475646972656, -0.0049533843994140625, -0.004008293151855469, -0.003063201904296875, -0.0021181106567382812, -0.0011730194091796875, -0.00022792816162109375, 0.0007171630859375, 0.0016622543334960938, 0.0026073455810546875, 0.0035524368286132812, 0.004497528076171875, 0.005442619323730469, 0.0063877105712890625, 0.007332801818847656, 0.00827789306640625, 0.009222984313964844, 0.010168075561523438, 0.011113166809082031, 0.012058258056640625, 0.013003349304199219, 0.013948440551757812, 0.014893531799316406, 0.015838623046875, 0.016783714294433594, 0.017728805541992188, 0.01867389678955078, 0.019618988037109375, 0.02056407928466797, 0.021509170532226562, 0.022454261779785156, 0.02339935302734375, 0.024344444274902344, 0.025289535522460938, 0.02623462677001953, 0.027179718017578125, 0.02812480926513672, 0.029069900512695312, 0.030014991760253906, 0.0309600830078125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 7.0, 5.0, 12.0, 20.0, 28.0, 31.0, 45.0, 55.0, 87.0, 111.0, 129.0, 111.0, 101.0, 75.0, 51.0, 45.0, 26.0, 18.0, 14.0, 6.0, 2.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10153816640377045, -0.09757574647665024, -0.09361332654953003, -0.08965090662240982, -0.08568848669528961, -0.0817260593175888, -0.0777636393904686, -0.07380121946334839, -0.06983879953622818, -0.06587637960910797, -0.06191395968198776, -0.057951536029577255, -0.053989116102457047, -0.05002669617533684, -0.04606427252292633, -0.04210185259580612, -0.03813943266868591, -0.034177012741565704, -0.030214590951800346, -0.02625216916203499, -0.02228974923491478, -0.01832732930779457, -0.014364907518029213, -0.010402485728263855, -0.006440065801143646, -0.002477644942700863, 0.0014847759157419205, 0.005447196774184704, 0.009409617632627487, 0.013372037559747696, 0.017334459349513054, 0.021296881139278412, 0.025259315967559814, 0.029221735894680023, 0.03318415582180023, 0.03714657947421074, 0.04110899940133095, 0.04507141932845116, 0.049033842980861664, 0.05299626290798187, 0.05695868283510208, 0.06092110276222229, 0.0648835226893425, 0.06884594261646271, 0.07280836999416351, 0.07677078247070312, 0.08073320984840393, 0.08469562977552414, 0.08865804970264435, 0.09262046962976456, 0.09658288955688477, 0.10054530948400497, 0.10450772941112518, 0.10847015678882599, 0.1124325767159462, 0.1163949966430664, 0.12035741657018661, 0.12431983649730682, 0.12828226387500763, 0.13224467635154724, 0.13620710372924805, 0.14016951620578766, 0.14413194358348846, 0.14809435606002808, 0.15205678343772888]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 1.0, 5.0, 8.0, 6.0, 6.0, 16.0, 17.0, 12.0, 16.0, 14.0, 22.0, 25.0, 28.0, 34.0, 41.0, 40.0, 30.0, 33.0, 40.0, 32.0, 50.0, 59.0, 31.0, 44.0, 44.0, 43.0, 35.0, 38.0, 42.0, 27.0, 22.0, 14.0, 20.0, 14.0, 20.0, 18.0, 5.0, 18.0, 8.0, 2.0, 2.0, 6.0, 5.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.08024102449417114, -0.07758000493049622, -0.07491899281740189, -0.07225797325372696, -0.06959696114063263, -0.0669359415769577, -0.06427492201328278, -0.06161390617489815, -0.05895289033651352, -0.05629187449812889, -0.05363085865974426, -0.050969839096069336, -0.04830882325768471, -0.04564780741930008, -0.04298678785562515, -0.040325772017240524, -0.037664756178855896, -0.03500374034047127, -0.03234272450208664, -0.029681704938411713, -0.027020689100027084, -0.024359673261642456, -0.02169865556061268, -0.0190376378595829, -0.016376622021198273, -0.01371560525149107, -0.011054588481783867, -0.008393571712076664, -0.005732554942369461, -0.003071538172662258, -0.00041052140295505524, 0.0022504962980747223, 0.004911512136459351, 0.0075725289061665535, 0.010233545675873756, 0.01289456244558096, 0.015555579215288162, 0.01821659505367279, 0.020877612754702568, 0.023538630455732346, 0.026199646294116974, 0.028860662132501602, 0.03152167797088623, 0.03418269753456116, 0.036843713372945786, 0.039504729211330414, 0.04216574877500534, 0.04482676461338997, 0.0474877804517746, 0.050148796290159225, 0.052809812128543854, 0.05547083169221878, 0.05813184753060341, 0.06079286336898804, 0.06345388293266296, 0.06611490249633789, 0.06877591460943222, 0.07143693417310715, 0.07409794628620148, 0.0767589658498764, 0.07941998541355133, 0.08208099752664566, 0.08474201709032059, 0.08740302920341492, 0.09006404876708984]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 7.0, 10.0, 27.0, 33.0, 32.0, 54.0, 74.0, 137.0, 144.0, 248.0, 394.0, 586.0, 837.0, 1564.0, 2573.0, 4250.0, 7376.0, 13223.0, 25448.0, 50624.0, 105914.0, 222735.0, 298507.0, 159194.0, 74791.0, 36437.0, 18901.0, 10208.0, 5473.0, 3216.0, 2052.0, 1188.0, 799.0, 474.0, 347.0, 213.0, 154.0, 103.0, 54.0, 46.0, 39.0, 17.0, 9.0, 7.0, 12.0, 6.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.055572509765625, -0.05390214920043945, -0.052231788635253906, -0.05056142807006836, -0.04889106750488281, -0.047220706939697266, -0.04555034637451172, -0.04387998580932617, -0.042209625244140625, -0.04053926467895508, -0.03886890411376953, -0.037198543548583984, -0.03552818298339844, -0.03385782241821289, -0.032187461853027344, -0.030517101287841797, -0.02884674072265625, -0.027176380157470703, -0.025506019592285156, -0.02383565902709961, -0.022165298461914062, -0.020494937896728516, -0.01882457733154297, -0.017154216766357422, -0.015483856201171875, -0.013813495635986328, -0.012143135070800781, -0.010472774505615234, -0.008802413940429688, -0.007132053375244141, -0.005461692810058594, -0.003791332244873047, -0.0021209716796875, -0.0004506111145019531, 0.0012197494506835938, 0.0028901100158691406, 0.0045604705810546875, 0.006230831146240234, 0.007901191711425781, 0.009571552276611328, 0.011241912841796875, 0.012912273406982422, 0.014582633972167969, 0.016252994537353516, 0.017923355102539062, 0.01959371566772461, 0.021264076232910156, 0.022934436798095703, 0.02460479736328125, 0.026275157928466797, 0.027945518493652344, 0.02961587905883789, 0.03128623962402344, 0.032956600189208984, 0.03462696075439453, 0.03629732131958008, 0.037967681884765625, 0.03963804244995117, 0.04130840301513672, 0.042978763580322266, 0.04464912414550781, 0.04631948471069336, 0.047989845275878906, 0.04966020584106445, 0.05133056640625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 7.0, 2.0, 5.0, 15.0, 12.0, 22.0, 18.0, 31.0, 29.0, 32.0, 50.0, 46.0, 72.0, 66.0, 64.0, 76.0, 63.0, 55.0, 59.0, 58.0, 42.0, 47.0, 22.0, 29.0, 15.0, 11.0, 7.0, 6.0, 9.0, 7.0, 2.0, 9.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.019561767578125, -0.018991708755493164, -0.018421649932861328, -0.017851591110229492, -0.017281532287597656, -0.01671147346496582, -0.016141414642333984, -0.015571355819702148, -0.015001296997070312, -0.014431238174438477, -0.01386117935180664, -0.013291120529174805, -0.012721061706542969, -0.012151002883911133, -0.011580944061279297, -0.011010885238647461, -0.010440826416015625, -0.009870767593383789, -0.009300708770751953, -0.008730649948120117, -0.008160591125488281, -0.007590532302856445, -0.007020473480224609, -0.0064504146575927734, -0.0058803558349609375, -0.0053102970123291016, -0.004740238189697266, -0.00417017936706543, -0.0036001205444335938, -0.003030061721801758, -0.002460002899169922, -0.001889944076538086, -0.00131988525390625, -0.0007498264312744141, -0.00017976760864257812, 0.0003902912139892578, 0.0009603500366210938, 0.0015304088592529297, 0.0021004676818847656, 0.0026705265045166016, 0.0032405853271484375, 0.0038106441497802734, 0.004380702972412109, 0.004950761795043945, 0.005520820617675781, 0.006090879440307617, 0.006660938262939453, 0.007230997085571289, 0.007801055908203125, 0.008371114730834961, 0.008941173553466797, 0.009511232376098633, 0.010081291198730469, 0.010651350021362305, 0.01122140884399414, 0.011791467666625977, 0.012361526489257812, 0.012931585311889648, 0.013501644134521484, 0.01407170295715332, 0.014641761779785156, 0.015211820602416992, 0.015781879425048828, 0.016351938247680664, 0.0169219970703125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 5.0, 9.0, 7.0, 8.0, 14.0, 17.0, 16.0, 30.0, 58.0, 68.0, 88.0, 119.0, 182.0, 245.0, 378.0, 596.0, 1022.0, 1885.0, 4027.0, 9376.0, 25054.0, 75623.0, 228990.0, 405571.0, 194491.0, 63303.0, 21265.0, 8167.0, 3557.0, 1628.0, 973.0, 585.0, 368.0, 235.0, 180.0, 111.0, 78.0, 51.0, 51.0, 33.0, 29.0, 18.0, 16.0, 8.0, 7.0, 4.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.071044921875, -0.06891918182373047, -0.06679344177246094, -0.0646677017211914, -0.06254196166992188, -0.060416221618652344, -0.05829048156738281, -0.05616474151611328, -0.05403900146484375, -0.05191326141357422, -0.04978752136230469, -0.047661781311035156, -0.045536041259765625, -0.043410301208496094, -0.04128456115722656, -0.03915882110595703, -0.0370330810546875, -0.03490734100341797, -0.03278160095214844, -0.030655860900878906, -0.028530120849609375, -0.026404380798339844, -0.024278640747070312, -0.02215290069580078, -0.02002716064453125, -0.01790142059326172, -0.015775680541992188, -0.013649940490722656, -0.011524200439453125, -0.009398460388183594, -0.0072727203369140625, -0.005146980285644531, -0.003021240234375, -0.0008955001831054688, 0.0012302398681640625, 0.0033559799194335938, 0.005481719970703125, 0.007607460021972656, 0.009733200073242188, 0.011858940124511719, 0.01398468017578125, 0.01611042022705078, 0.018236160278320312, 0.020361900329589844, 0.022487640380859375, 0.024613380432128906, 0.026739120483398438, 0.02886486053466797, 0.0309906005859375, 0.03311634063720703, 0.03524208068847656, 0.037367820739746094, 0.039493560791015625, 0.041619300842285156, 0.04374504089355469, 0.04587078094482422, 0.04799652099609375, 0.05012226104736328, 0.05224800109863281, 0.054373741149902344, 0.056499481201171875, 0.058625221252441406, 0.06075096130371094, 0.06287670135498047, 0.06500244140625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 5.0, 2.0, 3.0, 4.0, 5.0, 13.0, 10.0, 15.0, 18.0, 24.0, 22.0, 22.0, 28.0, 32.0, 25.0, 35.0, 34.0, 31.0, 47.0, 45.0, 53.0, 41.0, 46.0, 39.0, 38.0, 33.0, 43.0, 31.0, 32.0, 46.0, 25.0, 25.0, 20.0, 18.0, 15.0, 17.0, 14.0, 12.0, 5.0, 3.0, 8.0, 7.0, 3.0, 3.0, 4.0, 5.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.0765380859375, -0.07442569732666016, -0.07231330871582031, -0.07020092010498047, -0.06808853149414062, -0.06597614288330078, -0.06386375427246094, -0.061751365661621094, -0.05963897705078125, -0.057526588439941406, -0.05541419982910156, -0.05330181121826172, -0.051189422607421875, -0.04907703399658203, -0.04696464538574219, -0.044852256774902344, -0.0427398681640625, -0.040627479553222656, -0.03851509094238281, -0.03640270233154297, -0.034290313720703125, -0.03217792510986328, -0.030065536499023438, -0.027953147888183594, -0.02584075927734375, -0.023728370666503906, -0.021615982055664062, -0.01950359344482422, -0.017391204833984375, -0.015278816223144531, -0.013166427612304688, -0.011054039001464844, -0.008941650390625, -0.006829261779785156, -0.0047168731689453125, -0.0026044845581054688, -0.000492095947265625, 0.0016202926635742188, 0.0037326812744140625, 0.005845069885253906, 0.00795745849609375, 0.010069847106933594, 0.012182235717773438, 0.014294624328613281, 0.016407012939453125, 0.01851940155029297, 0.020631790161132812, 0.022744178771972656, 0.0248565673828125, 0.026968955993652344, 0.029081344604492188, 0.03119373321533203, 0.033306121826171875, 0.03541851043701172, 0.03753089904785156, 0.039643287658691406, 0.04175567626953125, 0.043868064880371094, 0.04598045349121094, 0.04809284210205078, 0.050205230712890625, 0.05231761932373047, 0.05443000793457031, 0.056542396545410156, 0.05865478515625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 7.0, 15.0, 13.0, 15.0, 23.0, 34.0, 55.0, 78.0, 96.0, 139.0, 243.0, 449.0, 728.0, 1332.0, 2706.0, 5568.0, 13143.0, 34961.0, 105435.0, 351051.0, 361193.0, 109679.0, 36006.0, 13630.0, 5749.0, 2790.0, 1382.0, 764.0, 463.0, 274.0, 183.0, 106.0, 81.0, 44.0, 35.0, 17.0, 18.0, 14.0, 8.0, 6.0, 1.0, 7.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.03448486328125, -0.033471107482910156, -0.03245735168457031, -0.03144359588623047, -0.030429840087890625, -0.02941608428955078, -0.028402328491210938, -0.027388572692871094, -0.02637481689453125, -0.025361061096191406, -0.024347305297851562, -0.02333354949951172, -0.022319793701171875, -0.02130603790283203, -0.020292282104492188, -0.019278526306152344, -0.0182647705078125, -0.017251014709472656, -0.016237258911132812, -0.015223503112792969, -0.014209747314453125, -0.013195991516113281, -0.012182235717773438, -0.011168479919433594, -0.01015472412109375, -0.009140968322753906, -0.008127212524414062, -0.007113456726074219, -0.006099700927734375, -0.005085945129394531, -0.0040721893310546875, -0.0030584335327148438, -0.002044677734375, -0.0010309219360351562, -1.71661376953125e-05, 0.0009965896606445312, 0.002010345458984375, 0.0030241012573242188, 0.0040378570556640625, 0.005051612854003906, 0.00606536865234375, 0.007079124450683594, 0.008092880249023438, 0.009106636047363281, 0.010120391845703125, 0.011134147644042969, 0.012147903442382812, 0.013161659240722656, 0.0141754150390625, 0.015189170837402344, 0.016202926635742188, 0.01721668243408203, 0.018230438232421875, 0.01924419403076172, 0.020257949829101562, 0.021271705627441406, 0.02228546142578125, 0.023299217224121094, 0.024312973022460938, 0.02532672882080078, 0.026340484619140625, 0.02735424041748047, 0.028367996215820312, 0.029381752014160156, 0.0303955078125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 13.0, 15.0, 16.0, 28.0, 34.0, 46.0, 45.0, 86.0, 85.0, 86.0, 100.0, 108.0, 69.0, 70.0, 47.0, 43.0, 28.0, 25.0, 12.0, 8.0, 5.0, 5.0, 5.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.7087669372558594e-05, -4.5942142605781555e-05, -4.4796615839004517e-05, -4.365108907222748e-05, -4.250556230545044e-05, -4.13600355386734e-05, -4.021450877189636e-05, -3.9068982005119324e-05, -3.7923455238342285e-05, -3.6777928471565247e-05, -3.563240170478821e-05, -3.448687493801117e-05, -3.334134817123413e-05, -3.219582140445709e-05, -3.1050294637680054e-05, -2.9904767870903015e-05, -2.8759241104125977e-05, -2.7613714337348938e-05, -2.64681875705719e-05, -2.532266080379486e-05, -2.4177134037017822e-05, -2.3031607270240784e-05, -2.1886080503463745e-05, -2.0740553736686707e-05, -1.9595026969909668e-05, -1.844950020313263e-05, -1.730397343635559e-05, -1.6158446669578552e-05, -1.5012919902801514e-05, -1.3867393136024475e-05, -1.2721866369247437e-05, -1.1576339602470398e-05, -1.043081283569336e-05, -9.28528606891632e-06, -8.139759302139282e-06, -6.994232535362244e-06, -5.848705768585205e-06, -4.7031790018081665e-06, -3.557652235031128e-06, -2.4121254682540894e-06, -1.2665987014770508e-06, -1.210719347000122e-07, 1.0244548320770264e-06, 2.169981598854065e-06, 3.3155083656311035e-06, 4.461035132408142e-06, 5.606561899185181e-06, 6.752088665962219e-06, 7.897615432739258e-06, 9.043142199516296e-06, 1.0188668966293335e-05, 1.1334195733070374e-05, 1.2479722499847412e-05, 1.362524926662445e-05, 1.477077603340149e-05, 1.5916302800178528e-05, 1.7061829566955566e-05, 1.8207356333732605e-05, 1.9352883100509644e-05, 2.0498409867286682e-05, 2.164393663406372e-05, 2.278946340084076e-05, 2.3934990167617798e-05, 2.5080516934394836e-05, 2.6226043701171875e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 5.0, 4.0, 14.0, 11.0, 15.0, 25.0, 29.0, 51.0, 93.0, 132.0, 260.0, 433.0, 890.0, 2231.0, 6922.0, 29549.0, 167603.0, 631490.0, 168106.0, 29552.0, 6970.0, 2183.0, 968.0, 457.0, 222.0, 137.0, 71.0, 47.0, 28.0, 22.0, 11.0, 7.0, 10.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052520751953125, -0.050952911376953125, -0.04938507080078125, -0.047817230224609375, -0.0462493896484375, -0.044681549072265625, -0.04311370849609375, -0.041545867919921875, -0.03997802734375, -0.038410186767578125, -0.03684234619140625, -0.035274505615234375, -0.0337066650390625, -0.032138824462890625, -0.03057098388671875, -0.029003143310546875, -0.027435302734375, -0.025867462158203125, -0.02429962158203125, -0.022731781005859375, -0.0211639404296875, -0.019596099853515625, -0.01802825927734375, -0.016460418701171875, -0.014892578125, -0.013324737548828125, -0.01175689697265625, -0.010189056396484375, -0.0086212158203125, -0.007053375244140625, -0.00548553466796875, -0.003917694091796875, -0.002349853515625, -0.000782012939453125, 0.00078582763671875, 0.002353668212890625, 0.0039215087890625, 0.005489349365234375, 0.00705718994140625, 0.008625030517578125, 0.01019287109375, 0.011760711669921875, 0.01332855224609375, 0.014896392822265625, 0.0164642333984375, 0.018032073974609375, 0.01959991455078125, 0.021167755126953125, 0.022735595703125, 0.024303436279296875, 0.02587127685546875, 0.027439117431640625, 0.0290069580078125, 0.030574798583984375, 0.03214263916015625, 0.033710479736328125, 0.0352783203125, 0.036846160888671875, 0.03841400146484375, 0.039981842041015625, 0.0415496826171875, 0.043117523193359375, 0.04468536376953125, 0.046253204345703125, 0.047821044921875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 4.0, 8.0, 9.0, 4.0, 9.0, 13.0, 18.0, 33.0, 51.0, 49.0, 73.0, 98.0, 102.0, 118.0, 105.0, 89.0, 65.0, 45.0, 34.0, 29.0, 19.0, 14.0, 8.0, 7.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.05975341796875, -0.05840444564819336, -0.05705547332763672, -0.05570650100708008, -0.05435752868652344, -0.0530085563659668, -0.051659584045410156, -0.050310611724853516, -0.048961639404296875, -0.047612667083740234, -0.046263694763183594, -0.04491472244262695, -0.04356575012207031, -0.04221677780151367, -0.04086780548095703, -0.03951883316040039, -0.03816986083984375, -0.03682088851928711, -0.03547191619873047, -0.03412294387817383, -0.03277397155761719, -0.03142499923706055, -0.030076026916503906, -0.028727054595947266, -0.027378082275390625, -0.026029109954833984, -0.024680137634277344, -0.023331165313720703, -0.021982192993164062, -0.020633220672607422, -0.01928424835205078, -0.01793527603149414, -0.0165863037109375, -0.01523733139038086, -0.013888359069824219, -0.012539386749267578, -0.011190414428710938, -0.009841442108154297, -0.008492469787597656, -0.007143497467041016, -0.005794525146484375, -0.004445552825927734, -0.0030965805053710938, -0.0017476081848144531, -0.0003986358642578125, 0.0009503364562988281, 0.0022993087768554688, 0.0036482810974121094, 0.00499725341796875, 0.006346225738525391, 0.007695198059082031, 0.009044170379638672, 0.010393142700195312, 0.011742115020751953, 0.013091087341308594, 0.014440059661865234, 0.015789031982421875, 0.017138004302978516, 0.018486976623535156, 0.019835948944091797, 0.021184921264648438, 0.022533893585205078, 0.02388286590576172, 0.02523183822631836, 0.026580810546875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 13.0, 16.0, 49.0, 117.0, 219.0, 235.0, 177.0, 115.0, 33.0, 18.0, 12.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42393758893013, -0.39454230666160583, -0.36514702439308167, -0.3357517421245575, -0.3063564598560333, -0.27696117758750916, -0.24756589531898499, -0.21817061305046082, -0.18877533078193665, -0.15938004851341248, -0.1299847662448883, -0.10058948397636414, -0.07119420170783997, -0.041798919439315796, -0.012403637170791626, 0.016991645097732544, 0.046386927366256714, 0.07578220963478088, 0.10517749190330505, 0.13457277417182922, 0.1639680564403534, 0.19336333870887756, 0.22275862097740173, 0.2521539032459259, 0.2815491855144501, 0.31094446778297424, 0.3403397500514984, 0.3697350323200226, 0.39913031458854675, 0.4285255968570709, 0.4579208791255951, 0.48731616139411926, 0.5167114734649658, 0.54610675573349, 0.5755020380020142, 0.6048973202705383, 0.6342926025390625, 0.6636878848075867, 0.6930831670761108, 0.722478449344635, 0.7518737316131592, 0.7812690138816833, 0.8106642961502075, 0.8400595784187317, 0.8694548606872559, 0.89885014295578, 0.9282454252243042, 0.9576407074928284, 0.9870359897613525, 1.0164313316345215, 1.0458265542984009, 1.0752217769622803, 1.1046171188354492, 1.1340124607086182, 1.1634076833724976, 1.192802906036377, 1.222198247909546, 1.2515935897827148, 1.2809888124465942, 1.3103840351104736, 1.3397793769836426, 1.3691747188568115, 1.398569941520691, 1.4279651641845703, 1.4573605060577393]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 5.0, 5.0, 7.0, 8.0, 9.0, 9.0, 10.0, 13.0, 19.0, 23.0, 24.0, 22.0, 25.0, 34.0, 40.0, 37.0, 54.0, 38.0, 61.0, 48.0, 52.0, 57.0, 61.0, 43.0, 50.0, 40.0, 34.0, 23.0, 19.0, 20.0, 21.0, 24.0, 15.0, 13.0, 13.0, 10.0, 3.0, 3.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.5078218579292297, -0.4937440752983093, -0.4796662926673889, -0.4655885100364685, -0.4515107274055481, -0.4374329447746277, -0.4233551621437073, -0.40927737951278687, -0.39519959688186646, -0.38112181425094604, -0.36704403162002563, -0.3529662489891052, -0.3388884663581848, -0.3248106837272644, -0.310732901096344, -0.2966551184654236, -0.2825773358345032, -0.26849955320358276, -0.25442177057266235, -0.24034398794174194, -0.22626620531082153, -0.21218842267990112, -0.1981106400489807, -0.1840328574180603, -0.1699550747871399, -0.15587729215621948, -0.14179950952529907, -0.12772172689437866, -0.11364394426345825, -0.09956616163253784, -0.08548837900161743, -0.07141059637069702, -0.05733281373977661, -0.0432550311088562, -0.02917724847793579, -0.01509946584701538, -0.0010216832160949707, 0.01305609941482544, 0.02713388204574585, 0.04121166467666626, 0.05528944730758667, 0.06936722993850708, 0.08344501256942749, 0.0975227952003479, 0.11160057783126831, 0.12567836046218872, 0.13975614309310913, 0.15383392572402954, 0.16791170835494995, 0.18198949098587036, 0.19606727361679077, 0.21014505624771118, 0.2242228388786316, 0.238300621509552, 0.2523784041404724, 0.2664561867713928, 0.28053396940231323, 0.29461175203323364, 0.30868953466415405, 0.32276731729507446, 0.3368450999259949, 0.3509228825569153, 0.3650006651878357, 0.3790784478187561, 0.3931562304496765]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 7.0, 5.0, 7.0, 9.0, 11.0, 18.0, 28.0, 40.0, 81.0, 106.0, 141.0, 235.0, 379.0, 612.0, 1035.0, 1793.0, 3568.0, 7368.0, 17966.0, 58294.0, 507898.0, 3451142.0, 98614.0, 25213.0, 9634.0, 4447.0, 2297.0, 1273.0, 741.0, 420.0, 266.0, 199.0, 150.0, 92.0, 61.0, 44.0, 31.0, 22.0, 15.0, 7.0, 2.0, 7.0, 1.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0804443359375, -0.07758903503417969, -0.07473373413085938, -0.07187843322753906, -0.06902313232421875, -0.06616783142089844, -0.06331253051757812, -0.06045722961425781, -0.0576019287109375, -0.05474662780761719, -0.051891326904296875, -0.04903602600097656, -0.04618072509765625, -0.04332542419433594, -0.040470123291015625, -0.03761482238769531, -0.034759521484375, -0.03190422058105469, -0.029048919677734375, -0.026193618774414062, -0.02333831787109375, -0.020483016967773438, -0.017627716064453125, -0.014772415161132812, -0.0119171142578125, -0.009061813354492188, -0.006206512451171875, -0.0033512115478515625, -0.00049591064453125, 0.0023593902587890625, 0.005214691162109375, 0.008069992065429688, 0.01092529296875, 0.013780593872070312, 0.016635894775390625, 0.019491195678710938, 0.02234649658203125, 0.025201797485351562, 0.028057098388671875, 0.030912399291992188, 0.0337677001953125, 0.03662300109863281, 0.039478302001953125, 0.04233360290527344, 0.04518890380859375, 0.04804420471191406, 0.050899505615234375, 0.05375480651855469, 0.056610107421875, 0.05946540832519531, 0.062320709228515625, 0.06517601013183594, 0.06803131103515625, 0.07088661193847656, 0.07374191284179688, 0.07659721374511719, 0.0794525146484375, 0.08230781555175781, 0.08516311645507812, 0.08801841735839844, 0.09087371826171875, 0.09372901916503906, 0.09658432006835938, 0.09943962097167969, 0.102294921875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 5.0, 9.0, 13.0, 6.0, 19.0, 18.0, 26.0, 29.0, 33.0, 37.0, 52.0, 50.0, 49.0, 64.0, 57.0, 64.0, 67.0, 60.0, 55.0, 33.0, 37.0, 47.0, 30.0, 24.0, 21.0, 14.0, 20.0, 14.0, 6.0, 9.0, 4.0, 3.0, 3.0, 6.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0189056396484375, -0.0183560848236084, -0.017806529998779297, -0.017256975173950195, -0.016707420349121094, -0.016157865524291992, -0.01560831069946289, -0.015058755874633789, -0.014509201049804688, -0.013959646224975586, -0.013410091400146484, -0.012860536575317383, -0.012310981750488281, -0.01176142692565918, -0.011211872100830078, -0.010662317276000977, -0.010112762451171875, -0.009563207626342773, -0.009013652801513672, -0.00846409797668457, -0.007914543151855469, -0.007364988327026367, -0.006815433502197266, -0.006265878677368164, -0.0057163238525390625, -0.005166769027709961, -0.004617214202880859, -0.004067659378051758, -0.0035181045532226562, -0.0029685497283935547, -0.002418994903564453, -0.0018694400787353516, -0.00131988525390625, -0.0007703304290771484, -0.00022077560424804688, 0.0003287792205810547, 0.0008783340454101562, 0.0014278888702392578, 0.0019774436950683594, 0.002526998519897461, 0.0030765533447265625, 0.003626108169555664, 0.004175662994384766, 0.004725217819213867, 0.005274772644042969, 0.00582432746887207, 0.006373882293701172, 0.0069234371185302734, 0.007472991943359375, 0.008022546768188477, 0.008572101593017578, 0.00912165641784668, 0.009671211242675781, 0.010220766067504883, 0.010770320892333984, 0.011319875717163086, 0.011869430541992188, 0.012418985366821289, 0.01296854019165039, 0.013518095016479492, 0.014067649841308594, 0.014617204666137695, 0.015166759490966797, 0.0157163143157959, 0.016265869140625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 5.0, 11.0, 12.0, 30.0, 29.0, 41.0, 68.0, 90.0, 201.0, 369.0, 747.0, 1808.0, 4738.0, 14161.0, 60029.0, 773628.0, 3213419.0, 94480.0, 19564.0, 6198.0, 2341.0, 1042.0, 496.0, 285.0, 156.0, 100.0, 67.0, 54.0, 36.0, 28.0, 14.0, 7.0, 10.0, 9.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08697509765625, -0.08336925506591797, -0.07976341247558594, -0.0761575698852539, -0.07255172729492188, -0.06894588470458984, -0.06534004211425781, -0.06173419952392578, -0.05812835693359375, -0.05452251434326172, -0.05091667175292969, -0.047310829162597656, -0.043704986572265625, -0.040099143981933594, -0.03649330139160156, -0.03288745880126953, -0.0292816162109375, -0.02567577362060547, -0.022069931030273438, -0.018464088439941406, -0.014858245849609375, -0.011252403259277344, -0.0076465606689453125, -0.004040718078613281, -0.00043487548828125, 0.0031709671020507812, 0.0067768096923828125, 0.010382652282714844, 0.013988494873046875, 0.017594337463378906, 0.021200180053710938, 0.02480602264404297, 0.028411865234375, 0.03201770782470703, 0.03562355041503906, 0.039229393005371094, 0.042835235595703125, 0.046441078186035156, 0.05004692077636719, 0.05365276336669922, 0.05725860595703125, 0.06086444854736328, 0.06447029113769531, 0.06807613372802734, 0.07168197631835938, 0.0752878189086914, 0.07889366149902344, 0.08249950408935547, 0.0861053466796875, 0.08971118927001953, 0.09331703186035156, 0.0969228744506836, 0.10052871704101562, 0.10413455963134766, 0.10774040222167969, 0.11134624481201172, 0.11495208740234375, 0.11855792999267578, 0.12216377258300781, 0.12576961517333984, 0.12937545776367188, 0.1329813003540039, 0.13658714294433594, 0.14019298553466797, 0.143798828125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 7.0, 14.0, 11.0, 24.0, 40.0, 59.0, 93.0, 173.0, 395.0, 2043.0, 635.0, 247.0, 117.0, 72.0, 46.0, 26.0, 19.0, 5.0, 19.0, 6.0, 4.0, 6.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0232086181640625, -0.02208685874938965, -0.020965099334716797, -0.019843339920043945, -0.018721580505371094, -0.017599821090698242, -0.01647806167602539, -0.015356302261352539, -0.014234542846679688, -0.013112783432006836, -0.011991024017333984, -0.010869264602661133, -0.009747505187988281, -0.00862574577331543, -0.007503986358642578, -0.0063822269439697266, -0.005260467529296875, -0.0041387081146240234, -0.003016948699951172, -0.0018951892852783203, -0.0007734298706054688, 0.0003483295440673828, 0.0014700889587402344, 0.002591848373413086, 0.0037136077880859375, 0.004835367202758789, 0.005957126617431641, 0.007078886032104492, 0.008200645446777344, 0.009322404861450195, 0.010444164276123047, 0.011565923690795898, 0.01268768310546875, 0.013809442520141602, 0.014931201934814453, 0.016052961349487305, 0.017174720764160156, 0.018296480178833008, 0.01941823959350586, 0.02053999900817871, 0.021661758422851562, 0.022783517837524414, 0.023905277252197266, 0.025027036666870117, 0.02614879608154297, 0.02727055549621582, 0.028392314910888672, 0.029514074325561523, 0.030635833740234375, 0.03175759315490723, 0.03287935256958008, 0.03400111198425293, 0.03512287139892578, 0.03624463081359863, 0.037366390228271484, 0.038488149642944336, 0.03960990905761719, 0.04073166847229004, 0.04185342788696289, 0.04297518730163574, 0.044096946716308594, 0.045218706130981445, 0.0463404655456543, 0.04746222496032715, 0.048583984375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 12.0, 27.0, 69.0, 131.0, 277.0, 254.0, 152.0, 45.0, 30.0, 7.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13349102437496185, -0.12308056652545929, -0.11267010867595673, -0.10225965082645416, -0.0918491929769516, -0.08143873512744904, -0.07102828472852707, -0.060617826879024506, -0.05020736902952194, -0.03979691118001938, -0.029386455193161964, -0.01897599920630455, -0.008565541356801987, 0.0018449164927005768, 0.012255370616912842, 0.022665828466415405, 0.03307628631591797, 0.04348674416542053, 0.053897202014923096, 0.06430765986442566, 0.07471811771392822, 0.08512857556343079, 0.09553902596235275, 0.10594948381185532, 0.11635994166135788, 0.12677039206027985, 0.1371808499097824, 0.14759130775928497, 0.15800176560878754, 0.1684122234582901, 0.17882268130779266, 0.18923313915729523, 0.1996435821056366, 0.21005403995513916, 0.22046449780464172, 0.2308749556541443, 0.24128541350364685, 0.2516958713531494, 0.262106329202652, 0.27251678705215454, 0.2829272449016571, 0.29333770275115967, 0.30374816060066223, 0.3141586184501648, 0.32456907629966736, 0.3349795341491699, 0.3453899919986725, 0.35580044984817505, 0.3662108778953552, 0.3766213357448578, 0.38703179359436035, 0.3974422514438629, 0.4078527092933655, 0.41826316714286804, 0.4286736249923706, 0.43908408284187317, 0.44949454069137573, 0.4599049985408783, 0.47031545639038086, 0.4807259142398834, 0.491136372089386, 0.5015468001365662, 0.5119572877883911, 0.5223677158355713, 0.5327782034873962]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 3.0, 9.0, 0.0, 4.0, 4.0, 7.0, 8.0, 11.0, 19.0, 13.0, 28.0, 13.0, 20.0, 26.0, 31.0, 20.0, 25.0, 38.0, 47.0, 58.0, 34.0, 53.0, 49.0, 37.0, 39.0, 42.0, 34.0, 42.0, 34.0, 41.0, 28.0, 25.0, 31.0, 26.0, 15.0, 24.0, 14.0, 13.0, 10.0, 3.0, 7.0, 6.0, 4.0, 4.0, 6.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09318786859512329, -0.0903608500957489, -0.08753383159637451, -0.08470682054758072, -0.08187980204820633, -0.07905278354883194, -0.07622577250003815, -0.07339875400066376, -0.07057173550128937, -0.06774471700191498, -0.06491769850254059, -0.062090687453746796, -0.059263668954372406, -0.056436650454998016, -0.053609635680913925, -0.050782620906829834, -0.047955602407455444, -0.045128583908081055, -0.042301569133996964, -0.03947455435991287, -0.03664753586053848, -0.03382051736116409, -0.030993502587080002, -0.02816648595035076, -0.02533946931362152, -0.02251245267689228, -0.01968543604016304, -0.0168584194034338, -0.01403140276670456, -0.011204386129975319, -0.008377369493246078, -0.005550352856516838, -0.0027233362197875977, 0.00010368041694164276, 0.002930697053670883, 0.005757713690400124, 0.008584730327129364, 0.011411746963858604, 0.014238763600587845, 0.017065780237317085, 0.019892796874046326, 0.022719813510775566, 0.025546830147504807, 0.028373846784234047, 0.031200863420963287, 0.03402788192033768, 0.03685489669442177, 0.03968191146850586, 0.04250892996788025, 0.04533594846725464, 0.04816296324133873, 0.05098997801542282, 0.05381699651479721, 0.0566440150141716, 0.05947102978825569, 0.06229804456233978, 0.06512506306171417, 0.06795208156108856, 0.07077910006046295, 0.07360611110925674, 0.07643312960863113, 0.07926014810800552, 0.08208715915679932, 0.0849141776561737, 0.0877411961555481]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 8.0, 10.0, 8.0, 13.0, 17.0, 31.0, 32.0, 51.0, 80.0, 112.0, 185.0, 252.0, 421.0, 667.0, 952.0, 1607.0, 2761.0, 4824.0, 8505.0, 15951.0, 31413.0, 62896.0, 131228.0, 254376.0, 261716.0, 135650.0, 65164.0, 32220.0, 16498.0, 8725.0, 4844.0, 2761.0, 1609.0, 1015.0, 661.0, 443.0, 266.0, 187.0, 118.0, 86.0, 49.0, 46.0, 27.0, 18.0, 17.0, 8.0, 7.0, 9.0, 6.0, 4.0, 2.0, 2.0], "bins": [-0.05615234375, -0.054593563079833984, -0.05303478240966797, -0.05147600173950195, -0.04991722106933594, -0.04835844039916992, -0.046799659729003906, -0.04524087905883789, -0.043682098388671875, -0.04212331771850586, -0.040564537048339844, -0.03900575637817383, -0.03744697570800781, -0.0358881950378418, -0.03432941436767578, -0.032770633697509766, -0.03121185302734375, -0.029653072357177734, -0.02809429168701172, -0.026535511016845703, -0.024976730346679688, -0.023417949676513672, -0.021859169006347656, -0.02030038833618164, -0.018741607666015625, -0.01718282699584961, -0.015624046325683594, -0.014065265655517578, -0.012506484985351562, -0.010947704315185547, -0.009388923645019531, -0.007830142974853516, -0.0062713623046875, -0.004712581634521484, -0.0031538009643554688, -0.0015950202941894531, -3.62396240234375e-05, 0.0015225410461425781, 0.0030813217163085938, 0.004640102386474609, 0.006198883056640625, 0.007757663726806641, 0.009316444396972656, 0.010875225067138672, 0.012434005737304688, 0.013992786407470703, 0.015551567077636719, 0.017110347747802734, 0.01866912841796875, 0.020227909088134766, 0.02178668975830078, 0.023345470428466797, 0.024904251098632812, 0.026463031768798828, 0.028021812438964844, 0.02958059310913086, 0.031139373779296875, 0.03269815444946289, 0.034256935119628906, 0.03581571578979492, 0.03737449645996094, 0.03893327713012695, 0.04049205780029297, 0.042050838470458984, 0.043609619140625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 6.0, 6.0, 7.0, 7.0, 13.0, 19.0, 24.0, 28.0, 28.0, 53.0, 39.0, 45.0, 63.0, 64.0, 53.0, 62.0, 65.0, 63.0, 63.0, 40.0, 51.0, 47.0, 29.0, 21.0, 25.0, 17.0, 13.0, 12.0, 6.0, 6.0, 8.0, 7.0, 1.0, 5.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0204620361328125, -0.01987171173095703, -0.019281387329101562, -0.018691062927246094, -0.018100738525390625, -0.017510414123535156, -0.016920089721679688, -0.01632976531982422, -0.01573944091796875, -0.015149116516113281, -0.014558792114257812, -0.013968467712402344, -0.013378143310546875, -0.012787818908691406, -0.012197494506835938, -0.011607170104980469, -0.011016845703125, -0.010426521301269531, -0.009836196899414062, -0.009245872497558594, -0.008655548095703125, -0.008065223693847656, -0.0074748992919921875, -0.006884574890136719, -0.00629425048828125, -0.005703926086425781, -0.0051136016845703125, -0.004523277282714844, -0.003932952880859375, -0.0033426284790039062, -0.0027523040771484375, -0.0021619796752929688, -0.0015716552734375, -0.0009813308715820312, -0.0003910064697265625, 0.00019931793212890625, 0.000789642333984375, 0.0013799667358398438, 0.0019702911376953125, 0.0025606155395507812, 0.00315093994140625, 0.0037412643432617188, 0.0043315887451171875, 0.004921913146972656, 0.005512237548828125, 0.006102561950683594, 0.0066928863525390625, 0.007283210754394531, 0.00787353515625, 0.008463859558105469, 0.009054183959960938, 0.009644508361816406, 0.010234832763671875, 0.010825157165527344, 0.011415481567382812, 0.012005805969238281, 0.01259613037109375, 0.013186454772949219, 0.013776779174804688, 0.014367103576660156, 0.014957427978515625, 0.015547752380371094, 0.016138076782226562, 0.01672840118408203, 0.0173187255859375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 6.0, 10.0, 5.0, 11.0, 13.0, 20.0, 36.0, 49.0, 72.0, 103.0, 180.0, 214.0, 367.0, 627.0, 1144.0, 2440.0, 5743.0, 17459.0, 62121.0, 246050.0, 473241.0, 172974.0, 43915.0, 12901.0, 4458.0, 1951.0, 953.0, 532.0, 320.0, 213.0, 128.0, 83.0, 69.0, 51.0, 28.0, 20.0, 18.0, 12.0, 13.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06781005859375, -0.06533241271972656, -0.06285476684570312, -0.06037712097167969, -0.05789947509765625, -0.05542182922363281, -0.052944183349609375, -0.05046653747558594, -0.0479888916015625, -0.04551124572753906, -0.043033599853515625, -0.04055595397949219, -0.03807830810546875, -0.03560066223144531, -0.033123016357421875, -0.030645370483398438, -0.028167724609375, -0.025690078735351562, -0.023212432861328125, -0.020734786987304688, -0.01825714111328125, -0.015779495239257812, -0.013301849365234375, -0.010824203491210938, -0.0083465576171875, -0.0058689117431640625, -0.003391265869140625, -0.0009136199951171875, 0.00156402587890625, 0.0040416717529296875, 0.006519317626953125, 0.008996963500976562, 0.011474609375, 0.013952255249023438, 0.016429901123046875, 0.018907546997070312, 0.02138519287109375, 0.023862838745117188, 0.026340484619140625, 0.028818130493164062, 0.0312957763671875, 0.03377342224121094, 0.036251068115234375, 0.03872871398925781, 0.04120635986328125, 0.04368400573730469, 0.046161651611328125, 0.04863929748535156, 0.051116943359375, 0.05359458923339844, 0.056072235107421875, 0.05854988098144531, 0.06102752685546875, 0.06350517272949219, 0.06598281860351562, 0.06846046447753906, 0.0709381103515625, 0.07341575622558594, 0.07589340209960938, 0.07837104797363281, 0.08084869384765625, 0.08332633972167969, 0.08580398559570312, 0.08828163146972656, 0.09075927734375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 1.0, 7.0, 4.0, 3.0, 6.0, 12.0, 17.0, 20.0, 18.0, 18.0, 21.0, 24.0, 32.0, 34.0, 31.0, 41.0, 42.0, 49.0, 42.0, 42.0, 35.0, 41.0, 45.0, 41.0, 46.0, 38.0, 37.0, 35.0, 31.0, 26.0, 20.0, 24.0, 28.0, 19.0, 19.0, 8.0, 9.0, 6.0, 8.0, 3.0, 7.0, 7.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06634521484375, -0.06415367126464844, -0.061962127685546875, -0.05977058410644531, -0.05757904052734375, -0.05538749694824219, -0.053195953369140625, -0.05100440979003906, -0.0488128662109375, -0.04662132263183594, -0.044429779052734375, -0.04223823547363281, -0.04004669189453125, -0.03785514831542969, -0.035663604736328125, -0.03347206115722656, -0.031280517578125, -0.029088973999023438, -0.026897430419921875, -0.024705886840820312, -0.02251434326171875, -0.020322799682617188, -0.018131256103515625, -0.015939712524414062, -0.0137481689453125, -0.011556625366210938, -0.009365081787109375, -0.0071735382080078125, -0.00498199462890625, -0.0027904510498046875, -0.000598907470703125, 0.0015926361083984375, 0.0037841796875, 0.0059757232666015625, 0.008167266845703125, 0.010358810424804688, 0.01255035400390625, 0.014741897583007812, 0.016933441162109375, 0.019124984741210938, 0.0213165283203125, 0.023508071899414062, 0.025699615478515625, 0.027891159057617188, 0.03008270263671875, 0.03227424621582031, 0.034465789794921875, 0.03665733337402344, 0.038848876953125, 0.04104042053222656, 0.043231964111328125, 0.04542350769042969, 0.04761505126953125, 0.04980659484863281, 0.051998138427734375, 0.05418968200683594, 0.0563812255859375, 0.05857276916503906, 0.060764312744140625, 0.06295585632324219, 0.06514739990234375, 0.06733894348144531, 0.06953048706054688, 0.07172203063964844, 0.07391357421875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 4.0, 1.0, 7.0, 10.0, 10.0, 17.0, 24.0, 27.0, 50.0, 92.0, 109.0, 199.0, 366.0, 721.0, 1673.0, 3668.0, 10462.0, 39419.0, 227914.0, 585868.0, 137671.0, 26701.0, 7812.0, 3025.0, 1254.0, 654.0, 325.0, 167.0, 82.0, 61.0, 43.0, 33.0, 20.0, 24.0, 15.0, 7.0, 5.0, 5.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04254150390625, -0.04114055633544922, -0.03973960876464844, -0.038338661193847656, -0.036937713623046875, -0.035536766052246094, -0.03413581848144531, -0.03273487091064453, -0.03133392333984375, -0.02993297576904297, -0.028532028198242188, -0.027131080627441406, -0.025730133056640625, -0.024329185485839844, -0.022928237915039062, -0.02152729034423828, -0.0201263427734375, -0.01872539520263672, -0.017324447631835938, -0.015923500061035156, -0.014522552490234375, -0.013121604919433594, -0.011720657348632812, -0.010319709777832031, -0.00891876220703125, -0.007517814636230469, -0.0061168670654296875, -0.004715919494628906, -0.003314971923828125, -0.0019140243530273438, -0.0005130767822265625, 0.0008878707885742188, 0.002288818359375, 0.0036897659301757812, 0.0050907135009765625, 0.006491661071777344, 0.007892608642578125, 0.009293556213378906, 0.010694503784179688, 0.012095451354980469, 0.01349639892578125, 0.014897346496582031, 0.016298294067382812, 0.017699241638183594, 0.019100189208984375, 0.020501136779785156, 0.021902084350585938, 0.02330303192138672, 0.0247039794921875, 0.02610492706298828, 0.027505874633789062, 0.028906822204589844, 0.030307769775390625, 0.031708717346191406, 0.03310966491699219, 0.03451061248779297, 0.03591156005859375, 0.03731250762939453, 0.03871345520019531, 0.040114402770996094, 0.041515350341796875, 0.042916297912597656, 0.04431724548339844, 0.04571819305419922, 0.047119140625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 6.0, 12.0, 11.0, 26.0, 22.0, 34.0, 41.0, 74.0, 74.0, 115.0, 100.0, 116.0, 96.0, 76.0, 60.0, 30.0, 25.0, 27.0, 13.0, 11.0, 6.0, 1.0, 6.0, 4.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0279159545898438e-05, -2.9056333005428314e-05, -2.783350646495819e-05, -2.6610679924488068e-05, -2.5387853384017944e-05, -2.416502684354782e-05, -2.2942200303077698e-05, -2.1719373762607574e-05, -2.049654722213745e-05, -1.9273720681667328e-05, -1.8050894141197205e-05, -1.682806760072708e-05, -1.5605241060256958e-05, -1.4382414519786835e-05, -1.3159587979316711e-05, -1.1936761438846588e-05, -1.0713934898376465e-05, -9.491108357906342e-06, -8.268281817436218e-06, -7.045455276966095e-06, -5.822628736495972e-06, -4.599802196025848e-06, -3.376975655555725e-06, -2.154149115085602e-06, -9.313225746154785e-07, 2.915039658546448e-07, 1.514330506324768e-06, 2.7371570467948914e-06, 3.959983587265015e-06, 5.182810127735138e-06, 6.405636668205261e-06, 7.6284632086753845e-06, 8.851289749145508e-06, 1.0074116289615631e-05, 1.1296942830085754e-05, 1.2519769370555878e-05, 1.3742595911026001e-05, 1.4965422451496124e-05, 1.6188248991966248e-05, 1.741107553243637e-05, 1.8633902072906494e-05, 1.9856728613376617e-05, 2.107955515384674e-05, 2.2302381694316864e-05, 2.3525208234786987e-05, 2.474803477525711e-05, 2.5970861315727234e-05, 2.7193687856197357e-05, 2.841651439666748e-05, 2.9639340937137604e-05, 3.086216747760773e-05, 3.208499401807785e-05, 3.3307820558547974e-05, 3.45306470990181e-05, 3.575347363948822e-05, 3.6976300179958344e-05, 3.819912672042847e-05, 3.942195326089859e-05, 4.064477980136871e-05, 4.186760634183884e-05, 4.309043288230896e-05, 4.431325942277908e-05, 4.5536085963249207e-05, 4.675891250371933e-05, 4.798173904418945e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 7.0, 11.0, 12.0, 30.0, 35.0, 41.0, 74.0, 107.0, 192.0, 310.0, 631.0, 1326.0, 3038.0, 8449.0, 29151.0, 171937.0, 625424.0, 165405.0, 28482.0, 8120.0, 3013.0, 1236.0, 662.0, 321.0, 206.0, 103.0, 73.0, 52.0, 30.0, 19.0, 11.0, 8.0, 8.0, 10.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.042205810546875, -0.04082155227661133, -0.039437294006347656, -0.038053035736083984, -0.03666877746582031, -0.03528451919555664, -0.03390026092529297, -0.0325160026550293, -0.031131744384765625, -0.029747486114501953, -0.02836322784423828, -0.02697896957397461, -0.025594711303710938, -0.024210453033447266, -0.022826194763183594, -0.021441936492919922, -0.02005767822265625, -0.018673419952392578, -0.017289161682128906, -0.015904903411865234, -0.014520645141601562, -0.01313638687133789, -0.011752128601074219, -0.010367870330810547, -0.008983612060546875, -0.007599353790283203, -0.006215095520019531, -0.004830837249755859, -0.0034465789794921875, -0.0020623207092285156, -0.0006780624389648438, 0.0007061958312988281, 0.0020904541015625, 0.003474712371826172, 0.004858970642089844, 0.006243228912353516, 0.0076274871826171875, 0.00901174545288086, 0.010396003723144531, 0.011780261993408203, 0.013164520263671875, 0.014548778533935547, 0.01593303680419922, 0.01731729507446289, 0.018701553344726562, 0.020085811614990234, 0.021470069885253906, 0.022854328155517578, 0.02423858642578125, 0.025622844696044922, 0.027007102966308594, 0.028391361236572266, 0.029775619506835938, 0.03115987777709961, 0.03254413604736328, 0.03392839431762695, 0.035312652587890625, 0.0366969108581543, 0.03808116912841797, 0.03946542739868164, 0.04084968566894531, 0.042233943939208984, 0.043618202209472656, 0.04500246047973633, 0.04638671875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 4.0, 7.0, 8.0, 13.0, 15.0, 26.0, 28.0, 29.0, 61.0, 71.0, 63.0, 90.0, 103.0, 77.0, 86.0, 72.0, 58.0, 53.0, 33.0, 19.0, 17.0, 16.0, 14.0, 7.0, 3.0, 3.0, 5.0, 6.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0300140380859375, -0.02901434898376465, -0.028014659881591797, -0.027014970779418945, -0.026015281677246094, -0.025015592575073242, -0.02401590347290039, -0.02301621437072754, -0.022016525268554688, -0.021016836166381836, -0.020017147064208984, -0.019017457962036133, -0.01801776885986328, -0.01701807975769043, -0.016018390655517578, -0.015018701553344727, -0.014019012451171875, -0.013019323348999023, -0.012019634246826172, -0.01101994514465332, -0.010020256042480469, -0.009020566940307617, -0.008020877838134766, -0.007021188735961914, -0.0060214996337890625, -0.005021810531616211, -0.004022121429443359, -0.003022432327270508, -0.0020227432250976562, -0.0010230541229248047, -2.3365020751953125e-05, 0.0009763240814208984, 0.00197601318359375, 0.0029757022857666016, 0.003975391387939453, 0.004975080490112305, 0.005974769592285156, 0.006974458694458008, 0.00797414779663086, 0.008973836898803711, 0.009973526000976562, 0.010973215103149414, 0.011972904205322266, 0.012972593307495117, 0.013972282409667969, 0.01497197151184082, 0.015971660614013672, 0.016971349716186523, 0.017971038818359375, 0.018970727920532227, 0.019970417022705078, 0.02097010612487793, 0.02196979522705078, 0.022969484329223633, 0.023969173431396484, 0.024968862533569336, 0.025968551635742188, 0.02696824073791504, 0.02796792984008789, 0.028967618942260742, 0.029967308044433594, 0.030966997146606445, 0.0319666862487793, 0.03296637535095215, 0.033966064453125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 18.0, 22.0, 26.0, 56.0, 72.0, 111.0, 151.0, 119.0, 141.0, 102.0, 71.0, 51.0, 22.0, 15.0, 7.0, 8.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3377261459827423, -0.3202654719352722, -0.3028047978878021, -0.28534412384033203, -0.26788341999053955, -0.25042277574539185, -0.23296207189559937, -0.21550139784812927, -0.19804072380065918, -0.1805800497531891, -0.163119375705719, -0.1456586867570877, -0.12819801270961761, -0.11073733866214752, -0.09327665716409683, -0.07581597566604614, -0.05835530161857605, -0.04089462384581566, -0.023433946073055267, -0.005973268300294876, 0.011487409472465515, 0.028948083519935608, 0.0464087650179863, 0.06386944651603699, 0.08133012056350708, 0.09879079461097717, 0.11625147610902786, 0.13371215760707855, 0.15117283165454865, 0.16863350570201874, 0.18609419465065002, 0.20355486869812012, 0.2210155725479126, 0.2384762465953827, 0.2559369206428528, 0.2733975946903229, 0.29085826873779297, 0.30831897258758545, 0.32577964663505554, 0.34324032068252563, 0.3607009947299957, 0.3781616687774658, 0.3956223428249359, 0.413083016872406, 0.4305437207221985, 0.4480043649673462, 0.46546506881713867, 0.48292574286460876, 0.5003864169120789, 0.5178471207618713, 0.535307765007019, 0.5527684688568115, 0.5702291131019592, 0.5876898169517517, 0.6051504611968994, 0.6226111650466919, 0.6400718688964844, 0.6575325727462769, 0.6749932169914246, 0.692453920841217, 0.7099145650863647, 0.7273752689361572, 0.7448359131813049, 0.7622966170310974, 0.7797572612762451]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 6.0, 2.0, 3.0, 4.0, 9.0, 8.0, 13.0, 8.0, 15.0, 21.0, 21.0, 29.0, 25.0, 32.0, 44.0, 38.0, 51.0, 51.0, 52.0, 61.0, 62.0, 45.0, 50.0, 45.0, 42.0, 39.0, 38.0, 25.0, 27.0, 22.0, 25.0, 16.0, 20.0, 16.0, 16.0, 9.0, 6.0, 5.0, 6.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43339109420776367, -0.4191264510154724, -0.40486177802085876, -0.3905971348285675, -0.37633249163627625, -0.3620678186416626, -0.34780317544937134, -0.3335385322570801, -0.3192738890647888, -0.30500924587249756, -0.2907445728778839, -0.27647992968559265, -0.2622152864933014, -0.24795062839984894, -0.23368597030639648, -0.21942132711410522, -0.20515665411949158, -0.19089199602603912, -0.17662735283374786, -0.1623626947402954, -0.14809805154800415, -0.1338333934545517, -0.11956873536109924, -0.10530408471822739, -0.09103943407535553, -0.07677478343248367, -0.06251013278961182, -0.04824547469615936, -0.033980824053287506, -0.01971617341041565, -0.005451515316963196, 0.008813135325908661, 0.023077785968780518, 0.037342436611652374, 0.05160709097981453, 0.06587174534797668, 0.08013639599084854, 0.0944010466337204, 0.10866570472717285, 0.12293035537004471, 0.13719500601291656, 0.15145966410636902, 0.16572430729866028, 0.17998896539211273, 0.19425362348556519, 0.20851826667785645, 0.2227829247713089, 0.23704758286476135, 0.2513122260570526, 0.26557686924934387, 0.2798415422439575, 0.2941061854362488, 0.30837082862854004, 0.3226354718208313, 0.33690014481544495, 0.3511647880077362, 0.36542946100234985, 0.3796941041946411, 0.39395877718925476, 0.408223420381546, 0.4224880635738373, 0.4367527365684509, 0.4510173797607422, 0.46528202295303345, 0.4795466661453247]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 5.0, 3.0, 7.0, 7.0, 15.0, 24.0, 41.0, 47.0, 72.0, 124.0, 182.0, 330.0, 465.0, 855.0, 1526.0, 2742.0, 5600.0, 12451.0, 32995.0, 116116.0, 2611960.0, 1256076.0, 100176.0, 29441.0, 11362.0, 5294.0, 2673.0, 1488.0, 842.0, 492.0, 309.0, 167.0, 113.0, 72.0, 78.0, 49.0, 31.0, 23.0, 8.0, 10.0, 6.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.07763671875, -0.07541561126708984, -0.07319450378417969, -0.07097339630126953, -0.06875228881835938, -0.06653118133544922, -0.06431007385253906, -0.062088966369628906, -0.05986785888671875, -0.057646751403808594, -0.05542564392089844, -0.05320453643798828, -0.050983428955078125, -0.04876232147216797, -0.04654121398925781, -0.044320106506347656, -0.0420989990234375, -0.039877891540527344, -0.03765678405761719, -0.03543567657470703, -0.033214569091796875, -0.03099346160888672, -0.028772354125976562, -0.026551246643066406, -0.02433013916015625, -0.022109031677246094, -0.019887924194335938, -0.01766681671142578, -0.015445709228515625, -0.013224601745605469, -0.011003494262695312, -0.008782386779785156, -0.006561279296875, -0.004340171813964844, -0.0021190643310546875, 0.00010204315185546875, 0.002323150634765625, 0.004544258117675781, 0.0067653656005859375, 0.008986473083496094, 0.01120758056640625, 0.013428688049316406, 0.015649795532226562, 0.01787090301513672, 0.020092010498046875, 0.02231311798095703, 0.024534225463867188, 0.026755332946777344, 0.0289764404296875, 0.031197547912597656, 0.03341865539550781, 0.03563976287841797, 0.037860870361328125, 0.04008197784423828, 0.04230308532714844, 0.044524192810058594, 0.04674530029296875, 0.048966407775878906, 0.05118751525878906, 0.05340862274169922, 0.055629730224609375, 0.05785083770751953, 0.06007194519042969, 0.062293052673339844, 0.06451416015625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 0.0, 1.0, 4.0, 6.0, 9.0, 4.0, 11.0, 9.0, 21.0, 17.0, 21.0, 28.0, 34.0, 39.0, 53.0, 58.0, 53.0, 51.0, 56.0, 57.0, 45.0, 71.0, 52.0, 58.0, 41.0, 41.0, 33.0, 29.0, 21.0, 18.0, 16.0, 4.0, 9.0, 8.0, 11.0, 2.0, 5.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.01776123046875, -0.017196178436279297, -0.016631126403808594, -0.01606607437133789, -0.015501022338867188, -0.014935970306396484, -0.014370918273925781, -0.013805866241455078, -0.013240814208984375, -0.012675762176513672, -0.012110710144042969, -0.011545658111572266, -0.010980606079101562, -0.01041555404663086, -0.009850502014160156, -0.009285449981689453, -0.00872039794921875, -0.008155345916748047, -0.007590293884277344, -0.007025241851806641, -0.0064601898193359375, -0.005895137786865234, -0.005330085754394531, -0.004765033721923828, -0.004199981689453125, -0.003634929656982422, -0.0030698776245117188, -0.0025048255920410156, -0.0019397735595703125, -0.0013747215270996094, -0.0008096694946289062, -0.0002446174621582031, 0.0003204345703125, 0.0008854866027832031, 0.0014505386352539062, 0.0020155906677246094, 0.0025806427001953125, 0.0031456947326660156, 0.0037107467651367188, 0.004275798797607422, 0.004840850830078125, 0.005405902862548828, 0.005970954895019531, 0.006536006927490234, 0.0071010589599609375, 0.007666110992431641, 0.008231163024902344, 0.008796215057373047, 0.00936126708984375, 0.009926319122314453, 0.010491371154785156, 0.01105642318725586, 0.011621475219726562, 0.012186527252197266, 0.012751579284667969, 0.013316631317138672, 0.013881683349609375, 0.014446735382080078, 0.015011787414550781, 0.015576839447021484, 0.016141891479492188, 0.01670694351196289, 0.017271995544433594, 0.017837047576904297, 0.018402099609375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 4.0, 10.0, 11.0, 18.0, 29.0, 70.0, 95.0, 197.0, 394.0, 828.0, 1912.0, 4823.0, 13501.0, 46696.0, 278781.0, 3484700.0, 293013.0, 47539.0, 13437.0, 4719.0, 1810.0, 833.0, 405.0, 209.0, 107.0, 56.0, 21.0, 21.0, 9.0, 13.0, 5.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.1243896484375, -0.12139320373535156, -0.11839675903320312, -0.11540031433105469, -0.11240386962890625, -0.10940742492675781, -0.10641098022460938, -0.10341453552246094, -0.1004180908203125, -0.09742164611816406, -0.09442520141601562, -0.09142875671386719, -0.08843231201171875, -0.08543586730957031, -0.08243942260742188, -0.07944297790527344, -0.076446533203125, -0.07345008850097656, -0.07045364379882812, -0.06745719909667969, -0.06446075439453125, -0.06146430969238281, -0.058467864990234375, -0.05547142028808594, -0.0524749755859375, -0.04947853088378906, -0.046482086181640625, -0.04348564147949219, -0.04048919677734375, -0.03749275207519531, -0.034496307373046875, -0.03149986267089844, -0.02850341796875, -0.025506973266601562, -0.022510528564453125, -0.019514083862304688, -0.01651763916015625, -0.013521194458007812, -0.010524749755859375, -0.0075283050537109375, -0.0045318603515625, -0.0015354156494140625, 0.001461029052734375, 0.0044574737548828125, 0.00745391845703125, 0.010450363159179688, 0.013446807861328125, 0.016443252563476562, 0.019439697265625, 0.022436141967773438, 0.025432586669921875, 0.028429031372070312, 0.03142547607421875, 0.03442192077636719, 0.037418365478515625, 0.04041481018066406, 0.0434112548828125, 0.04640769958496094, 0.049404144287109375, 0.05240058898925781, 0.05539703369140625, 0.05839347839355469, 0.061389923095703125, 0.06438636779785156, 0.0673828125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 1.0, 9.0, 7.0, 11.0, 9.0, 10.0, 22.0, 25.0, 25.0, 39.0, 69.0, 86.0, 166.0, 275.0, 608.0, 1476.0, 545.0, 268.0, 140.0, 84.0, 56.0, 32.0, 34.0, 24.0, 18.0, 10.0, 4.0, 3.0, 12.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0379638671875, -0.03682994842529297, -0.03569602966308594, -0.034562110900878906, -0.033428192138671875, -0.032294273376464844, -0.031160354614257812, -0.03002643585205078, -0.02889251708984375, -0.02775859832763672, -0.026624679565429688, -0.025490760803222656, -0.024356842041015625, -0.023222923278808594, -0.022089004516601562, -0.02095508575439453, -0.0198211669921875, -0.01868724822998047, -0.017553329467773438, -0.016419410705566406, -0.015285491943359375, -0.014151573181152344, -0.013017654418945312, -0.011883735656738281, -0.01074981689453125, -0.009615898132324219, -0.008481979370117188, -0.007348060607910156, -0.006214141845703125, -0.005080223083496094, -0.0039463043212890625, -0.0028123855590820312, -0.001678466796875, -0.0005445480346679688, 0.0005893707275390625, 0.0017232894897460938, 0.002857208251953125, 0.003991127014160156, 0.0051250457763671875, 0.006258964538574219, 0.00739288330078125, 0.008526802062988281, 0.009660720825195312, 0.010794639587402344, 0.011928558349609375, 0.013062477111816406, 0.014196395874023438, 0.015330314636230469, 0.0164642333984375, 0.01759815216064453, 0.018732070922851562, 0.019865989685058594, 0.020999908447265625, 0.022133827209472656, 0.023267745971679688, 0.02440166473388672, 0.02553558349609375, 0.02666950225830078, 0.027803421020507812, 0.028937339782714844, 0.030071258544921875, 0.031205177307128906, 0.03233909606933594, 0.03347301483154297, 0.03460693359375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 14.0, 64.0, 272.0, 414.0, 202.0, 30.0, 11.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2561997175216675, -1.2291288375854492, -1.202057957649231, -1.1749869585037231, -1.1479160785675049, -1.1208451986312866, -1.0937743186950684, -1.0667033195495605, -1.0396324396133423, -1.012561559677124, -0.985490620136261, -0.9584197402000427, -0.9313488006591797, -0.9042779207229614, -0.8772069811820984, -0.8501361012458801, -0.8230651617050171, -0.7959942817687988, -0.7689233422279358, -0.7418524622917175, -0.7147815227508545, -0.6877106428146362, -0.6606397032737732, -0.6335688233375549, -0.6064979434013367, -0.5794270634651184, -0.5523561239242554, -0.5252852439880371, -0.4982143044471741, -0.4711434245109558, -0.4440724849700928, -0.4170016050338745, -0.3899306654930115, -0.3628597557544708, -0.3357888460159302, -0.3087179362773895, -0.2816470265388489, -0.2545761466026306, -0.22750522196292877, -0.20043431222438812, -0.17336340248584747, -0.14629249274730682, -0.11922158300876617, -0.09215068072080612, -0.06507977098226547, -0.03800886869430542, -0.01093795895576477, 0.01613295078277588, 0.04320386052131653, 0.07027477025985718, 0.09734567999839783, 0.12441658228635788, 0.15148749947547913, 0.17855839431285858, 0.20562930405139923, 0.23270021378993988, 0.25977110862731934, 0.28684201836586, 0.31391292810440063, 0.3409838378429413, 0.36805474758148193, 0.3951256275177002, 0.42219656705856323, 0.4492674469947815, 0.47633838653564453]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 9.0, 2.0, 0.0, 3.0, 5.0, 9.0, 5.0, 6.0, 4.0, 16.0, 13.0, 13.0, 12.0, 22.0, 12.0, 21.0, 44.0, 33.0, 41.0, 33.0, 29.0, 32.0, 49.0, 36.0, 66.0, 29.0, 54.0, 42.0, 47.0, 48.0, 35.0, 29.0, 36.0, 22.0, 13.0, 18.0, 21.0, 26.0, 15.0, 13.0, 13.0, 8.0, 8.0, 4.0, 6.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.12559539079666138, -0.12173214554786682, -0.11786890029907227, -0.11400565505027771, -0.11014240980148315, -0.1062791645526886, -0.10241591930389404, -0.09855267405509949, -0.09468942880630493, -0.09082618355751038, -0.08696293830871582, -0.08309969305992126, -0.07923644781112671, -0.07537320256233215, -0.0715099573135376, -0.06764671206474304, -0.06378346681594849, -0.05992022156715393, -0.056056976318359375, -0.05219373106956482, -0.048330485820770264, -0.04446724057197571, -0.04060399532318115, -0.0367407500743866, -0.03287750482559204, -0.029014259576797485, -0.02515101432800293, -0.021287769079208374, -0.01742452383041382, -0.013561278581619263, -0.009698033332824707, -0.005834788084030151, -0.0019715428352355957, 0.00189170241355896, 0.005754947662353516, 0.009618192911148071, 0.013481438159942627, 0.017344683408737183, 0.02120792865753174, 0.025071173906326294, 0.02893441915512085, 0.032797664403915405, 0.03666090965270996, 0.04052415490150452, 0.04438740015029907, 0.04825064539909363, 0.052113890647888184, 0.05597713589668274, 0.059840381145477295, 0.06370362639427185, 0.0675668716430664, 0.07143011689186096, 0.07529336214065552, 0.07915660738945007, 0.08301985263824463, 0.08688309788703918, 0.09074634313583374, 0.0946095883846283, 0.09847283363342285, 0.10233607888221741, 0.10619932413101196, 0.11006256937980652, 0.11392581462860107, 0.11778905987739563, 0.12165230512619019]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 10.0, 12.0, 20.0, 20.0, 22.0, 50.0, 77.0, 133.0, 213.0, 389.0, 698.0, 1182.0, 2302.0, 4781.0, 9938.0, 22600.0, 54874.0, 144223.0, 384357.0, 262352.0, 92685.0, 37247.0, 15795.0, 7141.0, 3549.0, 1694.0, 881.0, 501.0, 293.0, 197.0, 96.0, 85.0, 45.0, 26.0, 20.0, 12.0, 8.0, 6.0, 6.0, 3.0, 2.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0833740234375, -0.08090591430664062, -0.07843780517578125, -0.07596969604492188, -0.0735015869140625, -0.07103347778320312, -0.06856536865234375, -0.06609725952148438, -0.063629150390625, -0.061161041259765625, -0.05869293212890625, -0.056224822998046875, -0.0537567138671875, -0.051288604736328125, -0.04882049560546875, -0.046352386474609375, -0.04388427734375, -0.041416168212890625, -0.03894805908203125, -0.036479949951171875, -0.0340118408203125, -0.031543731689453125, -0.02907562255859375, -0.026607513427734375, -0.024139404296875, -0.021671295166015625, -0.01920318603515625, -0.016735076904296875, -0.0142669677734375, -0.011798858642578125, -0.00933074951171875, -0.006862640380859375, -0.00439453125, -0.001926422119140625, 0.00054168701171875, 0.003009796142578125, 0.0054779052734375, 0.007946014404296875, 0.01041412353515625, 0.012882232666015625, 0.015350341796875, 0.017818450927734375, 0.02028656005859375, 0.022754669189453125, 0.0252227783203125, 0.027690887451171875, 0.03015899658203125, 0.032627105712890625, 0.03509521484375, 0.037563323974609375, 0.04003143310546875, 0.042499542236328125, 0.0449676513671875, 0.047435760498046875, 0.04990386962890625, 0.052371978759765625, 0.054840087890625, 0.057308197021484375, 0.05977630615234375, 0.062244415283203125, 0.0647125244140625, 0.06718063354492188, 0.06964874267578125, 0.07211685180664062, 0.0745849609375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 0.0, 7.0, 2.0, 6.0, 8.0, 15.0, 8.0, 9.0, 27.0, 16.0, 30.0, 45.0, 36.0, 50.0, 59.0, 54.0, 57.0, 67.0, 62.0, 74.0, 69.0, 46.0, 46.0, 32.0, 37.0, 33.0, 15.0, 23.0, 19.0, 16.0, 10.0, 5.0, 6.0, 6.0, 3.0, 1.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0177764892578125, -0.01718282699584961, -0.01658916473388672, -0.015995502471923828, -0.015401840209960938, -0.014808177947998047, -0.014214515686035156, -0.013620853424072266, -0.013027191162109375, -0.012433528900146484, -0.011839866638183594, -0.011246204376220703, -0.010652542114257812, -0.010058879852294922, -0.009465217590332031, -0.00887155532836914, -0.00827789306640625, -0.007684230804443359, -0.007090568542480469, -0.006496906280517578, -0.0059032440185546875, -0.005309581756591797, -0.004715919494628906, -0.004122257232666016, -0.003528594970703125, -0.0029349327087402344, -0.0023412704467773438, -0.0017476081848144531, -0.0011539459228515625, -0.0005602836608886719, 3.337860107421875e-05, 0.0006270408630371094, 0.001220703125, 0.0018143653869628906, 0.0024080276489257812, 0.003001689910888672, 0.0035953521728515625, 0.004189014434814453, 0.004782676696777344, 0.005376338958740234, 0.005970001220703125, 0.006563663482666016, 0.007157325744628906, 0.007750988006591797, 0.008344650268554688, 0.008938312530517578, 0.009531974792480469, 0.01012563705444336, 0.01071929931640625, 0.01131296157836914, 0.011906623840332031, 0.012500286102294922, 0.013093948364257812, 0.013687610626220703, 0.014281272888183594, 0.014874935150146484, 0.015468597412109375, 0.016062259674072266, 0.016655921936035156, 0.017249584197998047, 0.017843246459960938, 0.018436908721923828, 0.01903057098388672, 0.01962423324584961, 0.0202178955078125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 5.0, 4.0, 5.0, 10.0, 14.0, 28.0, 35.0, 46.0, 72.0, 108.0, 208.0, 301.0, 496.0, 907.0, 1654.0, 3553.0, 7945.0, 20558.0, 60520.0, 186049.0, 425891.0, 225195.0, 72996.0, 24486.0, 9325.0, 3903.0, 1896.0, 927.0, 504.0, 323.0, 206.0, 118.0, 88.0, 55.0, 36.0, 24.0, 21.0, 16.0, 12.0, 6.0, 4.0, 6.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.070068359375, -0.06785011291503906, -0.06563186645507812, -0.06341361999511719, -0.06119537353515625, -0.05897712707519531, -0.056758880615234375, -0.05454063415527344, -0.0523223876953125, -0.05010414123535156, -0.047885894775390625, -0.04566764831542969, -0.04344940185546875, -0.04123115539550781, -0.039012908935546875, -0.03679466247558594, -0.034576416015625, -0.03235816955566406, -0.030139923095703125, -0.027921676635742188, -0.02570343017578125, -0.023485183715820312, -0.021266937255859375, -0.019048690795898438, -0.0168304443359375, -0.014612197875976562, -0.012393951416015625, -0.010175704956054688, -0.00795745849609375, -0.0057392120361328125, -0.003520965576171875, -0.0013027191162109375, 0.00091552734375, 0.0031337738037109375, 0.005352020263671875, 0.0075702667236328125, 0.00978851318359375, 0.012006759643554688, 0.014225006103515625, 0.016443252563476562, 0.0186614990234375, 0.020879745483398438, 0.023097991943359375, 0.025316238403320312, 0.02753448486328125, 0.029752731323242188, 0.031970977783203125, 0.03418922424316406, 0.036407470703125, 0.03862571716308594, 0.040843963623046875, 0.04306221008300781, 0.04528045654296875, 0.04749870300292969, 0.049716949462890625, 0.05193519592285156, 0.0541534423828125, 0.05637168884277344, 0.058589935302734375, 0.06080818176269531, 0.06302642822265625, 0.06524467468261719, 0.06746292114257812, 0.06968116760253906, 0.0718994140625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 0.0, 4.0, 6.0, 7.0, 8.0, 8.0, 17.0, 14.0, 15.0, 23.0, 16.0, 24.0, 27.0, 28.0, 39.0, 40.0, 33.0, 39.0, 50.0, 41.0, 44.0, 33.0, 48.0, 48.0, 42.0, 30.0, 37.0, 41.0, 27.0, 31.0, 34.0, 24.0, 22.0, 19.0, 14.0, 12.0, 10.0, 5.0, 8.0, 8.0, 3.0, 8.0, 7.0, 0.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06646728515625, -0.06432056427001953, -0.06217384338378906, -0.060027122497558594, -0.057880401611328125, -0.055733680725097656, -0.05358695983886719, -0.05144023895263672, -0.04929351806640625, -0.04714679718017578, -0.04500007629394531, -0.042853355407714844, -0.040706634521484375, -0.038559913635253906, -0.03641319274902344, -0.03426647186279297, -0.0321197509765625, -0.02997303009033203, -0.027826309204101562, -0.025679588317871094, -0.023532867431640625, -0.021386146545410156, -0.019239425659179688, -0.01709270477294922, -0.01494598388671875, -0.012799263000488281, -0.010652542114257812, -0.008505821228027344, -0.006359100341796875, -0.004212379455566406, -0.0020656585693359375, 8.106231689453125e-05, 0.002227783203125, 0.004374504089355469, 0.0065212249755859375, 0.008667945861816406, 0.010814666748046875, 0.012961387634277344, 0.015108108520507812, 0.01725482940673828, 0.01940155029296875, 0.02154827117919922, 0.023694992065429688, 0.025841712951660156, 0.027988433837890625, 0.030135154724121094, 0.03228187561035156, 0.03442859649658203, 0.0365753173828125, 0.03872203826904297, 0.04086875915527344, 0.043015480041503906, 0.045162200927734375, 0.047308921813964844, 0.04945564270019531, 0.05160236358642578, 0.05374908447265625, 0.05589580535888672, 0.05804252624511719, 0.060189247131347656, 0.062335968017578125, 0.0644826889038086, 0.06662940979003906, 0.06877613067626953, 0.0709228515625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 7.0, 6.0, 8.0, 12.0, 15.0, 19.0, 41.0, 59.0, 131.0, 258.0, 527.0, 1017.0, 2567.0, 6846.0, 22209.0, 94465.0, 536496.0, 307505.0, 53914.0, 14344.0, 4678.0, 1846.0, 749.0, 401.0, 195.0, 101.0, 61.0, 34.0, 20.0, 12.0, 6.0, 8.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061614990234375, -0.05954885482788086, -0.05748271942138672, -0.05541658401489258, -0.05335044860839844, -0.0512843132019043, -0.049218177795410156, -0.047152042388916016, -0.045085906982421875, -0.043019771575927734, -0.040953636169433594, -0.03888750076293945, -0.03682136535644531, -0.03475522994995117, -0.03268909454345703, -0.03062295913696289, -0.02855682373046875, -0.02649068832397461, -0.02442455291748047, -0.022358417510986328, -0.020292282104492188, -0.018226146697998047, -0.016160011291503906, -0.014093875885009766, -0.012027740478515625, -0.009961605072021484, -0.007895469665527344, -0.005829334259033203, -0.0037631988525390625, -0.0016970634460449219, 0.00036907196044921875, 0.0024352073669433594, 0.0045013427734375, 0.006567478179931641, 0.008633613586425781, 0.010699748992919922, 0.012765884399414062, 0.014832019805908203, 0.016898155212402344, 0.018964290618896484, 0.021030426025390625, 0.023096561431884766, 0.025162696838378906, 0.027228832244873047, 0.029294967651367188, 0.03136110305786133, 0.03342723846435547, 0.03549337387084961, 0.03755950927734375, 0.03962564468383789, 0.04169178009033203, 0.04375791549682617, 0.04582405090332031, 0.04789018630981445, 0.049956321716308594, 0.052022457122802734, 0.054088592529296875, 0.056154727935791016, 0.058220863342285156, 0.0602869987487793, 0.06235313415527344, 0.06441926956176758, 0.06648540496826172, 0.06855154037475586, 0.07061767578125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 4.0, 11.0, 22.0, 26.0, 43.0, 59.0, 81.0, 113.0, 151.0, 146.0, 129.0, 77.0, 48.0, 39.0, 28.0, 10.0, 8.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5418739318847656e-05, -4.372932016849518e-05, -4.20399010181427e-05, -4.035048186779022e-05, -3.8661062717437744e-05, -3.6971643567085266e-05, -3.528222441673279e-05, -3.359280526638031e-05, -3.190338611602783e-05, -3.0213966965675354e-05, -2.8524547815322876e-05, -2.6835128664970398e-05, -2.514570951461792e-05, -2.3456290364265442e-05, -2.1766871213912964e-05, -2.0077452063560486e-05, -1.8388032913208008e-05, -1.669861376285553e-05, -1.5009194612503052e-05, -1.3319775462150574e-05, -1.1630356311798096e-05, -9.940937161445618e-06, -8.25151801109314e-06, -6.562098860740662e-06, -4.872679710388184e-06, -3.1832605600357056e-06, -1.4938414096832275e-06, 1.955777406692505e-07, 1.8849968910217285e-06, 3.5744160413742065e-06, 5.2638351917266846e-06, 6.953254342079163e-06, 8.64267349243164e-06, 1.0332092642784119e-05, 1.2021511793136597e-05, 1.3710930943489075e-05, 1.5400350093841553e-05, 1.708976924419403e-05, 1.877918839454651e-05, 2.0468607544898987e-05, 2.2158026695251465e-05, 2.3847445845603943e-05, 2.553686499595642e-05, 2.72262841463089e-05, 2.8915703296661377e-05, 3.0605122447013855e-05, 3.229454159736633e-05, 3.398396074771881e-05, 3.567337989807129e-05, 3.736279904842377e-05, 3.9052218198776245e-05, 4.074163734912872e-05, 4.24310564994812e-05, 4.412047564983368e-05, 4.580989480018616e-05, 4.7499313950538635e-05, 4.918873310089111e-05, 5.087815225124359e-05, 5.256757140159607e-05, 5.425699055194855e-05, 5.5946409702301025e-05, 5.7635828852653503e-05, 5.932524800300598e-05, 6.101466715335846e-05, 6.270408630371094e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 1.0, 8.0, 12.0, 12.0, 21.0, 25.0, 39.0, 81.0, 123.0, 195.0, 306.0, 572.0, 1096.0, 2334.0, 5581.0, 15525.0, 51111.0, 221162.0, 549411.0, 144456.0, 36221.0, 11901.0, 4314.0, 1894.0, 913.0, 486.0, 275.0, 182.0, 96.0, 70.0, 48.0, 25.0, 19.0, 13.0, 8.0, 5.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.056732177734375, -0.05512809753417969, -0.053524017333984375, -0.05191993713378906, -0.05031585693359375, -0.04871177673339844, -0.047107696533203125, -0.04550361633300781, -0.0438995361328125, -0.04229545593261719, -0.040691375732421875, -0.03908729553222656, -0.03748321533203125, -0.03587913513183594, -0.034275054931640625, -0.03267097473144531, -0.03106689453125, -0.029462814331054688, -0.027858734130859375, -0.026254653930664062, -0.02465057373046875, -0.023046493530273438, -0.021442413330078125, -0.019838333129882812, -0.0182342529296875, -0.016630172729492188, -0.015026092529296875, -0.013422012329101562, -0.01181793212890625, -0.010213851928710938, -0.008609771728515625, -0.0070056915283203125, -0.005401611328125, -0.0037975311279296875, -0.002193450927734375, -0.0005893707275390625, 0.00101470947265625, 0.0026187896728515625, 0.004222869873046875, 0.0058269500732421875, 0.0074310302734375, 0.009035110473632812, 0.010639190673828125, 0.012243270874023438, 0.01384735107421875, 0.015451431274414062, 0.017055511474609375, 0.018659591674804688, 0.020263671875, 0.021867752075195312, 0.023471832275390625, 0.025075912475585938, 0.02667999267578125, 0.028284072875976562, 0.029888153076171875, 0.03149223327636719, 0.0330963134765625, 0.03470039367675781, 0.036304473876953125, 0.03790855407714844, 0.03951263427734375, 0.04111671447753906, 0.042720794677734375, 0.04432487487792969, 0.045928955078125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 8.0, 1.0, 4.0, 8.0, 4.0, 10.0, 14.0, 22.0, 18.0, 22.0, 32.0, 34.0, 42.0, 51.0, 92.0, 97.0, 96.0, 87.0, 76.0, 61.0, 43.0, 33.0, 39.0, 22.0, 20.0, 22.0, 15.0, 12.0, 3.0, 4.0, 4.0, 4.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.042999267578125, -0.041748046875, -0.040496826171875, -0.03924560546875, -0.037994384765625, -0.0367431640625, -0.035491943359375, -0.03424072265625, -0.032989501953125, -0.03173828125, -0.030487060546875, -0.02923583984375, -0.027984619140625, -0.0267333984375, -0.025482177734375, -0.02423095703125, -0.022979736328125, -0.021728515625, -0.020477294921875, -0.01922607421875, -0.017974853515625, -0.0167236328125, -0.015472412109375, -0.01422119140625, -0.012969970703125, -0.01171875, -0.010467529296875, -0.00921630859375, -0.007965087890625, -0.0067138671875, -0.005462646484375, -0.00421142578125, -0.002960205078125, -0.001708984375, -0.000457763671875, 0.00079345703125, 0.002044677734375, 0.0032958984375, 0.004547119140625, 0.00579833984375, 0.007049560546875, 0.00830078125, 0.009552001953125, 0.01080322265625, 0.012054443359375, 0.0133056640625, 0.014556884765625, 0.01580810546875, 0.017059326171875, 0.018310546875, 0.019561767578125, 0.02081298828125, 0.022064208984375, 0.0233154296875, 0.024566650390625, 0.02581787109375, 0.027069091796875, 0.0283203125, 0.029571533203125, 0.03082275390625, 0.032073974609375, 0.0333251953125, 0.034576416015625, 0.03582763671875, 0.037078857421875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 9.0, 42.0, 72.0, 138.0, 179.0, 187.0, 177.0, 98.0, 52.0, 23.0, 12.0, 8.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6950697302818298, -0.6665341258049011, -0.6379985213279724, -0.6094629764556885, -0.5809273719787598, -0.552391767501831, -0.5238561630249023, -0.49532055854797363, -0.4667849838733673, -0.4382493793964386, -0.4097138047218323, -0.38117820024490356, -0.35264259576797485, -0.32410702109336853, -0.2955714166164398, -0.2670358419418335, -0.23850023746490479, -0.20996464788913727, -0.18142905831336975, -0.15289345383644104, -0.12435786426067352, -0.095822274684906, -0.0672866702079773, -0.03875108063220978, -0.01021549105644226, 0.018320102244615555, 0.04685569554567337, 0.07539129257202148, 0.103926882147789, 0.13246247172355652, 0.16099807620048523, 0.18953366577625275, 0.21806931495666504, 0.24660490453243256, 0.2751404941082001, 0.3036760985851288, 0.3322116732597351, 0.3607472777366638, 0.38928288221359253, 0.41781848669052124, 0.44635406136512756, 0.4748896658420563, 0.5034252405166626, 0.5319608449935913, 0.56049644947052, 0.5890320539474487, 0.6175676584243774, 0.6461032032966614, 0.6746388077735901, 0.7031744122505188, 0.7317100167274475, 0.7602455615997314, 0.7887811660766602, 0.8173167705535889, 0.8458523750305176, 0.8743879795074463, 0.902923583984375, 0.9314591884613037, 0.9599947929382324, 0.9885303974151611, 1.0170660018920898, 1.0456016063690186, 1.0741372108459473, 1.1026726961135864, 1.1312083005905151]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 0.0, 1.0, 6.0, 6.0, 3.0, 6.0, 17.0, 19.0, 17.0, 19.0, 30.0, 30.0, 32.0, 39.0, 33.0, 47.0, 39.0, 52.0, 46.0, 60.0, 55.0, 50.0, 48.0, 57.0, 48.0, 38.0, 43.0, 36.0, 24.0, 27.0, 16.0, 15.0, 11.0, 10.0, 3.0, 8.0, 4.0, 7.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43116235733032227, -0.4161853790283203, -0.40120840072631836, -0.3862314224243164, -0.37125447392463684, -0.3562774956226349, -0.34130051732063293, -0.326323539018631, -0.3113465905189514, -0.29636961221694946, -0.2813926339149475, -0.26641565561294556, -0.251438707113266, -0.23646172881126404, -0.22148475050926208, -0.20650777220726013, -0.19153079390525818, -0.17655381560325623, -0.16157685220241547, -0.1465998739004135, -0.13162291049957275, -0.1166459321975708, -0.10166895389556885, -0.08669198304414749, -0.07171501219272614, -0.05673804134130478, -0.041761066764593124, -0.02678409218788147, -0.011807121336460114, 0.0031698495149612427, 0.018146827816963196, 0.03312379866838455, 0.04810076951980591, 0.06307774037122726, 0.07805471122264862, 0.09303168952465057, 0.10800866037607193, 0.12298563122749329, 0.13796260952949524, 0.1529395878314972, 0.16791655123233795, 0.1828935295343399, 0.19787049293518066, 0.21284747123718262, 0.22782444953918457, 0.24280141294002533, 0.2577784061431885, 0.27275535464286804, 0.28773233294487, 0.30270931124687195, 0.3176862895488739, 0.33266323804855347, 0.3476402163505554, 0.3626171946525574, 0.3775941729545593, 0.3925711512565613, 0.40754812955856323, 0.4225251078605652, 0.43750208616256714, 0.4524790644645691, 0.46745601296424866, 0.4824329912662506, 0.49740996956825256, 0.5123869180679321, 0.5273638963699341]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 5.0, 8.0, 8.0, 16.0, 26.0, 37.0, 53.0, 108.0, 158.0, 234.0, 397.0, 677.0, 1250.0, 2270.0, 4771.0, 11174.0, 29903.0, 112532.0, 3425749.0, 504155.0, 64729.0, 19988.0, 7844.0, 3713.0, 1841.0, 1062.0, 571.0, 362.0, 215.0, 137.0, 111.0, 58.0, 40.0, 28.0, 12.0, 9.0, 9.0, 6.0, 3.0, 5.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07421875, -0.07145118713378906, -0.06868362426757812, -0.06591606140136719, -0.06314849853515625, -0.06038093566894531, -0.057613372802734375, -0.05484580993652344, -0.0520782470703125, -0.04931068420410156, -0.046543121337890625, -0.04377555847167969, -0.04100799560546875, -0.03824043273925781, -0.035472869873046875, -0.03270530700683594, -0.029937744140625, -0.027170181274414062, -0.024402618408203125, -0.021635055541992188, -0.01886749267578125, -0.016099929809570312, -0.013332366943359375, -0.010564804077148438, -0.0077972412109375, -0.0050296783447265625, -0.002262115478515625, 0.0005054473876953125, 0.00327301025390625, 0.0060405731201171875, 0.008808135986328125, 0.011575698852539062, 0.01434326171875, 0.017110824584960938, 0.019878387451171875, 0.022645950317382812, 0.02541351318359375, 0.028181076049804688, 0.030948638916015625, 0.03371620178222656, 0.0364837646484375, 0.03925132751464844, 0.042018890380859375, 0.04478645324707031, 0.04755401611328125, 0.05032157897949219, 0.053089141845703125, 0.05585670471191406, 0.058624267578125, 0.06139183044433594, 0.06415939331054688, 0.06692695617675781, 0.06969451904296875, 0.07246208190917969, 0.07522964477539062, 0.07799720764160156, 0.0807647705078125, 0.08353233337402344, 0.08629989624023438, 0.08906745910644531, 0.09183502197265625, 0.09460258483886719, 0.09737014770507812, 0.10013771057128906, 0.1029052734375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 10.0, 4.0, 9.0, 9.0, 11.0, 18.0, 25.0, 43.0, 38.0, 48.0, 67.0, 57.0, 78.0, 53.0, 69.0, 72.0, 65.0, 64.0, 52.0, 44.0, 44.0, 29.0, 14.0, 32.0, 10.0, 11.0, 7.0, 2.0, 4.0, 6.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0169219970703125, -0.016196012496948242, -0.015470027923583984, -0.014744043350219727, -0.014018058776855469, -0.013292074203491211, -0.012566089630126953, -0.011840105056762695, -0.011114120483398438, -0.01038813591003418, -0.009662151336669922, -0.008936166763305664, -0.008210182189941406, -0.0074841976165771484, -0.006758213043212891, -0.006032228469848633, -0.005306243896484375, -0.004580259323120117, -0.0038542747497558594, -0.0031282901763916016, -0.0024023056030273438, -0.001676321029663086, -0.0009503364562988281, -0.0002243518829345703, 0.0005016326904296875, 0.0012276172637939453, 0.001953601837158203, 0.002679586410522461, 0.0034055709838867188, 0.0041315555572509766, 0.004857540130615234, 0.005583524703979492, 0.00630950927734375, 0.007035493850708008, 0.007761478424072266, 0.008487462997436523, 0.009213447570800781, 0.009939432144165039, 0.010665416717529297, 0.011391401290893555, 0.012117385864257812, 0.01284337043762207, 0.013569355010986328, 0.014295339584350586, 0.015021324157714844, 0.0157473087310791, 0.01647329330444336, 0.017199277877807617, 0.017925262451171875, 0.018651247024536133, 0.01937723159790039, 0.02010321617126465, 0.020829200744628906, 0.021555185317993164, 0.022281169891357422, 0.02300715446472168, 0.023733139038085938, 0.024459123611450195, 0.025185108184814453, 0.02591109275817871, 0.02663707733154297, 0.027363061904907227, 0.028089046478271484, 0.028815031051635742, 0.029541015625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 5.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 6.0, 13.0, 12.0, 23.0, 44.0, 46.0, 80.0, 100.0, 162.0, 235.0, 337.0, 501.0, 725.0, 1105.0, 1742.0, 2813.0, 4485.0, 7744.0, 13434.0, 25155.0, 52981.0, 135021.0, 644599.0, 2866360.0, 266990.0, 85334.0, 37628.0, 19226.0, 10745.0, 6177.0, 3777.0, 2313.0, 1460.0, 972.0, 580.0, 459.0, 287.0, 175.0, 111.0, 112.0, 80.0, 48.0, 20.0, 27.0, 16.0, 8.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.053863525390625, -0.05214071273803711, -0.05041790008544922, -0.04869508743286133, -0.04697227478027344, -0.04524946212768555, -0.043526649475097656, -0.041803836822509766, -0.040081024169921875, -0.038358211517333984, -0.036635398864746094, -0.0349125862121582, -0.03318977355957031, -0.03146696090698242, -0.02974414825439453, -0.02802133560180664, -0.02629852294921875, -0.02457571029663086, -0.02285289764404297, -0.021130084991455078, -0.019407272338867188, -0.017684459686279297, -0.015961647033691406, -0.014238834381103516, -0.012516021728515625, -0.010793209075927734, -0.009070396423339844, -0.007347583770751953, -0.0056247711181640625, -0.003901958465576172, -0.0021791458129882812, -0.0004563331604003906, 0.0012664794921875, 0.0029892921447753906, 0.004712104797363281, 0.006434917449951172, 0.008157730102539062, 0.009880542755126953, 0.011603355407714844, 0.013326168060302734, 0.015048980712890625, 0.016771793365478516, 0.018494606018066406, 0.020217418670654297, 0.021940231323242188, 0.023663043975830078, 0.02538585662841797, 0.02710866928100586, 0.02883148193359375, 0.03055429458618164, 0.03227710723876953, 0.03399991989135742, 0.03572273254394531, 0.0374455451965332, 0.039168357849121094, 0.040891170501708984, 0.042613983154296875, 0.044336795806884766, 0.046059608459472656, 0.04778242111206055, 0.04950523376464844, 0.05122804641723633, 0.05295085906982422, 0.05467367172241211, 0.056396484375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 6.0, 8.0, 10.0, 8.0, 17.0, 21.0, 19.0, 38.0, 64.0, 85.0, 168.0, 361.0, 1660.0, 849.0, 295.0, 138.0, 96.0, 56.0, 43.0, 32.0, 26.0, 20.0, 18.0, 9.0, 12.0, 5.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034942626953125, -0.03368806838989258, -0.032433509826660156, -0.031178951263427734, -0.029924392700195312, -0.02866983413696289, -0.02741527557373047, -0.026160717010498047, -0.024906158447265625, -0.023651599884033203, -0.02239704132080078, -0.02114248275756836, -0.019887924194335938, -0.018633365631103516, -0.017378807067871094, -0.016124248504638672, -0.01486968994140625, -0.013615131378173828, -0.012360572814941406, -0.011106014251708984, -0.009851455688476562, -0.00859689712524414, -0.007342338562011719, -0.006087779998779297, -0.004833221435546875, -0.003578662872314453, -0.0023241043090820312, -0.0010695457458496094, 0.0001850128173828125, 0.0014395713806152344, 0.0026941299438476562, 0.003948688507080078, 0.0052032470703125, 0.006457805633544922, 0.007712364196777344, 0.008966922760009766, 0.010221481323242188, 0.01147603988647461, 0.012730598449707031, 0.013985157012939453, 0.015239715576171875, 0.016494274139404297, 0.01774883270263672, 0.01900339126586914, 0.020257949829101562, 0.021512508392333984, 0.022767066955566406, 0.024021625518798828, 0.02527618408203125, 0.026530742645263672, 0.027785301208496094, 0.029039859771728516, 0.030294418334960938, 0.03154897689819336, 0.03280353546142578, 0.0340580940246582, 0.035312652587890625, 0.03656721115112305, 0.03782176971435547, 0.03907632827758789, 0.04033088684082031, 0.041585445404052734, 0.042840003967285156, 0.04409456253051758, 0.04534912109375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 11.0, 20.0, 37.0, 67.0, 115.0, 168.0, 169.0, 165.0, 110.0, 62.0, 34.0, 24.0, 14.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17778435349464417, -0.16735491156578064, -0.15692545473575592, -0.1464960128068924, -0.13606657087802887, -0.12563711404800415, -0.11520767211914062, -0.1047782301902771, -0.09434878081083298, -0.08391933143138885, -0.07348988950252533, -0.06306044012308121, -0.05263099446892738, -0.04220154881477356, -0.03177209943532944, -0.021342657506465912, -0.01091320812702179, -0.0004837615415453911, 0.009945685043931007, 0.02037513256072998, 0.030804578214883804, 0.04123402386903763, 0.05166347324848175, 0.062092915177345276, 0.0725223645567894, 0.08295181393623352, 0.09338125586509705, 0.10381070524454117, 0.11424015462398529, 0.12466959655284882, 0.13509905338287354, 0.14552849531173706, 0.15595793724060059, 0.1663873791694641, 0.17681683599948883, 0.18724627792835236, 0.19767571985721588, 0.2081051766872406, 0.21853461861610413, 0.22896406054496765, 0.23939350247383118, 0.2498229444026947, 0.2602523863315582, 0.27068185806274414, 0.28111129999160767, 0.2915407419204712, 0.3019701838493347, 0.31239962577819824, 0.32282906770706177, 0.3332585096359253, 0.3436879515647888, 0.35411739349365234, 0.36454686522483826, 0.3749763071537018, 0.3854057490825653, 0.39583519101142883, 0.40626466274261475, 0.41669410467147827, 0.4271235466003418, 0.4375529885292053, 0.44798246026039124, 0.45841190218925476, 0.4688413441181183, 0.4792707860469818, 0.48970022797584534]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 5.0, 5.0, 2.0, 10.0, 10.0, 7.0, 15.0, 11.0, 16.0, 14.0, 20.0, 20.0, 27.0, 27.0, 18.0, 39.0, 39.0, 27.0, 35.0, 29.0, 45.0, 25.0, 48.0, 48.0, 35.0, 47.0, 40.0, 35.0, 30.0, 37.0, 29.0, 32.0, 28.0, 14.0, 14.0, 18.0, 17.0, 10.0, 21.0, 11.0, 10.0, 8.0, 10.0, 3.0, 4.0, 3.0, 1.0, 1.0, 5.0, 2.0], "bins": [-0.1448119878768921, -0.14098496735095978, -0.13715794682502747, -0.13333092629909515, -0.12950390577316284, -0.12567687034606934, -0.12184984982013702, -0.11802282929420471, -0.1141958087682724, -0.11036878824234009, -0.10654176771640778, -0.10271473973989487, -0.09888771921396255, -0.09506069868803024, -0.09123367071151733, -0.08740665018558502, -0.08357962965965271, -0.0797526091337204, -0.07592558860778809, -0.07209856063127518, -0.06827154010534286, -0.06444451957941055, -0.06061749532818794, -0.05679047107696533, -0.05296345055103302, -0.04913643002510071, -0.0453094057738781, -0.04148238152265549, -0.037655360996723175, -0.03382834047079086, -0.030001316219568253, -0.02617429383099079, -0.02234727144241333, -0.01852024905383587, -0.014693226665258408, -0.010866204276680946, -0.007039181888103485, -0.003212159499526024, 0.0006148628890514374, 0.004441885277628899, 0.00826890766620636, 0.012095930054783821, 0.015922952443361282, 0.019749974831938744, 0.023576997220516205, 0.027404019609093666, 0.031231041997671127, 0.03505806624889374, 0.03888508677482605, 0.04271210730075836, 0.04653913155198097, 0.05036615580320358, 0.054193176329135895, 0.05802019685506821, 0.06184722110629082, 0.06567424535751343, 0.06950126588344574, 0.07332828640937805, 0.07715530693531036, 0.08098233491182327, 0.08480935543775558, 0.0886363759636879, 0.0924634039402008, 0.09629042446613312, 0.10011744499206543]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 8.0, 3.0, 5.0, 4.0, 9.0, 9.0, 18.0, 31.0, 47.0, 57.0, 72.0, 113.0, 145.0, 256.0, 374.0, 525.0, 851.0, 1359.0, 2296.0, 3776.0, 6470.0, 11826.0, 22424.0, 44515.0, 93869.0, 208800.0, 322422.0, 170001.0, 77334.0, 37447.0, 18991.0, 10211.0, 5571.0, 3276.0, 1976.0, 1232.0, 813.0, 482.0, 326.0, 207.0, 134.0, 84.0, 58.0, 42.0, 27.0, 24.0, 16.0, 8.0, 10.0, 2.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.056488037109375, -0.0545649528503418, -0.052641868591308594, -0.05071878433227539, -0.04879570007324219, -0.046872615814208984, -0.04494953155517578, -0.04302644729614258, -0.041103363037109375, -0.03918027877807617, -0.03725719451904297, -0.035334110260009766, -0.03341102600097656, -0.03148794174194336, -0.029564857482910156, -0.027641773223876953, -0.02571868896484375, -0.023795604705810547, -0.021872520446777344, -0.01994943618774414, -0.018026351928710938, -0.016103267669677734, -0.014180183410644531, -0.012257099151611328, -0.010334014892578125, -0.008410930633544922, -0.006487846374511719, -0.004564762115478516, -0.0026416778564453125, -0.0007185935974121094, 0.0012044906616210938, 0.003127574920654297, 0.0050506591796875, 0.006973743438720703, 0.008896827697753906, 0.01081991195678711, 0.012742996215820312, 0.014666080474853516, 0.01658916473388672, 0.018512248992919922, 0.020435333251953125, 0.022358417510986328, 0.02428150177001953, 0.026204586029052734, 0.028127670288085938, 0.03005075454711914, 0.031973838806152344, 0.03389692306518555, 0.03582000732421875, 0.03774309158325195, 0.039666175842285156, 0.04158926010131836, 0.04351234436035156, 0.045435428619384766, 0.04735851287841797, 0.04928159713745117, 0.051204681396484375, 0.05312776565551758, 0.05505084991455078, 0.056973934173583984, 0.05889701843261719, 0.06082010269165039, 0.0627431869506836, 0.0646662712097168, 0.06658935546875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 6.0, 5.0, 7.0, 2.0, 5.0, 8.0, 11.0, 5.0, 11.0, 26.0, 34.0, 37.0, 47.0, 41.0, 57.0, 55.0, 55.0, 58.0, 56.0, 62.0, 73.0, 83.0, 40.0, 31.0, 39.0, 33.0, 29.0, 18.0, 20.0, 12.0, 15.0, 6.0, 5.0, 7.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01824951171875, -0.01758432388305664, -0.01691913604736328, -0.016253948211669922, -0.015588760375976562, -0.014923572540283203, -0.014258384704589844, -0.013593196868896484, -0.012928009033203125, -0.012262821197509766, -0.011597633361816406, -0.010932445526123047, -0.010267257690429688, -0.009602069854736328, -0.008936882019042969, -0.00827169418334961, -0.00760650634765625, -0.006941318511962891, -0.006276130676269531, -0.005610942840576172, -0.0049457550048828125, -0.004280567169189453, -0.0036153793334960938, -0.0029501914978027344, -0.002285003662109375, -0.0016198158264160156, -0.0009546279907226562, -0.0002894401550292969, 0.0003757476806640625, 0.0010409355163574219, 0.0017061233520507812, 0.0023713111877441406, 0.0030364990234375, 0.0037016868591308594, 0.004366874694824219, 0.005032062530517578, 0.0056972503662109375, 0.006362438201904297, 0.007027626037597656, 0.007692813873291016, 0.008358001708984375, 0.009023189544677734, 0.009688377380371094, 0.010353565216064453, 0.011018753051757812, 0.011683940887451172, 0.012349128723144531, 0.01301431655883789, 0.01367950439453125, 0.01434469223022461, 0.015009880065917969, 0.015675067901611328, 0.016340255737304688, 0.017005443572998047, 0.017670631408691406, 0.018335819244384766, 0.019001007080078125, 0.019666194915771484, 0.020331382751464844, 0.020996570587158203, 0.021661758422851562, 0.022326946258544922, 0.02299213409423828, 0.02365732192993164, 0.024322509765625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 9.0, 5.0, 8.0, 7.0, 7.0, 23.0, 35.0, 42.0, 69.0, 89.0, 124.0, 159.0, 243.0, 421.0, 550.0, 1054.0, 2137.0, 5378.0, 13835.0, 41200.0, 130828.0, 391507.0, 313058.0, 97694.0, 31067.0, 10612.0, 4074.0, 1843.0, 953.0, 494.0, 312.0, 229.0, 139.0, 94.0, 58.0, 58.0, 38.0, 25.0, 23.0, 20.0, 16.0, 8.0, 4.0, 4.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0694580078125, -0.06713294982910156, -0.06480789184570312, -0.06248283386230469, -0.06015777587890625, -0.05783271789550781, -0.055507659912109375, -0.05318260192871094, -0.0508575439453125, -0.04853248596191406, -0.046207427978515625, -0.04388236999511719, -0.04155731201171875, -0.03923225402832031, -0.036907196044921875, -0.03458213806152344, -0.032257080078125, -0.029932022094726562, -0.027606964111328125, -0.025281906127929688, -0.02295684814453125, -0.020631790161132812, -0.018306732177734375, -0.015981674194335938, -0.0136566162109375, -0.011331558227539062, -0.009006500244140625, -0.0066814422607421875, -0.00435638427734375, -0.0020313262939453125, 0.000293731689453125, 0.0026187896728515625, 0.00494384765625, 0.0072689056396484375, 0.009593963623046875, 0.011919021606445312, 0.01424407958984375, 0.016569137573242188, 0.018894195556640625, 0.021219253540039062, 0.0235443115234375, 0.025869369506835938, 0.028194427490234375, 0.030519485473632812, 0.03284454345703125, 0.03516960144042969, 0.037494659423828125, 0.03981971740722656, 0.042144775390625, 0.04446983337402344, 0.046794891357421875, 0.04911994934082031, 0.05144500732421875, 0.05377006530761719, 0.056095123291015625, 0.05842018127441406, 0.0607452392578125, 0.06307029724121094, 0.06539535522460938, 0.06772041320800781, 0.07004547119140625, 0.07237052917480469, 0.07469558715820312, 0.07702064514160156, 0.079345703125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 5.0, 4.0, 3.0, 5.0, 9.0, 7.0, 13.0, 9.0, 16.0, 13.0, 16.0, 20.0, 27.0, 21.0, 32.0, 33.0, 32.0, 40.0, 32.0, 50.0, 38.0, 42.0, 40.0, 64.0, 26.0, 23.0, 34.0, 29.0, 42.0, 35.0, 31.0, 34.0, 25.0, 24.0, 24.0, 25.0, 18.0, 16.0, 9.0, 5.0, 7.0, 8.0, 5.0, 4.0, 5.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.06695556640625, -0.06477832794189453, -0.06260108947753906, -0.060423851013183594, -0.058246612548828125, -0.056069374084472656, -0.05389213562011719, -0.05171489715576172, -0.04953765869140625, -0.04736042022705078, -0.04518318176269531, -0.043005943298339844, -0.040828704833984375, -0.038651466369628906, -0.03647422790527344, -0.03429698944091797, -0.0321197509765625, -0.02994251251220703, -0.027765274047851562, -0.025588035583496094, -0.023410797119140625, -0.021233558654785156, -0.019056320190429688, -0.01687908172607422, -0.01470184326171875, -0.012524604797363281, -0.010347366333007812, -0.008170127868652344, -0.005992889404296875, -0.0038156509399414062, -0.0016384124755859375, 0.0005388259887695312, 0.002716064453125, 0.004893302917480469, 0.0070705413818359375, 0.009247779846191406, 0.011425018310546875, 0.013602256774902344, 0.015779495239257812, 0.01795673370361328, 0.02013397216796875, 0.02231121063232422, 0.024488449096679688, 0.026665687561035156, 0.028842926025390625, 0.031020164489746094, 0.03319740295410156, 0.03537464141845703, 0.0375518798828125, 0.03972911834716797, 0.04190635681152344, 0.044083595275878906, 0.046260833740234375, 0.048438072204589844, 0.05061531066894531, 0.05279254913330078, 0.05496978759765625, 0.05714702606201172, 0.05932426452636719, 0.061501502990722656, 0.06367874145507812, 0.0658559799194336, 0.06803321838378906, 0.07021045684814453, 0.0723876953125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 8.0, 12.0, 15.0, 21.0, 41.0, 52.0, 81.0, 135.0, 227.0, 387.0, 697.0, 1286.0, 2446.0, 5103.0, 11898.0, 30100.0, 87626.0, 286990.0, 408766.0, 137465.0, 44516.0, 16661.0, 7025.0, 3212.0, 1630.0, 874.0, 500.0, 289.0, 168.0, 106.0, 59.0, 53.0, 39.0, 17.0, 9.0, 9.0, 6.0, 10.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03887939453125, -0.03763294219970703, -0.03638648986816406, -0.035140037536621094, -0.033893585205078125, -0.032647132873535156, -0.03140068054199219, -0.03015422821044922, -0.02890777587890625, -0.02766132354736328, -0.026414871215820312, -0.025168418884277344, -0.023921966552734375, -0.022675514221191406, -0.021429061889648438, -0.02018260955810547, -0.0189361572265625, -0.01768970489501953, -0.016443252563476562, -0.015196800231933594, -0.013950347900390625, -0.012703895568847656, -0.011457443237304688, -0.010210990905761719, -0.00896453857421875, -0.007718086242675781, -0.0064716339111328125, -0.005225181579589844, -0.003978729248046875, -0.0027322769165039062, -0.0014858245849609375, -0.00023937225341796875, 0.001007080078125, 0.0022535324096679688, 0.0034999847412109375, 0.004746437072753906, 0.005992889404296875, 0.007239341735839844, 0.008485794067382812, 0.009732246398925781, 0.01097869873046875, 0.012225151062011719, 0.013471603393554688, 0.014718055725097656, 0.015964508056640625, 0.017210960388183594, 0.018457412719726562, 0.01970386505126953, 0.0209503173828125, 0.02219676971435547, 0.023443222045898438, 0.024689674377441406, 0.025936126708984375, 0.027182579040527344, 0.028429031372070312, 0.02967548370361328, 0.03092193603515625, 0.03216838836669922, 0.03341484069824219, 0.034661293029785156, 0.035907745361328125, 0.037154197692871094, 0.03840065002441406, 0.03964710235595703, 0.0408935546875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 6.0, 12.0, 12.0, 15.0, 24.0, 20.0, 46.0, 68.0, 67.0, 84.0, 96.0, 106.0, 91.0, 86.0, 65.0, 57.0, 36.0, 29.0, 26.0, 22.0, 5.0, 11.0, 1.0, 5.0, 8.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5822391510009766e-05, -3.46088781952858e-05, -3.339536488056183e-05, -3.218185156583786e-05, -3.096833825111389e-05, -2.9754824936389923e-05, -2.8541311621665955e-05, -2.7327798306941986e-05, -2.6114284992218018e-05, -2.490077167749405e-05, -2.368725836277008e-05, -2.2473745048046112e-05, -2.1260231733322144e-05, -2.0046718418598175e-05, -1.8833205103874207e-05, -1.7619691789150238e-05, -1.640617847442627e-05, -1.5192665159702301e-05, -1.3979151844978333e-05, -1.2765638530254364e-05, -1.1552125215530396e-05, -1.0338611900806427e-05, -9.125098586082458e-06, -7.91158527135849e-06, -6.6980719566345215e-06, -5.484558641910553e-06, -4.2710453271865845e-06, -3.057532012462616e-06, -1.8440186977386475e-06, -6.30505383014679e-07, 5.830079317092896e-07, 1.796521246433258e-06, 3.0100345611572266e-06, 4.223547875881195e-06, 5.4370611906051636e-06, 6.650574505329132e-06, 7.8640878200531e-06, 9.077601134777069e-06, 1.0291114449501038e-05, 1.1504627764225006e-05, 1.2718141078948975e-05, 1.3931654393672943e-05, 1.5145167708396912e-05, 1.635868102312088e-05, 1.757219433784485e-05, 1.8785707652568817e-05, 1.9999220967292786e-05, 2.1212734282016754e-05, 2.2426247596740723e-05, 2.363976091146469e-05, 2.485327422618866e-05, 2.6066787540912628e-05, 2.7280300855636597e-05, 2.8493814170360565e-05, 2.9707327485084534e-05, 3.09208407998085e-05, 3.213435411453247e-05, 3.334786742925644e-05, 3.456138074398041e-05, 3.5774894058704376e-05, 3.6988407373428345e-05, 3.820192068815231e-05, 3.941543400287628e-05, 4.062894731760025e-05, 4.184246063232422e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 4.0, 6.0, 10.0, 11.0, 18.0, 20.0, 37.0, 51.0, 77.0, 114.0, 160.0, 308.0, 547.0, 995.0, 2022.0, 4057.0, 8856.0, 21707.0, 63537.0, 225624.0, 474423.0, 164985.0, 48794.0, 17735.0, 7199.0, 3478.0, 1708.0, 819.0, 489.0, 279.0, 158.0, 106.0, 73.0, 35.0, 31.0, 21.0, 18.0, 20.0, 3.0, 7.0, 4.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.041229248046875, -0.03991556167602539, -0.03860187530517578, -0.03728818893432617, -0.03597450256347656, -0.03466081619262695, -0.033347129821777344, -0.032033443450927734, -0.030719757080078125, -0.029406070709228516, -0.028092384338378906, -0.026778697967529297, -0.025465011596679688, -0.024151325225830078, -0.02283763885498047, -0.02152395248413086, -0.02021026611328125, -0.01889657974243164, -0.01758289337158203, -0.016269207000732422, -0.014955520629882812, -0.013641834259033203, -0.012328147888183594, -0.011014461517333984, -0.009700775146484375, -0.008387088775634766, -0.007073402404785156, -0.005759716033935547, -0.0044460296630859375, -0.003132343292236328, -0.0018186569213867188, -0.0005049705505371094, 0.0008087158203125, 0.0021224021911621094, 0.0034360885620117188, 0.004749774932861328, 0.0060634613037109375, 0.007377147674560547, 0.008690834045410156, 0.010004520416259766, 0.011318206787109375, 0.012631893157958984, 0.013945579528808594, 0.015259265899658203, 0.016572952270507812, 0.017886638641357422, 0.01920032501220703, 0.02051401138305664, 0.02182769775390625, 0.02314138412475586, 0.02445507049560547, 0.025768756866455078, 0.027082443237304688, 0.028396129608154297, 0.029709815979003906, 0.031023502349853516, 0.032337188720703125, 0.033650875091552734, 0.034964561462402344, 0.03627824783325195, 0.03759193420410156, 0.03890562057495117, 0.04021930694580078, 0.04153299331665039, 0.0428466796875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 8.0, 13.0, 15.0, 21.0, 21.0, 21.0, 36.0, 36.0, 65.0, 72.0, 69.0, 103.0, 78.0, 75.0, 60.0, 52.0, 36.0, 52.0, 30.0, 24.0, 28.0, 13.0, 14.0, 7.0, 14.0, 9.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0297698974609375, -0.02870965003967285, -0.027649402618408203, -0.026589155197143555, -0.025528907775878906, -0.024468660354614258, -0.02340841293334961, -0.02234816551208496, -0.021287918090820312, -0.020227670669555664, -0.019167423248291016, -0.018107175827026367, -0.01704692840576172, -0.01598668098449707, -0.014926433563232422, -0.013866186141967773, -0.012805938720703125, -0.011745691299438477, -0.010685443878173828, -0.00962519645690918, -0.008564949035644531, -0.007504701614379883, -0.006444454193115234, -0.005384206771850586, -0.0043239593505859375, -0.003263711929321289, -0.0022034645080566406, -0.0011432170867919922, -8.296966552734375e-05, 0.0009772777557373047, 0.002037525177001953, 0.0030977725982666016, 0.00415802001953125, 0.0052182674407958984, 0.006278514862060547, 0.007338762283325195, 0.008399009704589844, 0.009459257125854492, 0.01051950454711914, 0.011579751968383789, 0.012639999389648438, 0.013700246810913086, 0.014760494232177734, 0.015820741653442383, 0.01688098907470703, 0.01794123649597168, 0.019001483917236328, 0.020061731338500977, 0.021121978759765625, 0.022182226181030273, 0.023242473602294922, 0.02430272102355957, 0.02536296844482422, 0.026423215866088867, 0.027483463287353516, 0.028543710708618164, 0.029603958129882812, 0.03066420555114746, 0.03172445297241211, 0.03278470039367676, 0.033844947814941406, 0.034905195236206055, 0.0359654426574707, 0.03702569007873535, 0.0380859375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 8.0, 12.0, 20.0, 48.0, 64.0, 115.0, 168.0, 183.0, 153.0, 113.0, 67.0, 34.0, 13.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8925408124923706, -0.8664276003837585, -0.8403143882751465, -0.8142011165618896, -0.7880879044532776, -0.7619746923446655, -0.7358614802360535, -0.7097482681274414, -0.6836349964141846, -0.6575217843055725, -0.6314085721969604, -0.6052953004837036, -0.5791820883750916, -0.5530688762664795, -0.5269556641578674, -0.5008424520492554, -0.4747292101383209, -0.44861599802970886, -0.4225027561187744, -0.39638954401016235, -0.3702763020992279, -0.34416308999061584, -0.3180498480796814, -0.29193663597106934, -0.2658234238624573, -0.23971019685268402, -0.21359696984291077, -0.1874837577342987, -0.16137051582336426, -0.1352573037147522, -0.10914407670497894, -0.08303084969520569, -0.05691760778427124, -0.030804382637143135, -0.00469115749001503, 0.021422065794467926, 0.04753529280424118, 0.07364851236343384, 0.09976173937320709, 0.12587496638298035, 0.1519881933927536, 0.17810142040252686, 0.2042146474123001, 0.23032787442207336, 0.2564410865306854, 0.2825543284416199, 0.30866754055023193, 0.334780752658844, 0.36089399456977844, 0.3870072066783905, 0.41312044858932495, 0.439233660697937, 0.46534690260887146, 0.4914601147174835, 0.517573356628418, 0.54368656873703, 0.5697997808456421, 0.5959129929542542, 0.6220262050628662, 0.648139476776123, 0.6742526888847351, 0.7003659009933472, 0.7264791131019592, 0.7525923252105713, 0.7787055969238281]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 9.0, 10.0, 6.0, 11.0, 9.0, 8.0, 21.0, 24.0, 20.0, 35.0, 33.0, 34.0, 53.0, 31.0, 45.0, 41.0, 48.0, 47.0, 57.0, 36.0, 51.0, 43.0, 56.0, 39.0, 46.0, 32.0, 21.0, 17.0, 24.0, 11.0, 14.0, 9.0, 9.0, 11.0, 11.0, 13.0, 3.0, 3.0, 2.0, 1.0, 1.0, 6.0, 4.0, 1.0], "bins": [-0.551406741142273, -0.5369205474853516, -0.5224342942237854, -0.507948100566864, -0.49346187710762024, -0.47897568345069885, -0.4644894599914551, -0.4500032663345337, -0.4355170428752899, -0.42103081941604614, -0.40654462575912476, -0.392058402299881, -0.3775721788406372, -0.3630859851837158, -0.34859976172447205, -0.33411353826522827, -0.3196273446083069, -0.3051411211490631, -0.2906549274921417, -0.27616870403289795, -0.2616824805736542, -0.2471962869167328, -0.232710063457489, -0.21822385489940643, -0.20373761653900146, -0.18925140798091888, -0.1747651845216751, -0.16027897596359253, -0.14579276740550995, -0.13130655884742737, -0.1168203353881836, -0.10233412683010101, -0.08784791827201843, -0.07336170226335526, -0.058875493705272675, -0.0443892776966095, -0.029903065413236618, -0.015416853129863739, -0.0009306371212005615, 0.013555571436882019, 0.028041787445545197, 0.042527999728918076, 0.057014212012290955, 0.07150042802095413, 0.08598664402961731, 0.10047285258769989, 0.11495906859636307, 0.12944528460502625, 0.14393149316310883, 0.1584177017211914, 0.17290392518043518, 0.18739013373851776, 0.20187634229660034, 0.21636256575584412, 0.2308487743139267, 0.24533498287200928, 0.25982120633125305, 0.2743074297904968, 0.2887936234474182, 0.303279846906662, 0.31776607036590576, 0.33225226402282715, 0.3467384874820709, 0.3612247109413147, 0.3757109045982361]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 6.0, 13.0, 15.0, 17.0, 27.0, 39.0, 50.0, 92.0, 150.0, 213.0, 375.0, 679.0, 1127.0, 2288.0, 4617.0, 10707.0, 29043.0, 108291.0, 2983123.0, 928258.0, 82833.0, 24093.0, 9256.0, 4139.0, 1983.0, 1134.0, 614.0, 397.0, 214.0, 154.0, 105.0, 76.0, 45.0, 40.0, 19.0, 17.0, 9.0, 8.0, 5.0, 2.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0782470703125, -0.07544422149658203, -0.07264137268066406, -0.0698385238647461, -0.06703567504882812, -0.06423282623291016, -0.06142997741699219, -0.05862712860107422, -0.05582427978515625, -0.05302143096923828, -0.05021858215332031, -0.047415733337402344, -0.044612884521484375, -0.041810035705566406, -0.03900718688964844, -0.03620433807373047, -0.0334014892578125, -0.03059864044189453, -0.027795791625976562, -0.024992942810058594, -0.022190093994140625, -0.019387245178222656, -0.016584396362304688, -0.013781547546386719, -0.01097869873046875, -0.008175849914550781, -0.0053730010986328125, -0.0025701522827148438, 0.000232696533203125, 0.0030355453491210938, 0.0058383941650390625, 0.008641242980957031, 0.011444091796875, 0.014246940612792969, 0.017049789428710938, 0.019852638244628906, 0.022655487060546875, 0.025458335876464844, 0.028261184692382812, 0.03106403350830078, 0.03386688232421875, 0.03666973114013672, 0.03947257995605469, 0.042275428771972656, 0.045078277587890625, 0.047881126403808594, 0.05068397521972656, 0.05348682403564453, 0.0562896728515625, 0.05909252166748047, 0.06189537048339844, 0.0646982192993164, 0.06750106811523438, 0.07030391693115234, 0.07310676574707031, 0.07590961456298828, 0.07871246337890625, 0.08151531219482422, 0.08431816101074219, 0.08712100982666016, 0.08992385864257812, 0.0927267074584961, 0.09552955627441406, 0.09833240509033203, 0.10113525390625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 4.0, 6.0, 5.0, 3.0, 4.0, 4.0, 7.0, 8.0, 13.0, 16.0, 25.0, 47.0, 43.0, 47.0, 63.0, 66.0, 49.0, 67.0, 77.0, 68.0, 65.0, 65.0, 64.0, 41.0, 25.0, 25.0, 21.0, 20.0, 17.0, 14.0, 8.0, 6.0, 3.0, 4.0, 6.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01751708984375, -0.016731739044189453, -0.015946388244628906, -0.01516103744506836, -0.014375686645507812, -0.013590335845947266, -0.012804985046386719, -0.012019634246826172, -0.011234283447265625, -0.010448932647705078, -0.009663581848144531, -0.008878231048583984, -0.008092880249023438, -0.007307529449462891, -0.006522178649902344, -0.005736827850341797, -0.00495147705078125, -0.004166126251220703, -0.0033807754516601562, -0.0025954246520996094, -0.0018100738525390625, -0.0010247230529785156, -0.00023937225341796875, 0.0005459785461425781, 0.001331329345703125, 0.002116680145263672, 0.0029020309448242188, 0.0036873817443847656, 0.0044727325439453125, 0.005258083343505859, 0.006043434143066406, 0.006828784942626953, 0.0076141357421875, 0.008399486541748047, 0.009184837341308594, 0.00997018814086914, 0.010755538940429688, 0.011540889739990234, 0.012326240539550781, 0.013111591339111328, 0.013896942138671875, 0.014682292938232422, 0.015467643737792969, 0.016252994537353516, 0.017038345336914062, 0.01782369613647461, 0.018609046936035156, 0.019394397735595703, 0.02017974853515625, 0.020965099334716797, 0.021750450134277344, 0.02253580093383789, 0.023321151733398438, 0.024106502532958984, 0.02489185333251953, 0.025677204132080078, 0.026462554931640625, 0.027247905731201172, 0.02803325653076172, 0.028818607330322266, 0.029603958129882812, 0.03038930892944336, 0.031174659729003906, 0.03196001052856445, 0.032745361328125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 9.0, 14.0, 20.0, 30.0, 41.0, 73.0, 118.0, 178.0, 305.0, 471.0, 970.0, 1748.0, 3324.0, 6416.0, 14026.0, 32387.0, 88407.0, 356761.0, 3100699.0, 425053.0, 98352.0, 35132.0, 15211.0, 6930.0, 3565.0, 1788.0, 919.0, 547.0, 313.0, 178.0, 100.0, 69.0, 42.0, 30.0, 18.0, 14.0, 10.0, 9.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.07757568359375, -0.0753931999206543, -0.0732107162475586, -0.07102823257446289, -0.06884574890136719, -0.06666326522827148, -0.06448078155517578, -0.06229829788208008, -0.060115814208984375, -0.05793333053588867, -0.05575084686279297, -0.053568363189697266, -0.05138587951660156, -0.04920339584350586, -0.047020912170410156, -0.04483842849731445, -0.04265594482421875, -0.04047346115112305, -0.038290977478027344, -0.03610849380493164, -0.03392601013183594, -0.031743526458740234, -0.02956104278564453, -0.027378559112548828, -0.025196075439453125, -0.023013591766357422, -0.02083110809326172, -0.018648624420166016, -0.016466140747070312, -0.01428365707397461, -0.012101173400878906, -0.009918689727783203, -0.0077362060546875, -0.005553722381591797, -0.0033712387084960938, -0.0011887550354003906, 0.0009937286376953125, 0.0031762123107910156, 0.005358695983886719, 0.007541179656982422, 0.009723663330078125, 0.011906147003173828, 0.014088630676269531, 0.016271114349365234, 0.018453598022460938, 0.02063608169555664, 0.022818565368652344, 0.025001049041748047, 0.02718353271484375, 0.029366016387939453, 0.031548500061035156, 0.03373098373413086, 0.03591346740722656, 0.038095951080322266, 0.04027843475341797, 0.04246091842651367, 0.044643402099609375, 0.04682588577270508, 0.04900836944580078, 0.051190853118896484, 0.05337333679199219, 0.05555582046508789, 0.057738304138183594, 0.0599207878112793, 0.062103271484375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 4.0, 8.0, 13.0, 14.0, 15.0, 23.0, 29.0, 43.0, 57.0, 84.0, 109.0, 209.0, 469.0, 1376.0, 793.0, 291.0, 170.0, 102.0, 72.0, 49.0, 33.0, 26.0, 19.0, 14.0, 17.0, 11.0, 9.0, 7.0, 4.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036590576171875, -0.035320281982421875, -0.03404998779296875, -0.032779693603515625, -0.0315093994140625, -0.030239105224609375, -0.02896881103515625, -0.027698516845703125, -0.02642822265625, -0.025157928466796875, -0.02388763427734375, -0.022617340087890625, -0.0213470458984375, -0.020076751708984375, -0.01880645751953125, -0.017536163330078125, -0.016265869140625, -0.014995574951171875, -0.01372528076171875, -0.012454986572265625, -0.0111846923828125, -0.009914398193359375, -0.00864410400390625, -0.007373809814453125, -0.006103515625, -0.004833221435546875, -0.00356292724609375, -0.002292633056640625, -0.0010223388671875, 0.000247955322265625, 0.00151824951171875, 0.002788543701171875, 0.004058837890625, 0.005329132080078125, 0.00659942626953125, 0.007869720458984375, 0.0091400146484375, 0.010410308837890625, 0.01168060302734375, 0.012950897216796875, 0.01422119140625, 0.015491485595703125, 0.01676177978515625, 0.018032073974609375, 0.0193023681640625, 0.020572662353515625, 0.02184295654296875, 0.023113250732421875, 0.024383544921875, 0.025653839111328125, 0.02692413330078125, 0.028194427490234375, 0.0294647216796875, 0.030735015869140625, 0.03200531005859375, 0.033275604248046875, 0.0345458984375, 0.035816192626953125, 0.03708648681640625, 0.038356781005859375, 0.0396270751953125, 0.040897369384765625, 0.04216766357421875, 0.043437957763671875, 0.044708251953125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 8.0, 11.0, 12.0, 31.0, 38.0, 104.0, 127.0, 167.0, 177.0, 128.0, 101.0, 53.0, 29.0, 11.0, 7.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3000304102897644, -0.28862038254737854, -0.2772103548049927, -0.2658003270626068, -0.25439029932022095, -0.24298027157783508, -0.23157022893428802, -0.22016020119190216, -0.2087501734495163, -0.19734014570713043, -0.18593011796474457, -0.1745200753211975, -0.16311004757881165, -0.15170001983642578, -0.14028999209403992, -0.12887996435165405, -0.11746993660926819, -0.10605990886688232, -0.09464988112449646, -0.08323984593153, -0.07182981818914413, -0.06041979044675827, -0.04900975525379181, -0.037599727511405945, -0.02618969976902008, -0.014779670163989067, -0.0033696405589580536, 0.008040390908718109, 0.019450418651103973, 0.030860446393489838, 0.0422704815864563, 0.05368050932884216, 0.06509053707122803, 0.07650056481361389, 0.08791059255599976, 0.09932062774896622, 0.11073065549135208, 0.12214068323373795, 0.1335507184267044, 0.14496074616909027, 0.15637077391147614, 0.167780801653862, 0.17919082939624786, 0.19060087203979492, 0.2020108997821808, 0.21342092752456665, 0.22483095526695251, 0.23624098300933838, 0.24765101075172424, 0.2590610384941101, 0.27047106623649597, 0.28188109397888184, 0.2932911217212677, 0.30470114946365356, 0.3161112070083618, 0.3275212049484253, 0.33893126249313354, 0.3503412902355194, 0.3617513179779053, 0.37316134572029114, 0.384571373462677, 0.39598140120506287, 0.40739142894744873, 0.418801486492157, 0.43021148443222046]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 6.0, 5.0, 4.0, 5.0, 5.0, 8.0, 4.0, 8.0, 17.0, 18.0, 10.0, 21.0, 21.0, 26.0, 23.0, 34.0, 41.0, 33.0, 37.0, 46.0, 46.0, 45.0, 48.0, 36.0, 30.0, 48.0, 38.0, 37.0, 35.0, 33.0, 21.0, 28.0, 21.0, 29.0, 18.0, 14.0, 13.0, 15.0, 23.0, 10.0, 15.0, 7.0, 9.0, 1.0, 1.0, 7.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.14985984563827515, -0.14571259915828705, -0.14156536757946014, -0.13741812109947205, -0.13327087461948395, -0.12912362813949585, -0.12497639656066895, -0.12082915008068085, -0.11668191105127335, -0.11253467202186584, -0.10838742554187775, -0.10424018651247025, -0.10009294748306274, -0.09594570100307465, -0.09179846197366714, -0.08765122294425964, -0.08350397646427155, -0.07935673743486404, -0.07520949095487595, -0.07106225192546844, -0.06691500544548035, -0.06276776641607285, -0.058620527386665344, -0.054473284631967545, -0.050326041877269745, -0.046178799122571945, -0.042031556367874146, -0.037884317338466644, -0.033737074583768845, -0.029589831829071045, -0.025442590937018394, -0.021295350044965744, -0.017148107290267944, -0.01300086546689272, -0.008853623643517494, -0.004706381820142269, -0.0005591399967670441, 0.0035881027579307556, 0.007735343649983406, 0.011882584542036057, 0.016029827296733856, 0.020177070051431656, 0.024324310943484306, 0.028471551835536957, 0.032618794590234756, 0.036766037344932556, 0.04091327637434006, 0.04506051912903786, 0.04920776188373566, 0.053355004638433456, 0.057502247393131256, 0.06164948642253876, 0.06579673290252686, 0.06994397193193436, 0.07409121096134186, 0.07823845744132996, 0.08238569647073746, 0.08653293550014496, 0.09068018198013306, 0.09482742100954056, 0.09897466003894806, 0.10312190651893616, 0.10726914554834366, 0.11141638457775116, 0.11556363105773926]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 5.0, 11.0, 7.0, 11.0, 7.0, 16.0, 31.0, 64.0, 90.0, 133.0, 213.0, 350.0, 653.0, 1030.0, 2004.0, 3648.0, 7365.0, 15371.0, 36325.0, 100324.0, 486710.0, 275957.0, 67270.0, 26595.0, 11870.0, 5724.0, 2996.0, 1606.0, 869.0, 519.0, 275.0, 179.0, 111.0, 70.0, 57.0, 28.0, 22.0, 17.0, 14.0, 3.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.076416015625, -0.07376480102539062, -0.07111358642578125, -0.06846237182617188, -0.0658111572265625, -0.06315994262695312, -0.06050872802734375, -0.057857513427734375, -0.055206298828125, -0.052555084228515625, -0.04990386962890625, -0.047252655029296875, -0.0446014404296875, -0.041950225830078125, -0.03929901123046875, -0.036647796630859375, -0.03399658203125, -0.031345367431640625, -0.02869415283203125, -0.026042938232421875, -0.0233917236328125, -0.020740509033203125, -0.01808929443359375, -0.015438079833984375, -0.012786865234375, -0.010135650634765625, -0.00748443603515625, -0.004833221435546875, -0.0021820068359375, 0.000469207763671875, 0.00312042236328125, 0.005771636962890625, 0.0084228515625, 0.011074066162109375, 0.01372528076171875, 0.016376495361328125, 0.0190277099609375, 0.021678924560546875, 0.02433013916015625, 0.026981353759765625, 0.029632568359375, 0.032283782958984375, 0.03493499755859375, 0.037586212158203125, 0.0402374267578125, 0.042888641357421875, 0.04553985595703125, 0.048191070556640625, 0.05084228515625, 0.053493499755859375, 0.05614471435546875, 0.058795928955078125, 0.0614471435546875, 0.06409835815429688, 0.06674957275390625, 0.06940078735351562, 0.072052001953125, 0.07470321655273438, 0.07735443115234375, 0.08000564575195312, 0.0826568603515625, 0.08530807495117188, 0.08795928955078125, 0.09061050415039062, 0.09326171875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 0.0, 5.0, 8.0, 2.0, 3.0, 6.0, 2.0, 5.0, 13.0, 11.0, 21.0, 24.0, 22.0, 34.0, 32.0, 39.0, 40.0, 47.0, 43.0, 52.0, 71.0, 49.0, 53.0, 47.0, 51.0, 53.0, 40.0, 32.0, 32.0, 28.0, 28.0, 20.0, 18.0, 23.0, 7.0, 8.0, 11.0, 3.0, 3.0, 5.0, 2.0, 5.0, 5.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0175628662109375, -0.01695084571838379, -0.016338825225830078, -0.015726804733276367, -0.015114784240722656, -0.014502763748168945, -0.013890743255615234, -0.013278722763061523, -0.012666702270507812, -0.012054681777954102, -0.01144266128540039, -0.01083064079284668, -0.010218620300292969, -0.009606599807739258, -0.008994579315185547, -0.008382558822631836, -0.007770538330078125, -0.007158517837524414, -0.006546497344970703, -0.005934476852416992, -0.005322456359863281, -0.00471043586730957, -0.004098415374755859, -0.0034863948822021484, -0.0028743743896484375, -0.0022623538970947266, -0.0016503334045410156, -0.0010383129119873047, -0.00042629241943359375, 0.0001857280731201172, 0.0007977485656738281, 0.001409769058227539, 0.00202178955078125, 0.002633810043334961, 0.003245830535888672, 0.003857851028442383, 0.004469871520996094, 0.005081892013549805, 0.005693912506103516, 0.0063059329986572266, 0.0069179534912109375, 0.0075299739837646484, 0.00814199447631836, 0.00875401496887207, 0.009366035461425781, 0.009978055953979492, 0.010590076446533203, 0.011202096939086914, 0.011814117431640625, 0.012426137924194336, 0.013038158416748047, 0.013650178909301758, 0.014262199401855469, 0.01487421989440918, 0.01548624038696289, 0.0160982608795166, 0.016710281372070312, 0.017322301864624023, 0.017934322357177734, 0.018546342849731445, 0.019158363342285156, 0.019770383834838867, 0.020382404327392578, 0.02099442481994629, 0.0216064453125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 11.0, 9.0, 22.0, 29.0, 29.0, 32.0, 57.0, 96.0, 109.0, 197.0, 307.0, 487.0, 828.0, 1702.0, 4010.0, 11796.0, 42259.0, 194815.0, 638600.0, 110886.0, 27962.0, 8250.0, 2926.0, 1366.0, 665.0, 407.0, 213.0, 135.0, 100.0, 67.0, 43.0, 51.0, 26.0, 16.0, 9.0, 12.0, 9.0, 7.0, 2.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.08184814453125, -0.07885456085205078, -0.07586097717285156, -0.07286739349365234, -0.06987380981445312, -0.0668802261352539, -0.06388664245605469, -0.06089305877685547, -0.05789947509765625, -0.05490589141845703, -0.05191230773925781, -0.048918724060058594, -0.045925140380859375, -0.042931556701660156, -0.03993797302246094, -0.03694438934326172, -0.0339508056640625, -0.03095722198486328, -0.027963638305664062, -0.024970054626464844, -0.021976470947265625, -0.018982887268066406, -0.015989303588867188, -0.012995719909667969, -0.01000213623046875, -0.007008552551269531, -0.0040149688720703125, -0.0010213851928710938, 0.001972198486328125, 0.004965782165527344, 0.007959365844726562, 0.010952949523925781, 0.013946533203125, 0.01694011688232422, 0.019933700561523438, 0.022927284240722656, 0.025920867919921875, 0.028914451599121094, 0.03190803527832031, 0.03490161895751953, 0.03789520263671875, 0.04088878631591797, 0.04388236999511719, 0.046875953674316406, 0.049869537353515625, 0.052863121032714844, 0.05585670471191406, 0.05885028839111328, 0.0618438720703125, 0.06483745574951172, 0.06783103942871094, 0.07082462310791016, 0.07381820678710938, 0.0768117904663086, 0.07980537414550781, 0.08279895782470703, 0.08579254150390625, 0.08878612518310547, 0.09177970886230469, 0.0947732925415039, 0.09776687622070312, 0.10076045989990234, 0.10375404357910156, 0.10674762725830078, 0.1097412109375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 9.0, 9.0, 5.0, 6.0, 16.0, 15.0, 27.0, 14.0, 18.0, 23.0, 33.0, 27.0, 37.0, 40.0, 37.0, 51.0, 48.0, 58.0, 56.0, 51.0, 52.0, 51.0, 37.0, 35.0, 33.0, 31.0, 26.0, 24.0, 20.0, 18.0, 22.0, 14.0, 11.0, 6.0, 11.0, 9.0, 1.0, 3.0, 6.0, 4.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07958984375, -0.07706356048583984, -0.07453727722167969, -0.07201099395751953, -0.06948471069335938, -0.06695842742919922, -0.06443214416503906, -0.061905860900878906, -0.05937957763671875, -0.056853294372558594, -0.05432701110839844, -0.05180072784423828, -0.049274444580078125, -0.04674816131591797, -0.04422187805175781, -0.041695594787597656, -0.0391693115234375, -0.036643028259277344, -0.03411674499511719, -0.03159046173095703, -0.029064178466796875, -0.02653789520263672, -0.024011611938476562, -0.021485328674316406, -0.01895904541015625, -0.016432762145996094, -0.013906478881835938, -0.011380195617675781, -0.008853912353515625, -0.006327629089355469, -0.0038013458251953125, -0.0012750625610351562, 0.001251220703125, 0.0037775039672851562, 0.0063037872314453125, 0.008830070495605469, 0.011356353759765625, 0.013882637023925781, 0.016408920288085938, 0.018935203552246094, 0.02146148681640625, 0.023987770080566406, 0.026514053344726562, 0.02904033660888672, 0.031566619873046875, 0.03409290313720703, 0.03661918640136719, 0.039145469665527344, 0.0416717529296875, 0.044198036193847656, 0.04672431945800781, 0.04925060272216797, 0.051776885986328125, 0.05430316925048828, 0.05682945251464844, 0.059355735778808594, 0.06188201904296875, 0.0644083023071289, 0.06693458557128906, 0.06946086883544922, 0.07198715209960938, 0.07451343536376953, 0.07703971862792969, 0.07956600189208984, 0.08209228515625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 4.0, 4.0, 12.0, 11.0, 16.0, 15.0, 18.0, 36.0, 50.0, 58.0, 102.0, 166.0, 262.0, 416.0, 648.0, 1165.0, 2013.0, 3953.0, 8286.0, 19796.0, 56535.0, 376594.0, 472795.0, 65050.0, 21838.0, 9149.0, 4285.0, 2154.0, 1213.0, 695.0, 419.0, 245.0, 188.0, 113.0, 60.0, 53.0, 39.0, 22.0, 16.0, 17.0, 13.0, 8.0, 2.0, 9.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.055938720703125, -0.05424642562866211, -0.05255413055419922, -0.05086183547973633, -0.04916954040527344, -0.04747724533081055, -0.045784950256347656, -0.044092655181884766, -0.042400360107421875, -0.040708065032958984, -0.039015769958496094, -0.0373234748840332, -0.03563117980957031, -0.03393888473510742, -0.03224658966064453, -0.03055429458618164, -0.02886199951171875, -0.02716970443725586, -0.02547740936279297, -0.023785114288330078, -0.022092819213867188, -0.020400524139404297, -0.018708229064941406, -0.017015933990478516, -0.015323638916015625, -0.013631343841552734, -0.011939048767089844, -0.010246753692626953, -0.008554458618164062, -0.006862163543701172, -0.005169868469238281, -0.0034775733947753906, -0.0017852783203125, -9.298324584960938e-05, 0.0015993118286132812, 0.003291606903076172, 0.0049839019775390625, 0.006676197052001953, 0.008368492126464844, 0.010060787200927734, 0.011753082275390625, 0.013445377349853516, 0.015137672424316406, 0.016829967498779297, 0.018522262573242188, 0.020214557647705078, 0.02190685272216797, 0.02359914779663086, 0.02529144287109375, 0.02698373794555664, 0.02867603302001953, 0.030368328094482422, 0.03206062316894531, 0.0337529182434082, 0.035445213317871094, 0.037137508392333984, 0.038829803466796875, 0.040522098541259766, 0.042214393615722656, 0.04390668869018555, 0.04559898376464844, 0.04729127883911133, 0.04898357391357422, 0.05067586898803711, 0.0523681640625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 11.0, 8.0, 16.0, 37.0, 51.0, 118.0, 169.0, 198.0, 170.0, 88.0, 63.0, 28.0, 22.0, 11.0, 6.0, 4.0, 6.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.159875869750977e-05, -7.935706526041031e-05, -7.711537182331085e-05, -7.48736783862114e-05, -7.263198494911194e-05, -7.039029151201248e-05, -6.814859807491302e-05, -6.590690463781357e-05, -6.366521120071411e-05, -6.142351776361465e-05, -5.91818243265152e-05, -5.694013088941574e-05, -5.4698437452316284e-05, -5.245674401521683e-05, -5.021505057811737e-05, -4.7973357141017914e-05, -4.573166370391846e-05, -4.3489970266819e-05, -4.1248276829719543e-05, -3.900658339262009e-05, -3.676488995552063e-05, -3.452319651842117e-05, -3.2281503081321716e-05, -3.003980964422226e-05, -2.7798116207122803e-05, -2.5556422770023346e-05, -2.331472933292389e-05, -2.1073035895824432e-05, -1.8831342458724976e-05, -1.658964902162552e-05, -1.4347955584526062e-05, -1.2106262147426605e-05, -9.864568710327148e-06, -7.622875273227692e-06, -5.381181836128235e-06, -3.139488399028778e-06, -8.977949619293213e-07, 1.3438984751701355e-06, 3.5855919122695923e-06, 5.827285349369049e-06, 8.068978786468506e-06, 1.0310672223567963e-05, 1.255236566066742e-05, 1.4794059097766876e-05, 1.7035752534866333e-05, 1.927744597196579e-05, 2.1519139409065247e-05, 2.3760832846164703e-05, 2.600252628326416e-05, 2.8244219720363617e-05, 3.0485913157463074e-05, 3.272760659456253e-05, 3.496930003166199e-05, 3.7210993468761444e-05, 3.94526869058609e-05, 4.169438034296036e-05, 4.3936073780059814e-05, 4.617776721715927e-05, 4.841946065425873e-05, 5.0661154091358185e-05, 5.290284752845764e-05, 5.51445409655571e-05, 5.7386234402656555e-05, 5.962792783975601e-05, 6.186962127685547e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 3.0, 6.0, 8.0, 9.0, 14.0, 20.0, 37.0, 39.0, 83.0, 118.0, 197.0, 289.0, 454.0, 804.0, 1510.0, 2779.0, 6218.0, 16559.0, 57549.0, 568942.0, 325672.0, 43194.0, 13305.0, 5161.0, 2416.0, 1252.0, 711.0, 436.0, 251.0, 164.0, 121.0, 73.0, 41.0, 32.0, 24.0, 16.0, 12.0, 11.0, 8.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0545654296875, -0.05260944366455078, -0.05065345764160156, -0.048697471618652344, -0.046741485595703125, -0.044785499572753906, -0.04282951354980469, -0.04087352752685547, -0.03891754150390625, -0.03696155548095703, -0.03500556945800781, -0.033049583435058594, -0.031093597412109375, -0.029137611389160156, -0.027181625366210938, -0.02522563934326172, -0.0232696533203125, -0.02131366729736328, -0.019357681274414062, -0.017401695251464844, -0.015445709228515625, -0.013489723205566406, -0.011533737182617188, -0.009577751159667969, -0.00762176513671875, -0.005665779113769531, -0.0037097930908203125, -0.0017538070678710938, 0.000202178955078125, 0.0021581649780273438, 0.0041141510009765625, 0.006070137023925781, 0.008026123046875, 0.009982109069824219, 0.011938095092773438, 0.013894081115722656, 0.015850067138671875, 0.017806053161621094, 0.019762039184570312, 0.02171802520751953, 0.02367401123046875, 0.02562999725341797, 0.027585983276367188, 0.029541969299316406, 0.031497955322265625, 0.033453941345214844, 0.03540992736816406, 0.03736591339111328, 0.0393218994140625, 0.04127788543701172, 0.04323387145996094, 0.045189857482910156, 0.047145843505859375, 0.049101829528808594, 0.05105781555175781, 0.05301380157470703, 0.05496978759765625, 0.05692577362060547, 0.05888175964355469, 0.060837745666503906, 0.06279373168945312, 0.06474971771240234, 0.06670570373535156, 0.06866168975830078, 0.07061767578125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 4.0, 8.0, 9.0, 7.0, 10.0, 12.0, 25.0, 23.0, 38.0, 46.0, 75.0, 127.0, 187.0, 131.0, 87.0, 48.0, 36.0, 29.0, 24.0, 10.0, 7.0, 9.0, 8.0, 10.0, 6.0, 2.0, 3.0, 1.0, 2.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.045379638671875, -0.0439448356628418, -0.042510032653808594, -0.04107522964477539, -0.03964042663574219, -0.038205623626708984, -0.03677082061767578, -0.03533601760864258, -0.033901214599609375, -0.03246641159057617, -0.03103160858154297, -0.029596805572509766, -0.028162002563476562, -0.02672719955444336, -0.025292396545410156, -0.023857593536376953, -0.02242279052734375, -0.020987987518310547, -0.019553184509277344, -0.01811838150024414, -0.016683578491210938, -0.015248775482177734, -0.013813972473144531, -0.012379169464111328, -0.010944366455078125, -0.009509563446044922, -0.008074760437011719, -0.006639957427978516, -0.0052051544189453125, -0.0037703514099121094, -0.0023355484008789062, -0.0009007453918457031, 0.0005340576171875, 0.001968860626220703, 0.0034036636352539062, 0.004838466644287109, 0.0062732696533203125, 0.007708072662353516, 0.009142875671386719, 0.010577678680419922, 0.012012481689453125, 0.013447284698486328, 0.014882087707519531, 0.016316890716552734, 0.017751693725585938, 0.01918649673461914, 0.020621299743652344, 0.022056102752685547, 0.02349090576171875, 0.024925708770751953, 0.026360511779785156, 0.02779531478881836, 0.029230117797851562, 0.030664920806884766, 0.03209972381591797, 0.03353452682495117, 0.034969329833984375, 0.03640413284301758, 0.03783893585205078, 0.039273738861083984, 0.04070854187011719, 0.04214334487915039, 0.043578147888183594, 0.0450129508972168, 0.04644775390625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 9.0, 9.0, 54.0, 154.0, 294.0, 287.0, 149.0, 39.0, 10.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.5535879135131836, -2.5014238357543945, -2.4492597579956055, -2.3970954418182373, -2.3449313640594482, -2.292767286300659, -2.24060320854187, -2.188438892364502, -2.136274814605713, -2.084110736846924, -2.0319466590881348, -1.9797824621200562, -1.9276182651519775, -1.8754541873931885, -1.8232901096343994, -1.7711259126663208, -1.7189618349075317, -1.6667977571487427, -1.614633560180664, -1.562469482421875, -1.5103052854537964, -1.4581412076950073, -1.4059770107269287, -1.3538129329681396, -1.3016488552093506, -1.2494847774505615, -1.197320580482483, -1.1451565027236938, -1.0929923057556152, -1.0408282279968262, -0.9886640906333923, -0.9364999532699585, -0.8843357563018799, -0.832171618938446, -0.7800074815750122, -0.7278434038162231, -0.6756792068481445, -0.6235151290893555, -0.5713509917259216, -0.5191868543624878, -0.46702271699905396, -0.4148585796356201, -0.3626944422721863, -0.31053033471107483, -0.258366197347641, -0.20620205998420715, -0.1540379524230957, -0.10187381505966187, -0.04970967769622803, 0.0024544522166252136, 0.054618582129478455, 0.1067827045917511, 0.15894684195518494, 0.21111097931861877, 0.2632750868797302, 0.31543922424316406, 0.3676033616065979, 0.41976749897003174, 0.4719316363334656, 0.5240957736968994, 0.5762598514556885, 0.6284240484237671, 0.6805881261825562, 0.73275226354599, 0.7849164009094238]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 1.0, 4.0, 6.0, 4.0, 8.0, 8.0, 16.0, 17.0, 20.0, 21.0, 18.0, 35.0, 21.0, 40.0, 41.0, 38.0, 41.0, 41.0, 36.0, 42.0, 35.0, 46.0, 41.0, 51.0, 55.0, 45.0, 35.0, 43.0, 27.0, 25.0, 19.0, 21.0, 15.0, 18.0, 14.0, 10.0, 13.0, 7.0, 7.0, 6.0, 4.0, 3.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36976349353790283, -0.3567947745323181, -0.3438260555267334, -0.3308573365211487, -0.31788861751556396, -0.30491989850997925, -0.29195117950439453, -0.2789824604988098, -0.2660137414932251, -0.2530450224876404, -0.24007630348205566, -0.22710758447647095, -0.21413886547088623, -0.2011701464653015, -0.1882014274597168, -0.17523270845413208, -0.16226397454738617, -0.14929525554180145, -0.13632653653621674, -0.12335781753063202, -0.1103890985250473, -0.09742037206888199, -0.08445165306329727, -0.07148293405771255, -0.05851421505212784, -0.04554549604654312, -0.032576777040958405, -0.01960805431008339, -0.0066393353044986725, 0.006329387426376343, 0.01929810643196106, 0.032266825437545776, 0.04523554444313049, 0.05820426344871521, 0.07117298245429993, 0.08414170145988464, 0.09711042046546936, 0.11007914692163467, 0.12304786592721939, 0.1360165774822235, 0.14898529648780823, 0.16195401549339294, 0.17492273449897766, 0.18789145350456238, 0.2008601725101471, 0.2138288915157318, 0.22679761052131653, 0.23976632952690125, 0.25273507833480835, 0.26570379734039307, 0.2786725163459778, 0.2916412353515625, 0.3046099543571472, 0.31757867336273193, 0.33054739236831665, 0.34351611137390137, 0.3564848303794861, 0.3694535493850708, 0.3824222683906555, 0.39539098739624023, 0.40835970640182495, 0.42132842540740967, 0.4342971444129944, 0.4472658634185791, 0.4602345824241638]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 7.0, 4.0, 12.0, 14.0, 24.0, 31.0, 58.0, 94.0, 110.0, 175.0, 302.0, 426.0, 725.0, 1201.0, 1877.0, 3351.0, 6361.0, 12574.0, 29478.0, 88837.0, 628344.0, 3208204.0, 137802.0, 40268.0, 15863.0, 7774.0, 4062.0, 2296.0, 1425.0, 878.0, 569.0, 378.0, 258.0, 144.0, 115.0, 72.0, 58.0, 31.0, 25.0, 17.0, 13.0, 7.0, 9.0, 6.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06707763671875, -0.06477737426757812, -0.06247711181640625, -0.060176849365234375, -0.0578765869140625, -0.055576324462890625, -0.05327606201171875, -0.050975799560546875, -0.048675537109375, -0.046375274658203125, -0.04407501220703125, -0.041774749755859375, -0.0394744873046875, -0.037174224853515625, -0.03487396240234375, -0.032573699951171875, -0.0302734375, -0.027973175048828125, -0.02567291259765625, -0.023372650146484375, -0.0210723876953125, -0.018772125244140625, -0.01647186279296875, -0.014171600341796875, -0.011871337890625, -0.009571075439453125, -0.00727081298828125, -0.004970550537109375, -0.0026702880859375, -0.000370025634765625, 0.00193023681640625, 0.004230499267578125, 0.00653076171875, 0.008831024169921875, 0.01113128662109375, 0.013431549072265625, 0.0157318115234375, 0.018032073974609375, 0.02033233642578125, 0.022632598876953125, 0.024932861328125, 0.027233123779296875, 0.02953338623046875, 0.031833648681640625, 0.0341339111328125, 0.036434173583984375, 0.03873443603515625, 0.041034698486328125, 0.0433349609375, 0.045635223388671875, 0.04793548583984375, 0.050235748291015625, 0.0525360107421875, 0.054836273193359375, 0.05713653564453125, 0.059436798095703125, 0.061737060546875, 0.06403732299804688, 0.06633758544921875, 0.06863784790039062, 0.0709381103515625, 0.07323837280273438, 0.07553863525390625, 0.07783889770507812, 0.08013916015625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 7.0, 2.0, 2.0, 7.0, 6.0, 8.0, 6.0, 17.0, 14.0, 21.0, 25.0, 41.0, 35.0, 39.0, 49.0, 61.0, 39.0, 56.0, 71.0, 54.0, 57.0, 45.0, 48.0, 52.0, 44.0, 33.0, 35.0, 28.0, 18.0, 23.0, 14.0, 12.0, 11.0, 4.0, 9.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015869140625, -0.015159845352172852, -0.014450550079345703, -0.013741254806518555, -0.013031959533691406, -0.012322664260864258, -0.01161336898803711, -0.010904073715209961, -0.010194778442382812, -0.009485483169555664, -0.008776187896728516, -0.008066892623901367, -0.007357597351074219, -0.00664830207824707, -0.005939006805419922, -0.0052297115325927734, -0.004520416259765625, -0.0038111209869384766, -0.003101825714111328, -0.0023925304412841797, -0.0016832351684570312, -0.0009739398956298828, -0.0002646446228027344, 0.00044465065002441406, 0.0011539459228515625, 0.001863241195678711, 0.0025725364685058594, 0.003281831741333008, 0.003991127014160156, 0.004700422286987305, 0.005409717559814453, 0.0061190128326416016, 0.00682830810546875, 0.0075376033782958984, 0.008246898651123047, 0.008956193923950195, 0.009665489196777344, 0.010374784469604492, 0.01108407974243164, 0.011793375015258789, 0.012502670288085938, 0.013211965560913086, 0.013921260833740234, 0.014630556106567383, 0.015339851379394531, 0.01604914665222168, 0.016758441925048828, 0.017467737197875977, 0.018177032470703125, 0.018886327743530273, 0.019595623016357422, 0.02030491828918457, 0.02101421356201172, 0.021723508834838867, 0.022432804107666016, 0.023142099380493164, 0.023851394653320312, 0.02456068992614746, 0.02526998519897461, 0.025979280471801758, 0.026688575744628906, 0.027397871017456055, 0.028107166290283203, 0.02881646156311035, 0.0295257568359375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 8.0, 9.0, 20.0, 14.0, 27.0, 44.0, 59.0, 133.0, 163.0, 257.0, 449.0, 749.0, 1354.0, 2465.0, 4679.0, 9077.0, 19332.0, 47862.0, 159069.0, 2491786.0, 1240920.0, 136003.0, 42958.0, 18162.0, 8776.0, 4342.0, 2344.0, 1294.0, 765.0, 429.0, 272.0, 190.0, 76.0, 66.0, 47.0, 29.0, 21.0, 15.0, 8.0, 7.0, 0.0, 5.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.063720703125, -0.061440467834472656, -0.05916023254394531, -0.05687999725341797, -0.054599761962890625, -0.05231952667236328, -0.05003929138183594, -0.047759056091308594, -0.04547882080078125, -0.043198585510253906, -0.04091835021972656, -0.03863811492919922, -0.036357879638671875, -0.03407764434814453, -0.03179740905761719, -0.029517173767089844, -0.0272369384765625, -0.024956703186035156, -0.022676467895507812, -0.02039623260498047, -0.018115997314453125, -0.01583576202392578, -0.013555526733398438, -0.011275291442871094, -0.00899505615234375, -0.006714820861816406, -0.0044345855712890625, -0.0021543502807617188, 0.000125885009765625, 0.0024061203002929688, 0.0046863555908203125, 0.006966590881347656, 0.009246826171875, 0.011527061462402344, 0.013807296752929688, 0.01608753204345703, 0.018367767333984375, 0.02064800262451172, 0.022928237915039062, 0.025208473205566406, 0.02748870849609375, 0.029768943786621094, 0.03204917907714844, 0.03432941436767578, 0.036609649658203125, 0.03888988494873047, 0.04117012023925781, 0.043450355529785156, 0.0457305908203125, 0.048010826110839844, 0.05029106140136719, 0.05257129669189453, 0.054851531982421875, 0.05713176727294922, 0.05941200256347656, 0.061692237854003906, 0.06397247314453125, 0.0662527084350586, 0.06853294372558594, 0.07081317901611328, 0.07309341430664062, 0.07537364959716797, 0.07765388488769531, 0.07993412017822266, 0.08221435546875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 7.0, 8.0, 13.0, 15.0, 24.0, 31.0, 43.0, 65.0, 123.0, 246.0, 690.0, 1881.0, 426.0, 193.0, 91.0, 66.0, 37.0, 30.0, 21.0, 15.0, 14.0, 12.0, 8.0, 6.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.047454833984375, -0.04602956771850586, -0.04460430145263672, -0.04317903518676758, -0.04175376892089844, -0.0403285026550293, -0.038903236389160156, -0.037477970123291016, -0.036052703857421875, -0.034627437591552734, -0.033202171325683594, -0.03177690505981445, -0.030351638793945312, -0.028926372528076172, -0.02750110626220703, -0.02607583999633789, -0.02465057373046875, -0.02322530746459961, -0.02180004119873047, -0.020374774932861328, -0.018949508666992188, -0.017524242401123047, -0.016098976135253906, -0.014673709869384766, -0.013248443603515625, -0.011823177337646484, -0.010397911071777344, -0.008972644805908203, -0.0075473785400390625, -0.006122112274169922, -0.004696846008300781, -0.0032715797424316406, -0.0018463134765625, -0.0004210472106933594, 0.0010042190551757812, 0.002429485321044922, 0.0038547515869140625, 0.005280017852783203, 0.006705284118652344, 0.008130550384521484, 0.009555816650390625, 0.010981082916259766, 0.012406349182128906, 0.013831615447998047, 0.015256881713867188, 0.016682147979736328, 0.01810741424560547, 0.01953268051147461, 0.02095794677734375, 0.02238321304321289, 0.02380847930908203, 0.025233745574951172, 0.026659011840820312, 0.028084278106689453, 0.029509544372558594, 0.030934810638427734, 0.032360076904296875, 0.033785343170166016, 0.035210609436035156, 0.0366358757019043, 0.03806114196777344, 0.03948640823364258, 0.04091167449951172, 0.04233694076538086, 0.04376220703125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 10.0, 10.0, 36.0, 70.0, 130.0, 181.0, 193.0, 153.0, 111.0, 61.0, 25.0, 17.0, 5.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.14869078993797302, -0.13735340535640717, -0.1260160207748413, -0.11467864364385605, -0.10334125906229019, -0.09200387448072433, -0.08066649734973907, -0.06932911276817322, -0.05799172818660736, -0.046654343605041504, -0.035316962748765945, -0.023979581892490387, -0.01264219731092453, -0.001304812729358673, 0.010032564401626587, 0.021369948983192444, 0.0327073335647583, 0.04404471814632416, 0.055382099002599716, 0.06671947985887527, 0.07805686444044113, 0.08939424902200699, 0.10073162615299225, 0.1120690107345581, 0.12340639531612396, 0.13474377989768982, 0.14608116447925568, 0.15741854906082153, 0.1687559187412262, 0.18009331822395325, 0.1914306879043579, 0.20276807248592377, 0.21410542726516724, 0.2254428118467331, 0.23678019642829895, 0.2481175661087036, 0.25945496559143066, 0.2707923352718353, 0.28212970495224, 0.29346710443496704, 0.3048045039176941, 0.31614187359809875, 0.3274792730808258, 0.33881664276123047, 0.3501540422439575, 0.3614914119243622, 0.37282878160476685, 0.3841661810874939, 0.39550355076789856, 0.4068409204483032, 0.4181783199310303, 0.42951568961143494, 0.440853089094162, 0.45219045877456665, 0.4635278582572937, 0.47486522793769836, 0.486202597618103, 0.4975399672985077, 0.5088773369789124, 0.5202147364616394, 0.5315521359443665, 0.5428895354270935, 0.5542268753051758, 0.5655642747879028, 0.5769016742706299]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 5.0, 7.0, 8.0, 11.0, 16.0, 27.0, 34.0, 29.0, 33.0, 28.0, 35.0, 36.0, 45.0, 35.0, 52.0, 55.0, 51.0, 53.0, 62.0, 44.0, 51.0, 42.0, 45.0, 32.0, 24.0, 28.0, 23.0, 28.0, 13.0, 16.0, 10.0, 7.0, 5.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11925679445266724, -0.11501452326774597, -0.11077225208282471, -0.10652998089790344, -0.10228770971298218, -0.09804543852806091, -0.09380317479372025, -0.08956090360879898, -0.08531863242387772, -0.08107636123895645, -0.07683409005403519, -0.07259181886911392, -0.06834955513477325, -0.06410728394985199, -0.059865012764930725, -0.05562274158000946, -0.051380470395088196, -0.04713819921016693, -0.042895928025245667, -0.0386536605656147, -0.034411389380693436, -0.03016911819577217, -0.025926848873496056, -0.02168457955121994, -0.017442308366298676, -0.013200038112699986, -0.008957767859101295, -0.0047154976055026054, -0.0004732273519039154, 0.0037690438330173492, 0.008011313155293465, 0.01225358247756958, 0.016495853662490845, 0.02073812484741211, 0.024980394169688225, 0.02922266349196434, 0.033464934676885605, 0.03770720586180687, 0.041949473321437836, 0.0461917445063591, 0.050434015691280365, 0.05467628687620163, 0.058918558061122894, 0.06316082924604416, 0.06740309298038483, 0.07164536416530609, 0.07588763535022736, 0.08012990653514862, 0.08437217772006989, 0.08861444890499115, 0.09285672008991241, 0.09709899127483368, 0.10134126245975494, 0.10558353364467621, 0.10982579737901688, 0.11406806856393814, 0.1183103397488594, 0.12255261093378067, 0.12679487466812134, 0.1310371458530426, 0.13527941703796387, 0.13952168822288513, 0.1437639594078064, 0.14800623059272766, 0.15224850177764893]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 1.0, 4.0, 7.0, 9.0, 17.0, 14.0, 38.0, 38.0, 65.0, 135.0, 237.0, 476.0, 1029.0, 2567.0, 6415.0, 17366.0, 50876.0, 229459.0, 577964.0, 110242.0, 32394.0, 11485.0, 4345.0, 1759.0, 778.0, 357.0, 183.0, 99.0, 63.0, 49.0, 32.0, 14.0, 15.0, 7.0, 4.0, 3.0, 8.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07135009765625, -0.06863689422607422, -0.06592369079589844, -0.06321048736572266, -0.060497283935546875, -0.057784080505371094, -0.05507087707519531, -0.05235767364501953, -0.04964447021484375, -0.04693126678466797, -0.04421806335449219, -0.041504859924316406, -0.038791656494140625, -0.036078453063964844, -0.03336524963378906, -0.03065204620361328, -0.0279388427734375, -0.02522563934326172, -0.022512435913085938, -0.019799232482910156, -0.017086029052734375, -0.014372825622558594, -0.011659622192382812, -0.008946418762207031, -0.00623321533203125, -0.0035200119018554688, -0.0008068084716796875, 0.0019063949584960938, 0.004619598388671875, 0.007332801818847656, 0.010046005249023438, 0.012759208679199219, 0.015472412109375, 0.01818561553955078, 0.020898818969726562, 0.023612022399902344, 0.026325225830078125, 0.029038429260253906, 0.03175163269042969, 0.03446483612060547, 0.03717803955078125, 0.03989124298095703, 0.04260444641113281, 0.045317649841308594, 0.048030853271484375, 0.050744056701660156, 0.05345726013183594, 0.05617046356201172, 0.0588836669921875, 0.06159687042236328, 0.06431007385253906, 0.06702327728271484, 0.06973648071289062, 0.0724496841430664, 0.07516288757324219, 0.07787609100341797, 0.08058929443359375, 0.08330249786376953, 0.08601570129394531, 0.0887289047241211, 0.09144210815429688, 0.09415531158447266, 0.09686851501464844, 0.09958171844482422, 0.102294921875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 7.0, 4.0, 4.0, 4.0, 6.0, 4.0, 11.0, 18.0, 24.0, 17.0, 37.0, 22.0, 26.0, 37.0, 46.0, 52.0, 38.0, 49.0, 67.0, 57.0, 49.0, 49.0, 49.0, 40.0, 46.0, 32.0, 38.0, 25.0, 28.0, 17.0, 22.0, 11.0, 10.0, 16.0, 8.0, 9.0, 5.0, 7.0, 4.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0184173583984375, -0.017778873443603516, -0.01714038848876953, -0.016501903533935547, -0.015863418579101562, -0.015224933624267578, -0.014586448669433594, -0.01394796371459961, -0.013309478759765625, -0.01267099380493164, -0.012032508850097656, -0.011394023895263672, -0.010755538940429688, -0.010117053985595703, -0.009478569030761719, -0.008840084075927734, -0.00820159912109375, -0.007563114166259766, -0.006924629211425781, -0.006286144256591797, -0.0056476593017578125, -0.005009174346923828, -0.004370689392089844, -0.0037322044372558594, -0.003093719482421875, -0.0024552345275878906, -0.0018167495727539062, -0.0011782646179199219, -0.0005397796630859375, 9.870529174804688e-05, 0.0007371902465820312, 0.0013756752014160156, 0.00201416015625, 0.0026526451110839844, 0.0032911300659179688, 0.003929615020751953, 0.0045680999755859375, 0.005206584930419922, 0.005845069885253906, 0.006483554840087891, 0.007122039794921875, 0.007760524749755859, 0.008399009704589844, 0.009037494659423828, 0.009675979614257812, 0.010314464569091797, 0.010952949523925781, 0.011591434478759766, 0.01222991943359375, 0.012868404388427734, 0.013506889343261719, 0.014145374298095703, 0.014783859252929688, 0.015422344207763672, 0.016060829162597656, 0.01669931411743164, 0.017337799072265625, 0.01797628402709961, 0.018614768981933594, 0.019253253936767578, 0.019891738891601562, 0.020530223846435547, 0.02116870880126953, 0.021807193756103516, 0.0224456787109375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 5.0, 3.0, 3.0, 4.0, 7.0, 5.0, 5.0, 14.0, 11.0, 16.0, 31.0, 37.0, 58.0, 93.0, 145.0, 256.0, 464.0, 844.0, 1947.0, 4356.0, 10931.0, 29395.0, 96361.0, 629253.0, 204077.0, 43211.0, 15706.0, 6100.0, 2628.0, 1132.0, 591.0, 321.0, 186.0, 112.0, 71.0, 55.0, 34.0, 21.0, 16.0, 15.0, 10.0, 11.0, 1.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.09130859375, -0.08859825134277344, -0.08588790893554688, -0.08317756652832031, -0.08046722412109375, -0.07775688171386719, -0.07504653930664062, -0.07233619689941406, -0.0696258544921875, -0.06691551208496094, -0.06420516967773438, -0.06149482727050781, -0.05878448486328125, -0.05607414245605469, -0.053363800048828125, -0.05065345764160156, -0.047943115234375, -0.04523277282714844, -0.042522430419921875, -0.03981208801269531, -0.03710174560546875, -0.03439140319824219, -0.031681060791015625, -0.028970718383789062, -0.0262603759765625, -0.023550033569335938, -0.020839691162109375, -0.018129348754882812, -0.01541900634765625, -0.012708663940429688, -0.009998321533203125, -0.0072879791259765625, -0.00457763671875, -0.0018672943115234375, 0.000843048095703125, 0.0035533905029296875, 0.00626373291015625, 0.008974075317382812, 0.011684417724609375, 0.014394760131835938, 0.0171051025390625, 0.019815444946289062, 0.022525787353515625, 0.025236129760742188, 0.02794647216796875, 0.030656814575195312, 0.033367156982421875, 0.03607749938964844, 0.038787841796875, 0.04149818420410156, 0.044208526611328125, 0.04691886901855469, 0.04962921142578125, 0.05233955383300781, 0.055049896240234375, 0.05776023864746094, 0.0604705810546875, 0.06318092346191406, 0.06589126586914062, 0.06860160827636719, 0.07131195068359375, 0.07402229309082031, 0.07673263549804688, 0.07944297790527344, 0.0821533203125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 6.0, 7.0, 5.0, 13.0, 8.0, 16.0, 19.0, 23.0, 31.0, 46.0, 58.0, 57.0, 58.0, 66.0, 68.0, 73.0, 45.0, 57.0, 61.0, 62.0, 37.0, 38.0, 30.0, 24.0, 15.0, 22.0, 12.0, 10.0, 10.0, 6.0, 4.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11737060546875, -0.1137704849243164, -0.11017036437988281, -0.10657024383544922, -0.10297012329101562, -0.09937000274658203, -0.09576988220214844, -0.09216976165771484, -0.08856964111328125, -0.08496952056884766, -0.08136940002441406, -0.07776927947998047, -0.07416915893554688, -0.07056903839111328, -0.06696891784667969, -0.0633687973022461, -0.0597686767578125, -0.056168556213378906, -0.05256843566894531, -0.04896831512451172, -0.045368194580078125, -0.04176807403564453, -0.03816795349121094, -0.034567832946777344, -0.03096771240234375, -0.027367591857910156, -0.023767471313476562, -0.02016735076904297, -0.016567230224609375, -0.012967109680175781, -0.009366989135742188, -0.005766868591308594, -0.002166748046875, 0.0014333724975585938, 0.0050334930419921875, 0.008633613586425781, 0.012233734130859375, 0.01583385467529297, 0.019433975219726562, 0.023034095764160156, 0.02663421630859375, 0.030234336853027344, 0.03383445739746094, 0.03743457794189453, 0.041034698486328125, 0.04463481903076172, 0.04823493957519531, 0.051835060119628906, 0.0554351806640625, 0.059035301208496094, 0.06263542175292969, 0.06623554229736328, 0.06983566284179688, 0.07343578338623047, 0.07703590393066406, 0.08063602447509766, 0.08423614501953125, 0.08783626556396484, 0.09143638610839844, 0.09503650665283203, 0.09863662719726562, 0.10223674774169922, 0.10583686828613281, 0.1094369888305664, 0.113037109375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 8.0, 5.0, 16.0, 14.0, 29.0, 31.0, 61.0, 67.0, 93.0, 128.0, 217.0, 301.0, 431.0, 752.0, 1166.0, 2052.0, 3795.0, 8838.0, 23927.0, 96725.0, 689110.0, 165999.0, 32836.0, 11130.0, 4804.0, 2371.0, 1335.0, 765.0, 559.0, 333.0, 188.0, 140.0, 106.0, 71.0, 44.0, 34.0, 30.0, 18.0, 10.0, 4.0, 2.0, 8.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048675537109375, -0.047086238861083984, -0.04549694061279297, -0.04390764236450195, -0.04231834411621094, -0.04072904586791992, -0.039139747619628906, -0.03755044937133789, -0.035961151123046875, -0.03437185287475586, -0.032782554626464844, -0.031193256378173828, -0.029603958129882812, -0.028014659881591797, -0.02642536163330078, -0.024836063385009766, -0.02324676513671875, -0.021657466888427734, -0.02006816864013672, -0.018478870391845703, -0.016889572143554688, -0.015300273895263672, -0.013710975646972656, -0.01212167739868164, -0.010532379150390625, -0.00894308090209961, -0.007353782653808594, -0.005764484405517578, -0.0041751861572265625, -0.002585887908935547, -0.0009965896606445312, 0.0005927085876464844, 0.0021820068359375, 0.0037713050842285156, 0.005360603332519531, 0.006949901580810547, 0.008539199829101562, 0.010128498077392578, 0.011717796325683594, 0.01330709457397461, 0.014896392822265625, 0.01648569107055664, 0.018074989318847656, 0.019664287567138672, 0.021253585815429688, 0.022842884063720703, 0.02443218231201172, 0.026021480560302734, 0.02761077880859375, 0.029200077056884766, 0.03078937530517578, 0.0323786735534668, 0.03396797180175781, 0.03555727005004883, 0.037146568298339844, 0.03873586654663086, 0.040325164794921875, 0.04191446304321289, 0.043503761291503906, 0.04509305953979492, 0.04668235778808594, 0.04827165603637695, 0.04986095428466797, 0.051450252532958984, 0.05303955078125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 8.0, 6.0, 13.0, 17.0, 29.0, 55.0, 77.0, 111.0, 177.0, 142.0, 143.0, 91.0, 55.0, 25.0, 15.0, 7.0, 11.0, 7.0, 8.0, 8.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.036592483520508e-05, -4.874635487794876e-05, -4.7126784920692444e-05, -4.550721496343613e-05, -4.388764500617981e-05, -4.226807504892349e-05, -4.0648505091667175e-05, -3.902893513441086e-05, -3.740936517715454e-05, -3.5789795219898224e-05, -3.417022526264191e-05, -3.255065530538559e-05, -3.093108534812927e-05, -2.9311515390872955e-05, -2.7691945433616638e-05, -2.607237547636032e-05, -2.4452805519104004e-05, -2.2833235561847687e-05, -2.121366560459137e-05, -1.9594095647335052e-05, -1.7974525690078735e-05, -1.6354955732822418e-05, -1.4735385775566101e-05, -1.3115815818309784e-05, -1.1496245861053467e-05, -9.87667590379715e-06, -8.257105946540833e-06, -6.637535989284515e-06, -5.017966032028198e-06, -3.398396074771881e-06, -1.778826117515564e-06, -1.5925616025924683e-07, 1.4603137969970703e-06, 3.0798837542533875e-06, 4.699453711509705e-06, 6.319023668766022e-06, 7.938593626022339e-06, 9.558163583278656e-06, 1.1177733540534973e-05, 1.279730349779129e-05, 1.4416873455047607e-05, 1.6036443412303925e-05, 1.7656013369560242e-05, 1.927558332681656e-05, 2.0895153284072876e-05, 2.2514723241329193e-05, 2.413429319858551e-05, 2.5753863155841827e-05, 2.7373433113098145e-05, 2.899300307035446e-05, 3.061257302761078e-05, 3.2232142984867096e-05, 3.385171294212341e-05, 3.547128289937973e-05, 3.709085285663605e-05, 3.8710422813892365e-05, 4.032999277114868e-05, 4.1949562728405e-05, 4.3569132685661316e-05, 4.518870264291763e-05, 4.680827260017395e-05, 4.842784255743027e-05, 5.0047412514686584e-05, 5.16669824719429e-05, 5.328655242919922e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 10.0, 5.0, 8.0, 17.0, 22.0, 23.0, 38.0, 79.0, 114.0, 207.0, 389.0, 902.0, 2444.0, 7322.0, 34522.0, 718804.0, 254899.0, 20190.0, 5154.0, 1879.0, 792.0, 325.0, 148.0, 91.0, 58.0, 39.0, 24.0, 21.0, 7.0, 13.0, 4.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08721923828125, -0.08448123931884766, -0.08174324035644531, -0.07900524139404297, -0.07626724243164062, -0.07352924346923828, -0.07079124450683594, -0.0680532455444336, -0.06531524658203125, -0.0625772476196289, -0.05983924865722656, -0.05710124969482422, -0.054363250732421875, -0.05162525177001953, -0.04888725280761719, -0.046149253845214844, -0.0434112548828125, -0.040673255920410156, -0.03793525695800781, -0.03519725799560547, -0.032459259033203125, -0.02972126007080078, -0.026983261108398438, -0.024245262145996094, -0.02150726318359375, -0.018769264221191406, -0.016031265258789062, -0.013293266296386719, -0.010555267333984375, -0.007817268371582031, -0.0050792694091796875, -0.0023412704467773438, 0.000396728515625, 0.0031347274780273438, 0.0058727264404296875, 0.008610725402832031, 0.011348724365234375, 0.014086723327636719, 0.016824722290039062, 0.019562721252441406, 0.02230072021484375, 0.025038719177246094, 0.027776718139648438, 0.03051471710205078, 0.033252716064453125, 0.03599071502685547, 0.03872871398925781, 0.041466712951660156, 0.0442047119140625, 0.046942710876464844, 0.04968070983886719, 0.05241870880126953, 0.055156707763671875, 0.05789470672607422, 0.06063270568847656, 0.0633707046508789, 0.06610870361328125, 0.0688467025756836, 0.07158470153808594, 0.07432270050048828, 0.07706069946289062, 0.07979869842529297, 0.08253669738769531, 0.08527469635009766, 0.0880126953125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 4.0, 4.0, 9.0, 6.0, 16.0, 14.0, 22.0, 47.0, 88.0, 147.0, 211.0, 172.0, 89.0, 67.0, 32.0, 15.0, 8.0, 11.0, 4.0, 6.0, 7.0, 5.0, 1.0, 1.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.072265625, -0.07039642333984375, -0.0685272216796875, -0.06665802001953125, -0.064788818359375, -0.06291961669921875, -0.0610504150390625, -0.05918121337890625, -0.05731201171875, -0.05544281005859375, -0.0535736083984375, -0.05170440673828125, -0.049835205078125, -0.04796600341796875, -0.0460968017578125, -0.04422760009765625, -0.0423583984375, -0.04048919677734375, -0.0386199951171875, -0.03675079345703125, -0.034881591796875, -0.03301239013671875, -0.0311431884765625, -0.02927398681640625, -0.02740478515625, -0.02553558349609375, -0.0236663818359375, -0.02179718017578125, -0.019927978515625, -0.01805877685546875, -0.0161895751953125, -0.01432037353515625, -0.012451171875, -0.01058197021484375, -0.0087127685546875, -0.00684356689453125, -0.004974365234375, -0.00310516357421875, -0.0012359619140625, 0.00063323974609375, 0.00250244140625, 0.00437164306640625, 0.0062408447265625, 0.00811004638671875, 0.009979248046875, 0.01184844970703125, 0.0137176513671875, 0.01558685302734375, 0.0174560546875, 0.01932525634765625, 0.0211944580078125, 0.02306365966796875, 0.024932861328125, 0.02680206298828125, 0.0286712646484375, 0.03054046630859375, 0.03240966796875, 0.03427886962890625, 0.0361480712890625, 0.03801727294921875, 0.039886474609375, 0.04175567626953125, 0.0436248779296875, 0.04549407958984375, 0.04736328125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 7.0, 28.0, 38.0, 87.0, 158.0, 237.0, 203.0, 113.0, 84.0, 33.0, 13.0, 6.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9615683555603027, -0.9269771575927734, -0.8923859596252441, -0.8577947616577148, -0.8232035636901855, -0.7886123657226562, -0.754021167755127, -0.7194299697875977, -0.6848387718200684, -0.6502475738525391, -0.6156563758850098, -0.5810651779174805, -0.5464739799499512, -0.5118827819824219, -0.4772915840148926, -0.4427003860473633, -0.408109188079834, -0.3735179901123047, -0.3389267921447754, -0.3043355941772461, -0.2697443962097168, -0.2351531982421875, -0.2005620002746582, -0.1659708023071289, -0.1313796043395996, -0.09678840637207031, -0.062197208404541016, -0.02760601043701172, 0.006985187530517578, 0.041576385498046875, 0.07616758346557617, 0.11075878143310547, 0.14534986019134521, 0.1799410581588745, 0.2145322561264038, 0.2491234540939331, 0.2837146520614624, 0.3183058500289917, 0.352897047996521, 0.3874882459640503, 0.4220794439315796, 0.4566706418991089, 0.4912618398666382, 0.5258530378341675, 0.5604442358016968, 0.5950354337692261, 0.6296266317367554, 0.6642178297042847, 0.698809027671814, 0.7334002256393433, 0.7679914236068726, 0.8025826215744019, 0.8371738195419312, 0.8717650175094604, 0.9063562154769897, 0.940947413444519, 0.9755386114120483, 1.0101298093795776, 1.044721007347107, 1.0793122053146362, 1.1139034032821655, 1.1484946012496948, 1.1830857992172241, 1.2176769971847534, 1.2522681951522827]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 4.0, 5.0, 2.0, 8.0, 9.0, 15.0, 10.0, 19.0, 9.0, 11.0, 21.0, 23.0, 23.0, 24.0, 24.0, 35.0, 32.0, 41.0, 34.0, 42.0, 40.0, 43.0, 34.0, 39.0, 47.0, 46.0, 33.0, 43.0, 34.0, 27.0, 25.0, 23.0, 22.0, 21.0, 20.0, 23.0, 13.0, 9.0, 15.0, 8.0, 8.0, 5.0, 9.0, 4.0, 6.0, 8.0, 3.0, 0.0, 1.0, 3.0, 3.0, 0.0, 2.0], "bins": [-0.3852055072784424, -0.37379270792007446, -0.36237990856170654, -0.350967139005661, -0.3395543396472931, -0.32814154028892517, -0.31672874093055725, -0.3053159713745117, -0.2939031720161438, -0.2824903726577759, -0.27107757329940796, -0.2596648037433624, -0.2482520043849945, -0.2368392050266266, -0.22542640566825867, -0.21401362121105194, -0.20260082185268402, -0.1911880224943161, -0.17977523803710938, -0.16836243867874146, -0.15694965422153473, -0.1455368548631668, -0.13412407040596008, -0.12271127104759216, -0.11129847913980484, -0.09988568723201752, -0.0884728953242302, -0.07706010341644287, -0.06564730405807495, -0.05423451587557793, -0.042821720242500305, -0.03140892833471298, -0.01999613642692566, -0.008583343587815762, 0.002829449251294136, 0.014242243021726608, 0.02565503492951393, 0.037067826837301254, 0.048480622470378876, 0.0598934143781662, 0.07130620628595352, 0.08271899819374084, 0.09413179010152817, 0.10554458200931549, 0.11695738136768341, 0.12837016582489014, 0.13978296518325806, 0.15119576454162598, 0.1626085489988327, 0.17402134835720062, 0.18543413281440735, 0.19684693217277527, 0.208259716629982, 0.21967251598834991, 0.23108530044555664, 0.24249809980392456, 0.2539108991622925, 0.2653236985206604, 0.2767364978790283, 0.28814926743507385, 0.2995620667934418, 0.3109748661518097, 0.3223876655101776, 0.33380043506622314, 0.34521323442459106]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 7.0, 5.0, 20.0, 23.0, 21.0, 48.0, 62.0, 92.0, 168.0, 223.0, 390.0, 722.0, 1101.0, 2141.0, 4268.0, 9189.0, 22546.0, 73230.0, 644900.0, 3277758.0, 106134.0, 28944.0, 11243.0, 5045.0, 2602.0, 1341.0, 789.0, 464.0, 255.0, 189.0, 113.0, 72.0, 53.0, 33.0, 24.0, 16.0, 13.0, 6.0, 8.0, 7.0, 6.0, 4.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10296630859375, -0.09954833984375, -0.09613037109375, -0.09271240234375, -0.08929443359375, -0.08587646484375, -0.08245849609375, -0.07904052734375, -0.07562255859375, -0.07220458984375, -0.06878662109375, -0.06536865234375, -0.06195068359375, -0.05853271484375, -0.05511474609375, -0.05169677734375, -0.04827880859375, -0.04486083984375, -0.04144287109375, -0.03802490234375, -0.03460693359375, -0.03118896484375, -0.02777099609375, -0.02435302734375, -0.02093505859375, -0.01751708984375, -0.01409912109375, -0.01068115234375, -0.00726318359375, -0.00384521484375, -0.00042724609375, 0.00299072265625, 0.00640869140625, 0.00982666015625, 0.01324462890625, 0.01666259765625, 0.02008056640625, 0.02349853515625, 0.02691650390625, 0.03033447265625, 0.03375244140625, 0.03717041015625, 0.04058837890625, 0.04400634765625, 0.04742431640625, 0.05084228515625, 0.05426025390625, 0.05767822265625, 0.06109619140625, 0.06451416015625, 0.06793212890625, 0.07135009765625, 0.07476806640625, 0.07818603515625, 0.08160400390625, 0.08502197265625, 0.08843994140625, 0.09185791015625, 0.09527587890625, 0.09869384765625, 0.10211181640625, 0.10552978515625, 0.10894775390625, 0.11236572265625, 0.11578369140625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 6.0, 3.0, 10.0, 8.0, 9.0, 16.0, 14.0, 26.0, 16.0, 33.0, 28.0, 35.0, 50.0, 44.0, 56.0, 49.0, 56.0, 62.0, 53.0, 61.0, 39.0, 53.0, 49.0, 35.0, 31.0, 32.0, 29.0, 14.0, 15.0, 18.0, 4.0, 10.0, 8.0, 10.0, 8.0, 2.0, 4.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0175933837890625, -0.016881942749023438, -0.016170501708984375, -0.015459060668945312, -0.01474761962890625, -0.014036178588867188, -0.013324737548828125, -0.012613296508789062, -0.01190185546875, -0.011190414428710938, -0.010478973388671875, -0.009767532348632812, -0.00905609130859375, -0.008344650268554688, -0.007633209228515625, -0.0069217681884765625, -0.0062103271484375, -0.0054988861083984375, -0.004787445068359375, -0.0040760040283203125, -0.00336456298828125, -0.0026531219482421875, -0.001941680908203125, -0.0012302398681640625, -0.000518798828125, 0.0001926422119140625, 0.000904083251953125, 0.0016155242919921875, 0.00232696533203125, 0.0030384063720703125, 0.003749847412109375, 0.0044612884521484375, 0.0051727294921875, 0.0058841705322265625, 0.006595611572265625, 0.0073070526123046875, 0.00801849365234375, 0.008729934692382812, 0.009441375732421875, 0.010152816772460938, 0.0108642578125, 0.011575698852539062, 0.012287139892578125, 0.012998580932617188, 0.01371002197265625, 0.014421463012695312, 0.015132904052734375, 0.015844345092773438, 0.0165557861328125, 0.017267227172851562, 0.017978668212890625, 0.018690109252929688, 0.01940155029296875, 0.020112991333007812, 0.020824432373046875, 0.021535873413085938, 0.022247314453125, 0.022958755493164062, 0.023670196533203125, 0.024381637573242188, 0.02509307861328125, 0.025804519653320312, 0.026515960693359375, 0.027227401733398438, 0.0279388427734375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 7.0, 2.0, 6.0, 6.0, 12.0, 14.0, 25.0, 25.0, 31.0, 55.0, 75.0, 106.0, 162.0, 226.0, 359.0, 638.0, 1054.0, 1990.0, 3982.0, 8114.0, 18702.0, 52059.0, 209444.0, 3370290.0, 405085.0, 75245.0, 25433.0, 10554.0, 4977.0, 2340.0, 1346.0, 731.0, 445.0, 253.0, 154.0, 104.0, 67.0, 48.0, 35.0, 27.0, 17.0, 8.0, 8.0, 8.0, 9.0, 4.0, 1.0, 4.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10577392578125, -0.10232353210449219, -0.09887313842773438, -0.09542274475097656, -0.09197235107421875, -0.08852195739746094, -0.08507156372070312, -0.08162117004394531, -0.0781707763671875, -0.07472038269042969, -0.07126998901367188, -0.06781959533691406, -0.06436920166015625, -0.06091880798339844, -0.057468414306640625, -0.05401802062988281, -0.050567626953125, -0.04711723327636719, -0.043666839599609375, -0.04021644592285156, -0.03676605224609375, -0.03331565856933594, -0.029865264892578125, -0.026414871215820312, -0.0229644775390625, -0.019514083862304688, -0.016063690185546875, -0.012613296508789062, -0.00916290283203125, -0.0057125091552734375, -0.002262115478515625, 0.0011882781982421875, 0.004638671875, 0.008089065551757812, 0.011539459228515625, 0.014989852905273438, 0.01844024658203125, 0.021890640258789062, 0.025341033935546875, 0.028791427612304688, 0.0322418212890625, 0.03569221496582031, 0.039142608642578125, 0.04259300231933594, 0.04604339599609375, 0.04949378967285156, 0.052944183349609375, 0.05639457702636719, 0.059844970703125, 0.06329536437988281, 0.06674575805664062, 0.07019615173339844, 0.07364654541015625, 0.07709693908691406, 0.08054733276367188, 0.08399772644042969, 0.0874481201171875, 0.09089851379394531, 0.09434890747070312, 0.09779930114746094, 0.10124969482421875, 0.10470008850097656, 0.10815048217773438, 0.11160087585449219, 0.11505126953125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 1.0, 4.0, 6.0, 10.0, 16.0, 19.0, 41.0, 38.0, 65.0, 83.0, 134.0, 301.0, 1821.0, 895.0, 245.0, 126.0, 71.0, 50.0, 50.0, 24.0, 18.0, 8.0, 10.0, 12.0, 7.0, 2.0, 6.0, 3.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049835205078125, -0.04822063446044922, -0.04660606384277344, -0.044991493225097656, -0.043376922607421875, -0.041762351989746094, -0.04014778137207031, -0.03853321075439453, -0.03691864013671875, -0.03530406951904297, -0.03368949890136719, -0.032074928283691406, -0.030460357666015625, -0.028845787048339844, -0.027231216430664062, -0.02561664581298828, -0.0240020751953125, -0.02238750457763672, -0.020772933959960938, -0.019158363342285156, -0.017543792724609375, -0.015929222106933594, -0.014314651489257812, -0.012700080871582031, -0.01108551025390625, -0.009470939636230469, -0.007856369018554688, -0.006241798400878906, -0.004627227783203125, -0.0030126571655273438, -0.0013980865478515625, 0.00021648406982421875, 0.0018310546875, 0.0034456253051757812, 0.0050601959228515625, 0.006674766540527344, 0.008289337158203125, 0.009903907775878906, 0.011518478393554688, 0.013133049011230469, 0.01474761962890625, 0.01636219024658203, 0.017976760864257812, 0.019591331481933594, 0.021205902099609375, 0.022820472717285156, 0.024435043334960938, 0.02604961395263672, 0.0276641845703125, 0.02927875518798828, 0.030893325805664062, 0.032507896423339844, 0.034122467041015625, 0.035737037658691406, 0.03735160827636719, 0.03896617889404297, 0.04058074951171875, 0.04219532012939453, 0.04380989074707031, 0.045424461364746094, 0.047039031982421875, 0.048653602600097656, 0.05026817321777344, 0.05188274383544922, 0.053497314453125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 7.0, 5.0, 7.0, 15.0, 20.0, 53.0, 63.0, 100.0, 124.0, 144.0, 125.0, 113.0, 96.0, 51.0, 36.0, 19.0, 9.0, 14.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34678295254707336, -0.33577069640159607, -0.3247584104537964, -0.3137461543083191, -0.3027338981628418, -0.2917216420173645, -0.2807093858718872, -0.2696970999240875, -0.25868484377861023, -0.24767258763313293, -0.23666031658649445, -0.22564804553985596, -0.21463578939437866, -0.20362353324890137, -0.19261126220226288, -0.1815989911556244, -0.1705867350101471, -0.1595744788646698, -0.1485622078180313, -0.13754993677139282, -0.12653768062591553, -0.11552541702985764, -0.10451315343379974, -0.09350088983774185, -0.08248862624168396, -0.07147636264562607, -0.060464099049568176, -0.049451835453510284, -0.03843957185745239, -0.0274273082613945, -0.01641504466533661, -0.005402781069278717, 0.0056095123291015625, 0.016621775925159454, 0.027634039521217346, 0.03864630311727524, 0.04965856671333313, 0.06067083030939102, 0.07168309390544891, 0.0826953575015068, 0.0937076210975647, 0.10471988469362259, 0.11573214828968048, 0.12674441933631897, 0.13775667548179626, 0.14876893162727356, 0.15978120267391205, 0.17079347372055054, 0.18180572986602783, 0.19281798601150513, 0.20383025705814362, 0.2148425281047821, 0.2258547842502594, 0.2368670403957367, 0.24787931144237518, 0.25889158248901367, 0.26990383863449097, 0.28091609477996826, 0.29192835092544556, 0.30294063687324524, 0.31395289301872253, 0.32496514916419983, 0.3359774351119995, 0.3469896912574768, 0.3580019474029541]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 8.0, 5.0, 11.0, 8.0, 12.0, 12.0, 15.0, 13.0, 27.0, 24.0, 22.0, 22.0, 28.0, 17.0, 40.0, 29.0, 35.0, 31.0, 50.0, 41.0, 46.0, 37.0, 49.0, 33.0, 36.0, 46.0, 35.0, 27.0, 26.0, 25.0, 26.0, 28.0, 24.0, 14.0, 14.0, 13.0, 6.0, 9.0, 11.0, 5.0, 8.0, 6.0, 7.0, 7.0, 7.0, 1.0, 4.0, 0.0, 2.0], "bins": [-0.155536949634552, -0.15125305950641632, -0.14696915447711945, -0.14268526434898376, -0.1384013593196869, -0.1341174691915512, -0.12983357906341553, -0.12554967403411865, -0.12126578390598297, -0.1169818863272667, -0.11269798874855042, -0.10841409862041473, -0.10413020104169846, -0.09984630346298218, -0.0955624133348465, -0.09127851575613022, -0.08699461817741394, -0.08271072059869766, -0.07842682301998138, -0.0741429328918457, -0.06985903531312943, -0.06557513773441315, -0.06129124388098717, -0.05700735002756119, -0.05272345244884491, -0.04843955487012863, -0.04415566101670265, -0.03987176716327667, -0.035587869584560394, -0.031303972005844116, -0.027020078152418137, -0.022736182436347008, -0.01845228672027588, -0.01416839100420475, -0.009884495288133621, -0.005600599572062492, -0.0013167038559913635, 0.0029671918600797653, 0.007251087576150894, 0.011534983292222023, 0.015818879008293152, 0.02010277472436428, 0.02438667044043541, 0.02867056615650654, 0.03295446187257767, 0.037238359451293945, 0.041522253304719925, 0.045806147158145905, 0.05009004473686218, 0.05437394231557846, 0.05865783616900444, 0.06294173002243042, 0.0672256276011467, 0.07150952517986298, 0.07579341530799866, 0.08007731288671494, 0.08436121046543121, 0.08864510804414749, 0.09292900562286377, 0.09721289575099945, 0.10149679332971573, 0.105780690908432, 0.11006458103656769, 0.11434847861528397, 0.11863237619400024]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 2.0, 7.0, 5.0, 17.0, 15.0, 17.0, 29.0, 58.0, 60.0, 114.0, 142.0, 247.0, 367.0, 634.0, 1094.0, 1857.0, 3454.0, 6297.0, 11836.0, 22768.0, 43621.0, 85845.0, 183577.0, 322907.0, 184358.0, 86831.0, 43383.0, 22349.0, 11887.0, 6429.0, 3556.0, 1921.0, 1166.0, 635.0, 375.0, 266.0, 131.0, 90.0, 62.0, 46.0, 26.0, 22.0, 20.0, 14.0, 5.0, 3.0, 6.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.065673828125, -0.06371355056762695, -0.061753273010253906, -0.05979299545288086, -0.05783271789550781, -0.055872440338134766, -0.05391216278076172, -0.05195188522338867, -0.049991607666015625, -0.04803133010864258, -0.04607105255126953, -0.044110774993896484, -0.04215049743652344, -0.04019021987915039, -0.038229942321777344, -0.0362696647644043, -0.03430938720703125, -0.0323491096496582, -0.030388832092285156, -0.02842855453491211, -0.026468276977539062, -0.024507999420166016, -0.02254772186279297, -0.020587444305419922, -0.018627166748046875, -0.016666889190673828, -0.014706611633300781, -0.012746334075927734, -0.010786056518554688, -0.00882577896118164, -0.006865501403808594, -0.004905223846435547, -0.0029449462890625, -0.0009846687316894531, 0.0009756088256835938, 0.0029358863830566406, 0.0048961639404296875, 0.006856441497802734, 0.008816719055175781, 0.010776996612548828, 0.012737274169921875, 0.014697551727294922, 0.01665782928466797, 0.018618106842041016, 0.020578384399414062, 0.02253866195678711, 0.024498939514160156, 0.026459217071533203, 0.02841949462890625, 0.030379772186279297, 0.032340049743652344, 0.03430032730102539, 0.03626060485839844, 0.038220882415771484, 0.04018115997314453, 0.04214143753051758, 0.044101715087890625, 0.04606199264526367, 0.04802227020263672, 0.049982547760009766, 0.05194282531738281, 0.05390310287475586, 0.055863380432128906, 0.05782365798950195, 0.059783935546875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 8.0, 6.0, 9.0, 7.0, 13.0, 9.0, 8.0, 16.0, 23.0, 21.0, 25.0, 16.0, 30.0, 28.0, 30.0, 42.0, 52.0, 48.0, 47.0, 36.0, 49.0, 42.0, 33.0, 41.0, 28.0, 45.0, 31.0, 33.0, 34.0, 21.0, 18.0, 24.0, 24.0, 19.0, 9.0, 11.0, 12.0, 10.0, 12.0, 6.0, 2.0, 3.0, 4.0, 3.0, 3.0, 3.0, 3.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.01678466796875, -0.016205310821533203, -0.015625953674316406, -0.01504659652709961, -0.014467239379882812, -0.013887882232666016, -0.013308525085449219, -0.012729167938232422, -0.012149810791015625, -0.011570453643798828, -0.010991096496582031, -0.010411739349365234, -0.009832382202148438, -0.00925302505493164, -0.008673667907714844, -0.008094310760498047, -0.00751495361328125, -0.006935596466064453, -0.006356239318847656, -0.005776882171630859, -0.0051975250244140625, -0.004618167877197266, -0.004038810729980469, -0.003459453582763672, -0.002880096435546875, -0.002300739288330078, -0.0017213821411132812, -0.0011420249938964844, -0.0005626678466796875, 1.6689300537109375e-05, 0.0005960464477539062, 0.0011754035949707031, 0.0017547607421875, 0.002334117889404297, 0.0029134750366210938, 0.0034928321838378906, 0.0040721893310546875, 0.004651546478271484, 0.005230903625488281, 0.005810260772705078, 0.006389617919921875, 0.006968975067138672, 0.007548332214355469, 0.008127689361572266, 0.008707046508789062, 0.00928640365600586, 0.009865760803222656, 0.010445117950439453, 0.01102447509765625, 0.011603832244873047, 0.012183189392089844, 0.01276254653930664, 0.013341903686523438, 0.013921260833740234, 0.014500617980957031, 0.015079975128173828, 0.015659332275390625, 0.016238689422607422, 0.01681804656982422, 0.017397403717041016, 0.017976760864257812, 0.01855611801147461, 0.019135475158691406, 0.019714832305908203, 0.020294189453125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 8.0, 9.0, 7.0, 14.0, 21.0, 18.0, 41.0, 62.0, 69.0, 94.0, 131.0, 160.0, 267.0, 379.0, 582.0, 1014.0, 1747.0, 3596.0, 8250.0, 20084.0, 52175.0, 142129.0, 438034.0, 244519.0, 80789.0, 30855.0, 12358.0, 5111.0, 2496.0, 1252.0, 741.0, 469.0, 285.0, 201.0, 161.0, 97.0, 95.0, 66.0, 49.0, 36.0, 16.0, 25.0, 11.0, 9.0, 6.0, 10.0, 0.0, 1.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.06939697265625, -0.06698131561279297, -0.06456565856933594, -0.062150001525878906, -0.059734344482421875, -0.057318687438964844, -0.05490303039550781, -0.05248737335205078, -0.05007171630859375, -0.04765605926513672, -0.04524040222167969, -0.042824745178222656, -0.040409088134765625, -0.037993431091308594, -0.03557777404785156, -0.03316211700439453, -0.0307464599609375, -0.02833080291748047, -0.025915145874023438, -0.023499488830566406, -0.021083831787109375, -0.018668174743652344, -0.016252517700195312, -0.013836860656738281, -0.01142120361328125, -0.009005546569824219, -0.0065898895263671875, -0.004174232482910156, -0.001758575439453125, 0.0006570816040039062, 0.0030727386474609375, 0.005488395690917969, 0.007904052734375, 0.010319709777832031, 0.012735366821289062, 0.015151023864746094, 0.017566680908203125, 0.019982337951660156, 0.022397994995117188, 0.02481365203857422, 0.02722930908203125, 0.02964496612548828, 0.03206062316894531, 0.034476280212402344, 0.036891937255859375, 0.039307594299316406, 0.04172325134277344, 0.04413890838623047, 0.0465545654296875, 0.04897022247314453, 0.05138587951660156, 0.053801536560058594, 0.056217193603515625, 0.058632850646972656, 0.06104850769042969, 0.06346416473388672, 0.06587982177734375, 0.06829547882080078, 0.07071113586425781, 0.07312679290771484, 0.07554244995117188, 0.0779581069946289, 0.08037376403808594, 0.08278942108154297, 0.085205078125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 3.0, 6.0, 6.0, 11.0, 12.0, 10.0, 8.0, 18.0, 18.0, 33.0, 39.0, 31.0, 46.0, 25.0, 44.0, 44.0, 37.0, 46.0, 44.0, 46.0, 38.0, 48.0, 54.0, 21.0, 46.0, 47.0, 39.0, 29.0, 20.0, 27.0, 17.0, 10.0, 13.0, 13.0, 14.0, 9.0, 4.0, 5.0, 7.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1044921875, -0.10136032104492188, -0.09822845458984375, -0.09509658813476562, -0.0919647216796875, -0.08883285522460938, -0.08570098876953125, -0.08256912231445312, -0.079437255859375, -0.07630538940429688, -0.07317352294921875, -0.07004165649414062, -0.0669097900390625, -0.06377792358398438, -0.06064605712890625, -0.057514190673828125, -0.05438232421875, -0.051250457763671875, -0.04811859130859375, -0.044986724853515625, -0.0418548583984375, -0.038722991943359375, -0.03559112548828125, -0.032459259033203125, -0.029327392578125, -0.026195526123046875, -0.02306365966796875, -0.019931793212890625, -0.0167999267578125, -0.013668060302734375, -0.01053619384765625, -0.007404327392578125, -0.0042724609375, -0.001140594482421875, 0.00199127197265625, 0.005123138427734375, 0.0082550048828125, 0.011386871337890625, 0.01451873779296875, 0.017650604248046875, 0.020782470703125, 0.023914337158203125, 0.02704620361328125, 0.030178070068359375, 0.0333099365234375, 0.036441802978515625, 0.03957366943359375, 0.042705535888671875, 0.04583740234375, 0.048969268798828125, 0.05210113525390625, 0.055233001708984375, 0.0583648681640625, 0.061496734619140625, 0.06462860107421875, 0.06776046752929688, 0.070892333984375, 0.07402420043945312, 0.07715606689453125, 0.08028793334960938, 0.0834197998046875, 0.08655166625976562, 0.08968353271484375, 0.09281539916992188, 0.095947265625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 5.0, 3.0, 6.0, 12.0, 13.0, 23.0, 33.0, 57.0, 109.0, 238.0, 507.0, 1266.0, 3743.0, 13626.0, 68414.0, 421708.0, 446997.0, 71331.0, 14383.0, 3790.0, 1331.0, 487.0, 220.0, 104.0, 69.0, 39.0, 20.0, 7.0, 9.0, 6.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07391357421875, -0.07160472869873047, -0.06929588317871094, -0.0669870376586914, -0.06467819213867188, -0.062369346618652344, -0.06006050109863281, -0.05775165557861328, -0.05544281005859375, -0.05313396453857422, -0.05082511901855469, -0.048516273498535156, -0.046207427978515625, -0.043898582458496094, -0.04158973693847656, -0.03928089141845703, -0.0369720458984375, -0.03466320037841797, -0.03235435485839844, -0.030045509338378906, -0.027736663818359375, -0.025427818298339844, -0.023118972778320312, -0.02081012725830078, -0.01850128173828125, -0.01619243621826172, -0.013883590698242188, -0.011574745178222656, -0.009265899658203125, -0.006957054138183594, -0.0046482086181640625, -0.0023393630981445312, -3.0517578125e-05, 0.0022783279418945312, 0.0045871734619140625, 0.006896018981933594, 0.009204864501953125, 0.011513710021972656, 0.013822555541992188, 0.01613140106201172, 0.01844024658203125, 0.02074909210205078, 0.023057937622070312, 0.025366783142089844, 0.027675628662109375, 0.029984474182128906, 0.03229331970214844, 0.03460216522216797, 0.0369110107421875, 0.03921985626220703, 0.04152870178222656, 0.043837547302246094, 0.046146392822265625, 0.048455238342285156, 0.05076408386230469, 0.05307292938232422, 0.05538177490234375, 0.05769062042236328, 0.05999946594238281, 0.062308311462402344, 0.06461715698242188, 0.0669260025024414, 0.06923484802246094, 0.07154369354248047, 0.0738525390625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 9.0, 11.0, 14.0, 20.0, 14.0, 21.0, 30.0, 37.0, 56.0, 68.0, 98.0, 91.0, 87.0, 94.0, 69.0, 61.0, 66.0, 36.0, 24.0, 22.0, 16.0, 14.0, 8.0, 9.0, 6.0, 9.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.170967102050781e-05, -3.06982547044754e-05, -2.9686838388442993e-05, -2.8675422072410583e-05, -2.7664005756378174e-05, -2.6652589440345764e-05, -2.5641173124313354e-05, -2.4629756808280945e-05, -2.3618340492248535e-05, -2.2606924176216125e-05, -2.1595507860183716e-05, -2.0584091544151306e-05, -1.9572675228118896e-05, -1.8561258912086487e-05, -1.7549842596054077e-05, -1.6538426280021667e-05, -1.5527009963989258e-05, -1.4515593647956848e-05, -1.3504177331924438e-05, -1.2492761015892029e-05, -1.1481344699859619e-05, -1.046992838382721e-05, -9.4585120677948e-06, -8.44709575176239e-06, -7.4356794357299805e-06, -6.424263119697571e-06, -5.412846803665161e-06, -4.4014304876327515e-06, -3.390014171600342e-06, -2.378597855567932e-06, -1.3671815395355225e-06, -3.557652235031128e-07, 6.556510925292969e-07, 1.6670674085617065e-06, 2.678483724594116e-06, 3.689900040626526e-06, 4.7013163566589355e-06, 5.712732672691345e-06, 6.724148988723755e-06, 7.735565304756165e-06, 8.746981620788574e-06, 9.758397936820984e-06, 1.0769814252853394e-05, 1.1781230568885803e-05, 1.2792646884918213e-05, 1.3804063200950623e-05, 1.4815479516983032e-05, 1.5826895833015442e-05, 1.683831214904785e-05, 1.784972846508026e-05, 1.886114478111267e-05, 1.987256109714508e-05, 2.088397741317749e-05, 2.18953937292099e-05, 2.290681004524231e-05, 2.391822636127472e-05, 2.492964267730713e-05, 2.594105899333954e-05, 2.6952475309371948e-05, 2.7963891625404358e-05, 2.8975307941436768e-05, 2.9986724257469177e-05, 3.099814057350159e-05, 3.2009556889533997e-05, 3.3020973205566406e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 6.0, 6.0, 9.0, 20.0, 42.0, 88.0, 210.0, 497.0, 1423.0, 5322.0, 36800.0, 470600.0, 487388.0, 38337.0, 5493.0, 1454.0, 502.0, 193.0, 74.0, 36.0, 21.0, 15.0, 9.0, 7.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12078857421875, -0.11733818054199219, -0.11388778686523438, -0.11043739318847656, -0.10698699951171875, -0.10353660583496094, -0.10008621215820312, -0.09663581848144531, -0.0931854248046875, -0.08973503112792969, -0.08628463745117188, -0.08283424377441406, -0.07938385009765625, -0.07593345642089844, -0.07248306274414062, -0.06903266906738281, -0.065582275390625, -0.06213188171386719, -0.058681488037109375, -0.05523109436035156, -0.05178070068359375, -0.04833030700683594, -0.044879913330078125, -0.04142951965332031, -0.0379791259765625, -0.03452873229980469, -0.031078338623046875, -0.027627944946289062, -0.02417755126953125, -0.020727157592773438, -0.017276763916015625, -0.013826370239257812, -0.0103759765625, -0.0069255828857421875, -0.003475189208984375, -2.47955322265625e-05, 0.00342559814453125, 0.0068759918212890625, 0.010326385498046875, 0.013776779174804688, 0.0172271728515625, 0.020677566528320312, 0.024127960205078125, 0.027578353881835938, 0.03102874755859375, 0.03447914123535156, 0.037929534912109375, 0.04137992858886719, 0.044830322265625, 0.04828071594238281, 0.051731109619140625, 0.05518150329589844, 0.05863189697265625, 0.06208229064941406, 0.06553268432617188, 0.06898307800292969, 0.0724334716796875, 0.07588386535644531, 0.07933425903320312, 0.08278465270996094, 0.08623504638671875, 0.08968544006347656, 0.09313583374023438, 0.09658622741699219, 0.10003662109375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 4.0, 5.0, 11.0, 8.0, 15.0, 17.0, 29.0, 30.0, 45.0, 48.0, 67.0, 98.0, 119.0, 132.0, 100.0, 55.0, 46.0, 43.0, 39.0, 22.0, 13.0, 13.0, 15.0, 13.0, 7.0, 3.0, 7.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.07861328125, -0.07664871215820312, -0.07468414306640625, -0.07271957397460938, -0.0707550048828125, -0.06879043579101562, -0.06682586669921875, -0.06486129760742188, -0.062896728515625, -0.060932159423828125, -0.05896759033203125, -0.057003021240234375, -0.0550384521484375, -0.053073883056640625, -0.05110931396484375, -0.049144744873046875, -0.04718017578125, -0.045215606689453125, -0.04325103759765625, -0.041286468505859375, -0.0393218994140625, -0.037357330322265625, -0.03539276123046875, -0.033428192138671875, -0.031463623046875, -0.029499053955078125, -0.02753448486328125, -0.025569915771484375, -0.0236053466796875, -0.021640777587890625, -0.01967620849609375, -0.017711639404296875, -0.0157470703125, -0.013782501220703125, -0.01181793212890625, -0.009853363037109375, -0.0078887939453125, -0.005924224853515625, -0.00395965576171875, -0.001995086669921875, -3.0517578125e-05, 0.001934051513671875, 0.00389862060546875, 0.005863189697265625, 0.0078277587890625, 0.009792327880859375, 0.01175689697265625, 0.013721466064453125, 0.01568603515625, 0.017650604248046875, 0.01961517333984375, 0.021579742431640625, 0.0235443115234375, 0.025508880615234375, 0.02747344970703125, 0.029438018798828125, 0.031402587890625, 0.033367156982421875, 0.03533172607421875, 0.037296295166015625, 0.0392608642578125, 0.041225433349609375, 0.04319000244140625, 0.045154571533203125, 0.047119140625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 16.0, 55.0, 169.0, 296.0, 288.0, 130.0, 39.0, 11.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9571785926818848, -2.8942370414733887, -2.8312954902648926, -2.7683537006378174, -2.7054121494293213, -2.642470598220825, -2.57952880859375, -2.516587257385254, -2.453645706176758, -2.3907041549682617, -2.3277626037597656, -2.2648208141326904, -2.2018792629241943, -2.1389377117156982, -2.075995922088623, -2.013054370880127, -1.9501128196716309, -1.8871712684631348, -1.8242295980453491, -1.7612879276275635, -1.6983463764190674, -1.6354048252105713, -1.5724631547927856, -1.509521484375, -1.446579933166504, -1.3836383819580078, -1.3206967115402222, -1.2577550411224365, -1.1948134899139404, -1.1318719387054443, -1.0689302682876587, -1.005988597869873, -0.9430468082427979, -0.880105197429657, -0.8171635866165161, -0.7542219758033752, -0.6912803649902344, -0.6283387541770935, -0.5653971433639526, -0.5024555325508118, -0.4395139217376709, -0.37657231092453003, -0.31363070011138916, -0.2506890892982483, -0.18774747848510742, -0.12480586767196655, -0.061864256858825684, 0.0010773539543151855, 0.06401896476745605, 0.12696057558059692, 0.1899021863937378, 0.25284379720687866, 0.31578540802001953, 0.3787270188331604, 0.44166862964630127, 0.5046102404594421, 0.567551851272583, 0.6304934620857239, 0.6934350728988647, 0.7563766837120056, 0.8193182945251465, 0.8822599053382874, 0.9452015161514282, 1.0081431865692139, 1.07108473777771]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 6.0, 9.0, 5.0, 14.0, 16.0, 14.0, 20.0, 19.0, 22.0, 31.0, 34.0, 38.0, 37.0, 23.0, 47.0, 40.0, 62.0, 64.0, 55.0, 30.0, 53.0, 41.0, 29.0, 38.0, 39.0, 28.0, 27.0, 24.0, 20.0, 13.0, 16.0, 13.0, 11.0, 12.0, 10.0, 6.0, 8.0, 4.0, 4.0, 6.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.5803826451301575, -0.5642767548561096, -0.548170804977417, -0.5320649147033691, -0.5159590244293213, -0.49985307455062866, -0.4837471842765808, -0.46764126420021057, -0.45153534412384033, -0.4354294240474701, -0.41932350397109985, -0.403217613697052, -0.38711169362068176, -0.3710057735443115, -0.35489988327026367, -0.33879396319389343, -0.3226880431175232, -0.30658212304115295, -0.2904762029647827, -0.27437031269073486, -0.2582643926143646, -0.24215847253799438, -0.22605256736278534, -0.2099466621875763, -0.19384074211120605, -0.17773482203483582, -0.16162891685962677, -0.14552301168441772, -0.12941709160804749, -0.11331117898225784, -0.0972052663564682, -0.08109935373067856, -0.06499338150024414, -0.0488874688744545, -0.032781556248664856, -0.016675643622875214, -0.0005697309970855713, 0.015536181628704071, 0.03164209425449371, 0.047748006880283356, 0.063853919506073, 0.07995983213186264, 0.09606574475765228, 0.11217165738344193, 0.12827757000923157, 0.1443834900856018, 0.16048939526081085, 0.1765953004360199, 0.19270122051239014, 0.20880714058876038, 0.22491304576396942, 0.24101895093917847, 0.2571248710155487, 0.27323079109191895, 0.2893366813659668, 0.30544260144233704, 0.3215485215187073, 0.3376544415950775, 0.35376036167144775, 0.3698662519454956, 0.38597217202186584, 0.4020780920982361, 0.41818398237228394, 0.4342899024486542, 0.4503958225250244]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 4.0, 6.0, 9.0, 13.0, 11.0, 18.0, 37.0, 54.0, 83.0, 122.0, 183.0, 295.0, 513.0, 961.0, 1773.0, 3700.0, 7951.0, 20058.0, 66287.0, 559884.0, 3360481.0, 120431.0, 29728.0, 11248.0, 5066.0, 2376.0, 1243.0, 664.0, 394.0, 228.0, 159.0, 78.0, 68.0, 54.0, 31.0, 15.0, 15.0, 10.0, 7.0, 7.0, 4.0, 4.0, 5.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.1329345703125, -0.12904644012451172, -0.12515830993652344, -0.12127017974853516, -0.11738204956054688, -0.1134939193725586, -0.10960578918457031, -0.10571765899658203, -0.10182952880859375, -0.09794139862060547, -0.09405326843261719, -0.0901651382446289, -0.08627700805664062, -0.08238887786865234, -0.07850074768066406, -0.07461261749267578, -0.0707244873046875, -0.06683635711669922, -0.06294822692871094, -0.059060096740722656, -0.055171966552734375, -0.051283836364746094, -0.04739570617675781, -0.04350757598876953, -0.03961944580078125, -0.03573131561279297, -0.03184318542480469, -0.027955055236816406, -0.024066925048828125, -0.020178794860839844, -0.016290664672851562, -0.012402534484863281, -0.008514404296875, -0.004626274108886719, -0.0007381439208984375, 0.0031499862670898438, 0.007038116455078125, 0.010926246643066406, 0.014814376831054688, 0.01870250701904297, 0.02259063720703125, 0.02647876739501953, 0.030366897583007812, 0.034255027770996094, 0.038143157958984375, 0.042031288146972656, 0.04591941833496094, 0.04980754852294922, 0.0536956787109375, 0.05758380889892578, 0.06147193908691406, 0.06536006927490234, 0.06924819946289062, 0.0731363296508789, 0.07702445983886719, 0.08091259002685547, 0.08480072021484375, 0.08868885040283203, 0.09257698059082031, 0.0964651107788086, 0.10035324096679688, 0.10424137115478516, 0.10812950134277344, 0.11201763153076172, 0.11590576171875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 6.0, 3.0, 1.0, 12.0, 7.0, 6.0, 14.0, 19.0, 19.0, 14.0, 19.0, 24.0, 26.0, 30.0, 29.0, 47.0, 40.0, 46.0, 46.0, 39.0, 46.0, 51.0, 46.0, 46.0, 49.0, 39.0, 36.0, 33.0, 28.0, 23.0, 19.0, 18.0, 22.0, 16.0, 15.0, 18.0, 10.0, 5.0, 11.0, 6.0, 6.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0202484130859375, -0.019598960876464844, -0.018949508666992188, -0.01830005645751953, -0.017650604248046875, -0.01700115203857422, -0.016351699829101562, -0.015702247619628906, -0.01505279541015625, -0.014403343200683594, -0.013753890991210938, -0.013104438781738281, -0.012454986572265625, -0.011805534362792969, -0.011156082153320312, -0.010506629943847656, -0.009857177734375, -0.009207725524902344, -0.008558273315429688, -0.007908821105957031, -0.007259368896484375, -0.006609916687011719, -0.0059604644775390625, -0.005311012268066406, -0.00466156005859375, -0.004012107849121094, -0.0033626556396484375, -0.0027132034301757812, -0.002063751220703125, -0.0014142990112304688, -0.0007648468017578125, -0.00011539459228515625, 0.0005340576171875, 0.0011835098266601562, 0.0018329620361328125, 0.0024824142456054688, 0.003131866455078125, 0.0037813186645507812, 0.0044307708740234375, 0.005080223083496094, 0.00572967529296875, 0.006379127502441406, 0.0070285797119140625, 0.007678031921386719, 0.008327484130859375, 0.008976936340332031, 0.009626388549804688, 0.010275840759277344, 0.01092529296875, 0.011574745178222656, 0.012224197387695312, 0.012873649597167969, 0.013523101806640625, 0.014172554016113281, 0.014822006225585938, 0.015471458435058594, 0.01612091064453125, 0.016770362854003906, 0.017419815063476562, 0.01806926727294922, 0.018718719482421875, 0.01936817169189453, 0.020017623901367188, 0.020667076110839844, 0.0213165283203125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 5.0, 4.0, 8.0, 8.0, 13.0, 11.0, 22.0, 30.0, 55.0, 84.0, 109.0, 167.0, 237.0, 383.0, 598.0, 929.0, 1514.0, 2777.0, 4890.0, 9556.0, 19342.0, 44536.0, 128447.0, 735094.0, 2885973.0, 235744.0, 68278.0, 27427.0, 12777.0, 6426.0, 3490.0, 2047.0, 1243.0, 689.0, 471.0, 296.0, 193.0, 139.0, 85.0, 70.0, 32.0, 29.0, 15.0, 15.0, 14.0, 4.0, 8.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.09649658203125, -0.09367656707763672, -0.09085655212402344, -0.08803653717041016, -0.08521652221679688, -0.0823965072631836, -0.07957649230957031, -0.07675647735595703, -0.07393646240234375, -0.07111644744873047, -0.06829643249511719, -0.0654764175415039, -0.06265640258789062, -0.059836387634277344, -0.05701637268066406, -0.05419635772705078, -0.0513763427734375, -0.04855632781982422, -0.04573631286621094, -0.042916297912597656, -0.040096282958984375, -0.037276268005371094, -0.03445625305175781, -0.03163623809814453, -0.02881622314453125, -0.02599620819091797, -0.023176193237304688, -0.020356178283691406, -0.017536163330078125, -0.014716148376464844, -0.011896133422851562, -0.009076118469238281, -0.006256103515625, -0.0034360885620117188, -0.0006160736083984375, 0.0022039413452148438, 0.005023956298828125, 0.007843971252441406, 0.010663986206054688, 0.013484001159667969, 0.01630401611328125, 0.01912403106689453, 0.021944046020507812, 0.024764060974121094, 0.027584075927734375, 0.030404090881347656, 0.03322410583496094, 0.03604412078857422, 0.0388641357421875, 0.04168415069580078, 0.04450416564941406, 0.047324180603027344, 0.050144195556640625, 0.052964210510253906, 0.05578422546386719, 0.05860424041748047, 0.06142425537109375, 0.06424427032470703, 0.06706428527832031, 0.0698843002319336, 0.07270431518554688, 0.07552433013916016, 0.07834434509277344, 0.08116436004638672, 0.083984375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 3.0, 10.0, 4.0, 11.0, 11.0, 16.0, 20.0, 25.0, 31.0, 44.0, 60.0, 100.0, 170.0, 296.0, 835.0, 1449.0, 369.0, 187.0, 121.0, 94.0, 53.0, 37.0, 30.0, 21.0, 12.0, 18.0, 7.0, 8.0, 6.0, 1.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.052764892578125, -0.05112457275390625, -0.0494842529296875, -0.04784393310546875, -0.04620361328125, -0.04456329345703125, -0.0429229736328125, -0.04128265380859375, -0.039642333984375, -0.03800201416015625, -0.0363616943359375, -0.03472137451171875, -0.0330810546875, -0.03144073486328125, -0.0298004150390625, -0.02816009521484375, -0.026519775390625, -0.02487945556640625, -0.0232391357421875, -0.02159881591796875, -0.01995849609375, -0.01831817626953125, -0.0166778564453125, -0.01503753662109375, -0.013397216796875, -0.01175689697265625, -0.0101165771484375, -0.00847625732421875, -0.0068359375, -0.00519561767578125, -0.0035552978515625, -0.00191497802734375, -0.000274658203125, 0.00136566162109375, 0.0030059814453125, 0.00464630126953125, 0.00628662109375, 0.00792694091796875, 0.0095672607421875, 0.01120758056640625, 0.012847900390625, 0.01448822021484375, 0.0161285400390625, 0.01776885986328125, 0.0194091796875, 0.02104949951171875, 0.0226898193359375, 0.02433013916015625, 0.025970458984375, 0.02761077880859375, 0.0292510986328125, 0.03089141845703125, 0.03253173828125, 0.03417205810546875, 0.0358123779296875, 0.03745269775390625, 0.039093017578125, 0.04073333740234375, 0.0423736572265625, 0.04401397705078125, 0.045654296875, 0.04729461669921875, 0.0489349365234375, 0.05057525634765625, 0.052215576171875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 6.0, 4.0, 10.0, 12.0, 25.0, 36.0, 32.0, 48.0, 65.0, 85.0, 98.0, 107.0, 90.0, 93.0, 76.0, 68.0, 51.0, 22.0, 20.0, 13.0, 13.0, 12.0, 7.0, 3.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34757858514785767, -0.33721330761909485, -0.32684803009033203, -0.3164827227592468, -0.306117445230484, -0.2957521677017212, -0.285386860370636, -0.27502158284187317, -0.26465630531311035, -0.25429102778434753, -0.24392573535442352, -0.2335604429244995, -0.2231951653957367, -0.21282988786697388, -0.20246459543704987, -0.19209930300712585, -0.18173402547836304, -0.17136874794960022, -0.1610034555196762, -0.1506381630897522, -0.14027288556098938, -0.12990760803222656, -0.11954231560230255, -0.10917703062295914, -0.09881174564361572, -0.08844646066427231, -0.0780811756849289, -0.06771589070558548, -0.057350605726242065, -0.04698532074689865, -0.03662003576755524, -0.026254750788211823, -0.015889465808868408, -0.005524180829524994, 0.00484110414981842, 0.015206389129161835, 0.02557167410850525, 0.03593695908784866, 0.04630224406719208, 0.05666752904653549, 0.0670328140258789, 0.07739809900522232, 0.08776338398456573, 0.09812866896390915, 0.10849395394325256, 0.11885923892259598, 0.1292245239019394, 0.1395898163318634, 0.14995509386062622, 0.16032037138938904, 0.17068566381931305, 0.18105095624923706, 0.19141623377799988, 0.2017815113067627, 0.2121468037366867, 0.22251209616661072, 0.23287737369537354, 0.24324265122413635, 0.25360792875289917, 0.2639732360839844, 0.2743385136127472, 0.28470379114151, 0.2950690984725952, 0.30543437600135803, 0.31579965353012085]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 5.0, 5.0, 8.0, 5.0, 14.0, 14.0, 13.0, 16.0, 18.0, 21.0, 21.0, 25.0, 23.0, 28.0, 43.0, 36.0, 43.0, 33.0, 48.0, 38.0, 45.0, 47.0, 46.0, 46.0, 40.0, 42.0, 38.0, 25.0, 41.0, 30.0, 23.0, 21.0, 27.0, 17.0, 11.0, 11.0, 7.0, 11.0, 9.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19329124689102173, -0.18715421855449677, -0.1810171753168106, -0.17488014698028564, -0.1687431037425995, -0.16260607540607452, -0.15646904706954956, -0.1503320038318634, -0.14419497549533844, -0.13805794715881348, -0.13192090392112732, -0.12578387558460236, -0.1196468397974968, -0.11350980401039124, -0.10737277567386627, -0.10123573988676071, -0.09509870409965515, -0.08896166831254959, -0.08282463252544403, -0.07668760418891907, -0.07055056840181351, -0.06441353261470795, -0.058276500552892685, -0.05213946849107742, -0.04600243270397186, -0.0398653969168663, -0.03372836485505104, -0.02759133093059063, -0.02145429700613022, -0.015317263081669807, -0.009180229157209396, -0.0030431970953941345, 0.0030938386917114258, 0.009230872616171837, 0.015367906540632248, 0.02150494046509266, 0.02764197438955307, 0.03377901017665863, 0.03991604223847389, 0.046053074300289154, 0.052190110087394714, 0.058327145874500275, 0.06446418166160583, 0.0706012099981308, 0.07673824578523636, 0.08287528157234192, 0.08901230990886688, 0.09514934569597244, 0.101286381483078, 0.10742341727018356, 0.11356045305728912, 0.11969748139381409, 0.12583452463150024, 0.1319715529680252, 0.13810858130455017, 0.14424562454223633, 0.1503826528787613, 0.15651968121528625, 0.1626567244529724, 0.16879375278949738, 0.17493078112602234, 0.1810678243637085, 0.18720485270023346, 0.19334188103675842, 0.19947892427444458]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 3.0, 11.0, 13.0, 21.0, 23.0, 32.0, 64.0, 55.0, 124.0, 178.0, 266.0, 336.0, 620.0, 957.0, 1557.0, 2701.0, 4777.0, 8416.0, 15406.0, 29094.0, 55342.0, 106444.0, 187080.0, 238217.0, 180998.0, 101298.0, 52842.0, 27695.0, 14829.0, 8051.0, 4467.0, 2536.0, 1538.0, 901.0, 555.0, 378.0, 241.0, 167.0, 101.0, 65.0, 50.0, 32.0, 30.0, 9.0, 8.0, 6.0, 7.0, 5.0, 4.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.051971435546875, -0.05026531219482422, -0.04855918884277344, -0.046853065490722656, -0.045146942138671875, -0.043440818786621094, -0.04173469543457031, -0.04002857208251953, -0.03832244873046875, -0.03661632537841797, -0.03491020202636719, -0.033204078674316406, -0.031497955322265625, -0.029791831970214844, -0.028085708618164062, -0.02637958526611328, -0.0246734619140625, -0.02296733856201172, -0.021261215209960938, -0.019555091857910156, -0.017848968505859375, -0.016142845153808594, -0.014436721801757812, -0.012730598449707031, -0.01102447509765625, -0.009318351745605469, -0.0076122283935546875, -0.005906105041503906, -0.004199981689453125, -0.0024938583374023438, -0.0007877349853515625, 0.0009183883666992188, 0.00262451171875, 0.004330635070800781, 0.0060367584228515625, 0.007742881774902344, 0.009449005126953125, 0.011155128479003906, 0.012861251831054688, 0.014567375183105469, 0.01627349853515625, 0.01797962188720703, 0.019685745239257812, 0.021391868591308594, 0.023097991943359375, 0.024804115295410156, 0.026510238647460938, 0.02821636199951172, 0.0299224853515625, 0.03162860870361328, 0.03333473205566406, 0.035040855407714844, 0.036746978759765625, 0.038453102111816406, 0.04015922546386719, 0.04186534881591797, 0.04357147216796875, 0.04527759552001953, 0.04698371887207031, 0.048689842224121094, 0.050395965576171875, 0.052102088928222656, 0.05380821228027344, 0.05551433563232422, 0.057220458984375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 3.0, 6.0, 15.0, 9.0, 13.0, 22.0, 13.0, 19.0, 24.0, 17.0, 34.0, 31.0, 37.0, 44.0, 44.0, 47.0, 35.0, 46.0, 43.0, 42.0, 51.0, 42.0, 49.0, 40.0, 51.0, 34.0, 25.0, 25.0, 22.0, 19.0, 15.0, 18.0, 16.0, 11.0, 16.0, 6.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0222930908203125, -0.021569252014160156, -0.020845413208007812, -0.02012157440185547, -0.019397735595703125, -0.01867389678955078, -0.017950057983398438, -0.017226219177246094, -0.01650238037109375, -0.015778541564941406, -0.015054702758789062, -0.014330863952636719, -0.013607025146484375, -0.012883186340332031, -0.012159347534179688, -0.011435508728027344, -0.010711669921875, -0.009987831115722656, -0.009263992309570312, -0.008540153503417969, -0.007816314697265625, -0.007092475891113281, -0.0063686370849609375, -0.005644798278808594, -0.00492095947265625, -0.004197120666503906, -0.0034732818603515625, -0.0027494430541992188, -0.002025604248046875, -0.0013017654418945312, -0.0005779266357421875, 0.00014591217041015625, 0.0008697509765625, 0.0015935897827148438, 0.0023174285888671875, 0.0030412673950195312, 0.003765106201171875, 0.004488945007324219, 0.0052127838134765625, 0.005936622619628906, 0.00666046142578125, 0.007384300231933594, 0.008108139038085938, 0.008831977844238281, 0.009555816650390625, 0.010279655456542969, 0.011003494262695312, 0.011727333068847656, 0.012451171875, 0.013175010681152344, 0.013898849487304688, 0.014622688293457031, 0.015346527099609375, 0.01607036590576172, 0.016794204711914062, 0.017518043518066406, 0.01824188232421875, 0.018965721130371094, 0.019689559936523438, 0.02041339874267578, 0.021137237548828125, 0.02186107635498047, 0.022584915161132812, 0.023308753967285156, 0.0240325927734375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 8.0, 5.0, 7.0, 8.0, 16.0, 17.0, 32.0, 35.0, 53.0, 114.0, 179.0, 321.0, 570.0, 1306.0, 3688.0, 14089.0, 67398.0, 371853.0, 471403.0, 91228.0, 18330.0, 4734.0, 1641.0, 695.0, 326.0, 190.0, 118.0, 72.0, 36.0, 39.0, 16.0, 12.0, 6.0, 7.0, 2.0, 6.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1307373046875, -0.1266632080078125, -0.122589111328125, -0.1185150146484375, -0.11444091796875, -0.1103668212890625, -0.106292724609375, -0.1022186279296875, -0.09814453125, -0.0940704345703125, -0.089996337890625, -0.0859222412109375, -0.08184814453125, -0.0777740478515625, -0.073699951171875, -0.0696258544921875, -0.0655517578125, -0.0614776611328125, -0.057403564453125, -0.0533294677734375, -0.04925537109375, -0.0451812744140625, -0.041107177734375, -0.0370330810546875, -0.032958984375, -0.0288848876953125, -0.024810791015625, -0.0207366943359375, -0.01666259765625, -0.0125885009765625, -0.008514404296875, -0.0044403076171875, -0.0003662109375, 0.0037078857421875, 0.007781982421875, 0.0118560791015625, 0.01593017578125, 0.0200042724609375, 0.024078369140625, 0.0281524658203125, 0.0322265625, 0.0363006591796875, 0.040374755859375, 0.0444488525390625, 0.04852294921875, 0.0525970458984375, 0.056671142578125, 0.0607452392578125, 0.0648193359375, 0.0688934326171875, 0.072967529296875, 0.0770416259765625, 0.08111572265625, 0.0851898193359375, 0.089263916015625, 0.0933380126953125, 0.097412109375, 0.1014862060546875, 0.105560302734375, 0.1096343994140625, 0.11370849609375, 0.1177825927734375, 0.121856689453125, 0.1259307861328125, 0.1300048828125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 7.0, 3.0, 7.0, 11.0, 17.0, 22.0, 18.0, 32.0, 29.0, 36.0, 35.0, 48.0, 42.0, 40.0, 46.0, 39.0, 53.0, 58.0, 52.0, 46.0, 37.0, 44.0, 43.0, 32.0, 26.0, 41.0, 22.0, 24.0, 20.0, 15.0, 15.0, 8.0, 8.0, 10.0, 5.0, 0.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1512451171875, -0.14704227447509766, -0.1428394317626953, -0.13863658905029297, -0.13443374633789062, -0.13023090362548828, -0.12602806091308594, -0.1218252182006836, -0.11762237548828125, -0.1134195327758789, -0.10921669006347656, -0.10501384735107422, -0.10081100463867188, -0.09660816192626953, -0.09240531921386719, -0.08820247650146484, -0.0839996337890625, -0.07979679107666016, -0.07559394836425781, -0.07139110565185547, -0.06718826293945312, -0.06298542022705078, -0.05878257751464844, -0.054579734802246094, -0.05037689208984375, -0.046174049377441406, -0.04197120666503906, -0.03776836395263672, -0.033565521240234375, -0.02936267852783203, -0.025159835815429688, -0.020956993103027344, -0.016754150390625, -0.012551307678222656, -0.008348464965820312, -0.004145622253417969, 5.7220458984375e-05, 0.004260063171386719, 0.008462905883789062, 0.012665748596191406, 0.01686859130859375, 0.021071434020996094, 0.025274276733398438, 0.02947711944580078, 0.033679962158203125, 0.03788280487060547, 0.04208564758300781, 0.046288490295410156, 0.0504913330078125, 0.054694175720214844, 0.05889701843261719, 0.06309986114501953, 0.06730270385742188, 0.07150554656982422, 0.07570838928222656, 0.0799112319946289, 0.08411407470703125, 0.0883169174194336, 0.09251976013183594, 0.09672260284423828, 0.10092544555664062, 0.10512828826904297, 0.10933113098144531, 0.11353397369384766, 0.11773681640625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 2.0, 6.0, 10.0, 12.0, 26.0, 40.0, 106.0, 189.0, 482.0, 1344.0, 4262.0, 18926.0, 134164.0, 658803.0, 196743.0, 25275.0, 5512.0, 1666.0, 562.0, 215.0, 103.0, 53.0, 23.0, 13.0, 10.0, 7.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07818603515625, -0.07535171508789062, -0.07251739501953125, -0.06968307495117188, -0.0668487548828125, -0.06401443481445312, -0.06118011474609375, -0.058345794677734375, -0.055511474609375, -0.052677154541015625, -0.04984283447265625, -0.047008514404296875, -0.0441741943359375, -0.041339874267578125, -0.03850555419921875, -0.035671234130859375, -0.0328369140625, -0.030002593994140625, -0.02716827392578125, -0.024333953857421875, -0.0214996337890625, -0.018665313720703125, -0.01583099365234375, -0.012996673583984375, -0.010162353515625, -0.007328033447265625, -0.00449371337890625, -0.001659393310546875, 0.0011749267578125, 0.004009246826171875, 0.00684356689453125, 0.009677886962890625, 0.01251220703125, 0.015346527099609375, 0.01818084716796875, 0.021015167236328125, 0.0238494873046875, 0.026683807373046875, 0.02951812744140625, 0.032352447509765625, 0.035186767578125, 0.038021087646484375, 0.04085540771484375, 0.043689727783203125, 0.0465240478515625, 0.049358367919921875, 0.05219268798828125, 0.055027008056640625, 0.057861328125, 0.060695648193359375, 0.06352996826171875, 0.06636428833007812, 0.0691986083984375, 0.07203292846679688, 0.07486724853515625, 0.07770156860351562, 0.080535888671875, 0.08337020874023438, 0.08620452880859375, 0.08903884887695312, 0.0918731689453125, 0.09470748901367188, 0.09754180908203125, 0.10037612915039062, 0.10321044921875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 12.0, 14.0, 7.0, 12.0, 16.0, 23.0, 23.0, 28.0, 35.0, 50.0, 47.0, 68.0, 54.0, 56.0, 71.0, 68.0, 77.0, 56.0, 38.0, 47.0, 41.0, 28.0, 21.0, 18.0, 19.0, 15.0, 14.0, 12.0, 14.0, 7.0, 3.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.9981136322021484e-05, -2.9064714908599854e-05, -2.8148293495178223e-05, -2.7231872081756592e-05, -2.631545066833496e-05, -2.539902925491333e-05, -2.44826078414917e-05, -2.356618642807007e-05, -2.2649765014648438e-05, -2.1733343601226807e-05, -2.0816922187805176e-05, -1.9900500774383545e-05, -1.8984079360961914e-05, -1.8067657947540283e-05, -1.7151236534118652e-05, -1.623481512069702e-05, -1.531839370727539e-05, -1.440197229385376e-05, -1.3485550880432129e-05, -1.2569129467010498e-05, -1.1652708053588867e-05, -1.0736286640167236e-05, -9.819865226745605e-06, -8.903443813323975e-06, -7.987022399902344e-06, -7.070600986480713e-06, -6.154179573059082e-06, -5.237758159637451e-06, -4.32133674621582e-06, -3.4049153327941895e-06, -2.4884939193725586e-06, -1.5720725059509277e-06, -6.556510925292969e-07, 2.60770320892334e-07, 1.1771917343139648e-06, 2.0936131477355957e-06, 3.0100345611572266e-06, 3.926455974578857e-06, 4.842877388000488e-06, 5.759298801422119e-06, 6.67572021484375e-06, 7.592141628265381e-06, 8.508563041687012e-06, 9.424984455108643e-06, 1.0341405868530273e-05, 1.1257827281951904e-05, 1.2174248695373535e-05, 1.3090670108795166e-05, 1.4007091522216797e-05, 1.4923512935638428e-05, 1.583993434906006e-05, 1.675635576248169e-05, 1.767277717590332e-05, 1.858919858932495e-05, 1.9505620002746582e-05, 2.0422041416168213e-05, 2.1338462829589844e-05, 2.2254884243011475e-05, 2.3171305656433105e-05, 2.4087727069854736e-05, 2.5004148483276367e-05, 2.5920569896697998e-05, 2.683699131011963e-05, 2.775341272354126e-05, 2.866983413696289e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 5.0, 8.0, 21.0, 18.0, 23.0, 40.0, 56.0, 97.0, 124.0, 181.0, 304.0, 492.0, 952.0, 1949.0, 4039.0, 8983.0, 23889.0, 74084.0, 245071.0, 416149.0, 184057.0, 55253.0, 18364.0, 7284.0, 3443.0, 1598.0, 791.0, 483.0, 270.0, 174.0, 106.0, 85.0, 49.0, 37.0, 28.0, 16.0, 10.0, 4.0, 7.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.04931640625, -0.04769277572631836, -0.04606914520263672, -0.04444551467895508, -0.04282188415527344, -0.0411982536315918, -0.039574623107910156, -0.037950992584228516, -0.036327362060546875, -0.034703731536865234, -0.033080101013183594, -0.03145647048950195, -0.029832839965820312, -0.028209209442138672, -0.02658557891845703, -0.02496194839477539, -0.02333831787109375, -0.02171468734741211, -0.02009105682373047, -0.018467426300048828, -0.016843795776367188, -0.015220165252685547, -0.013596534729003906, -0.011972904205322266, -0.010349273681640625, -0.008725643157958984, -0.007102012634277344, -0.005478382110595703, -0.0038547515869140625, -0.002231121063232422, -0.0006074905395507812, 0.0010161399841308594, 0.0026397705078125, 0.004263401031494141, 0.005887031555175781, 0.007510662078857422, 0.009134292602539062, 0.010757923126220703, 0.012381553649902344, 0.014005184173583984, 0.015628814697265625, 0.017252445220947266, 0.018876075744628906, 0.020499706268310547, 0.022123336791992188, 0.023746967315673828, 0.02537059783935547, 0.02699422836303711, 0.02861785888671875, 0.03024148941040039, 0.03186511993408203, 0.03348875045776367, 0.03511238098144531, 0.03673601150512695, 0.038359642028808594, 0.039983272552490234, 0.041606903076171875, 0.043230533599853516, 0.044854164123535156, 0.0464777946472168, 0.04810142517089844, 0.04972505569458008, 0.05134868621826172, 0.05297231674194336, 0.054595947265625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 9.0, 6.0, 6.0, 9.0, 15.0, 11.0, 17.0, 17.0, 26.0, 28.0, 36.0, 48.0, 57.0, 59.0, 69.0, 86.0, 64.0, 57.0, 54.0, 59.0, 38.0, 39.0, 35.0, 30.0, 21.0, 18.0, 13.0, 15.0, 17.0, 9.0, 6.0, 5.0, 5.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.046783447265625, -0.045366764068603516, -0.04395008087158203, -0.04253339767456055, -0.04111671447753906, -0.03970003128051758, -0.038283348083496094, -0.03686666488647461, -0.035449981689453125, -0.03403329849243164, -0.032616615295410156, -0.031199932098388672, -0.029783248901367188, -0.028366565704345703, -0.02694988250732422, -0.025533199310302734, -0.02411651611328125, -0.022699832916259766, -0.02128314971923828, -0.019866466522216797, -0.018449783325195312, -0.017033100128173828, -0.015616416931152344, -0.01419973373413086, -0.012783050537109375, -0.01136636734008789, -0.009949684143066406, -0.008533000946044922, -0.0071163177490234375, -0.005699634552001953, -0.004282951354980469, -0.0028662681579589844, -0.0014495849609375, -3.2901763916015625e-05, 0.0013837814331054688, 0.002800464630126953, 0.0042171478271484375, 0.005633831024169922, 0.007050514221191406, 0.00846719741821289, 0.009883880615234375, 0.01130056381225586, 0.012717247009277344, 0.014133930206298828, 0.015550613403320312, 0.016967296600341797, 0.01838397979736328, 0.019800662994384766, 0.02121734619140625, 0.022634029388427734, 0.02405071258544922, 0.025467395782470703, 0.026884078979492188, 0.028300762176513672, 0.029717445373535156, 0.03113412857055664, 0.032550811767578125, 0.03396749496459961, 0.035384178161621094, 0.03680086135864258, 0.03821754455566406, 0.03963422775268555, 0.04105091094970703, 0.042467594146728516, 0.04388427734375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 8.0, 9.0, 11.0, 21.0, 30.0, 41.0, 70.0, 87.0, 122.0, 131.0, 127.0, 109.0, 76.0, 61.0, 30.0, 26.0, 13.0, 12.0, 5.0, 6.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6081541776657104, -0.5803227424621582, -0.552491307258606, -0.5246598720550537, -0.49682846665382385, -0.4689970314502716, -0.44116559624671936, -0.4133341908454895, -0.38550275564193726, -0.357671320438385, -0.32983988523483276, -0.3020084500312805, -0.27417704463005066, -0.2463456094264984, -0.21851417422294617, -0.19068275392055511, -0.16285130381584167, -0.13501986861228943, -0.10718844830989838, -0.07935701310634613, -0.05152558535337448, -0.023694157600402832, 0.004137277603149414, 0.031968697905540466, 0.05980013310909271, 0.08763156086206436, 0.11546298861503601, 0.14329442381858826, 0.1711258590221405, 0.19895727932453156, 0.2267887145280838, 0.25462013483047485, 0.2824515700340271, 0.31028300523757935, 0.3381144404411316, 0.36594587564468384, 0.3937772810459137, 0.42160871624946594, 0.4494401514530182, 0.47727155685424805, 0.5051029920578003, 0.5329344272613525, 0.5607658624649048, 0.588597297668457, 0.6164287328720093, 0.6442601680755615, 0.6720916032791138, 0.6999229788780212, 0.7277544736862183, 0.7555859088897705, 0.7834173440933228, 0.811248779296875, 0.8390802145004272, 0.8669116497039795, 0.8947430849075317, 0.9225744605064392, 0.9504058957099915, 0.9782373309135437, 1.0060687065124512, 1.0339001417160034, 1.0617315769195557, 1.089563012123108, 1.1173944473266602, 1.1452258825302124, 1.1730573177337646]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 8.0, 10.0, 11.0, 6.0, 12.0, 8.0, 19.0, 23.0, 18.0, 18.0, 26.0, 19.0, 39.0, 29.0, 31.0, 29.0, 33.0, 46.0, 42.0, 44.0, 51.0, 50.0, 50.0, 29.0, 39.0, 37.0, 38.0, 35.0, 34.0, 30.0, 26.0, 24.0, 8.0, 16.0, 6.0, 13.0, 6.0, 9.0, 10.0, 7.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5535398125648499, -0.5352002382278442, -0.5168606638908386, -0.4985211193561554, -0.48018157482147217, -0.46184200048446655, -0.44350242614746094, -0.4251628816127777, -0.4068233370780945, -0.38848376274108887, -0.37014421820640564, -0.3518046438694, -0.3334650993347168, -0.3151255249977112, -0.29678595066070557, -0.27844640612602234, -0.2601068317890167, -0.2417672723531723, -0.22342771291732788, -0.20508813858032227, -0.18674859404563904, -0.16840901970863342, -0.150069460272789, -0.13172990083694458, -0.11339034140110016, -0.09505078196525574, -0.07671122252941132, -0.0583716556429863, -0.040032096207141876, -0.021692536771297455, -0.0033529698848724365, 0.014986589550971985, 0.033326148986816406, 0.05166570842266083, 0.07000526785850525, 0.08834483474493027, 0.10668439418077469, 0.1250239610671997, 0.14336352050304413, 0.16170307993888855, 0.18004263937473297, 0.1983821988105774, 0.21672175824642181, 0.23506131768226624, 0.25340089201927185, 0.2717404365539551, 0.2900800108909607, 0.3084195852279663, 0.32675912976264954, 0.34509870409965515, 0.3634382486343384, 0.381777822971344, 0.4001173675060272, 0.41845694184303284, 0.43679648637771606, 0.4551360607147217, 0.4734756350517273, 0.4918152093887329, 0.5101547837257385, 0.5284942984580994, 0.546833872795105, 0.5651734471321106, 0.5835130214691162, 0.601852536201477, 0.6201921105384827]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 3.0, 7.0, 7.0, 4.0, 8.0, 10.0, 11.0, 25.0, 23.0, 38.0, 37.0, 46.0, 59.0, 74.0, 111.0, 164.0, 212.0, 376.0, 455.0, 772.0, 1373.0, 2770.0, 7238.0, 32811.0, 4052784.0, 75945.0, 10715.0, 3601.0, 1727.0, 955.0, 600.0, 391.0, 253.0, 173.0, 123.0, 89.0, 74.0, 34.0, 34.0, 36.0, 29.0, 12.0, 7.0, 15.0, 10.0, 13.0, 7.0, 8.0, 3.0, 6.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.2086181640625, -0.20223236083984375, -0.1958465576171875, -0.18946075439453125, -0.183074951171875, -0.17668914794921875, -0.1703033447265625, -0.16391754150390625, -0.15753173828125, -0.15114593505859375, -0.1447601318359375, -0.13837432861328125, -0.131988525390625, -0.12560272216796875, -0.1192169189453125, -0.11283111572265625, -0.1064453125, -0.10005950927734375, -0.0936737060546875, -0.08728790283203125, -0.080902099609375, -0.07451629638671875, -0.0681304931640625, -0.06174468994140625, -0.05535888671875, -0.04897308349609375, -0.0425872802734375, -0.03620147705078125, -0.029815673828125, -0.02342987060546875, -0.0170440673828125, -0.01065826416015625, -0.0042724609375, 0.00211334228515625, 0.0084991455078125, 0.01488494873046875, 0.021270751953125, 0.02765655517578125, 0.0340423583984375, 0.04042816162109375, 0.04681396484375, 0.05319976806640625, 0.0595855712890625, 0.06597137451171875, 0.072357177734375, 0.07874298095703125, 0.0851287841796875, 0.09151458740234375, 0.097900390625, 0.10428619384765625, 0.1106719970703125, 0.11705780029296875, 0.123443603515625, 0.12982940673828125, 0.1362152099609375, 0.14260101318359375, 0.14898681640625, 0.15537261962890625, 0.1617584228515625, 0.16814422607421875, 0.174530029296875, 0.18091583251953125, 0.1873016357421875, 0.19368743896484375, 0.2000732421875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 2.0, 7.0, 1.0, 8.0, 14.0, 10.0, 6.0, 13.0, 17.0, 17.0, 22.0, 13.0, 27.0, 29.0, 32.0, 34.0, 37.0, 40.0, 42.0, 32.0, 44.0, 38.0, 40.0, 38.0, 43.0, 35.0, 39.0, 31.0, 36.0, 38.0, 32.0, 34.0, 21.0, 17.0, 25.0, 10.0, 11.0, 13.0, 11.0, 8.0, 2.0, 14.0, 5.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.022979736328125, -0.022265195846557617, -0.021550655364990234, -0.02083611488342285, -0.02012157440185547, -0.019407033920288086, -0.018692493438720703, -0.01797795295715332, -0.017263412475585938, -0.016548871994018555, -0.015834331512451172, -0.015119791030883789, -0.014405250549316406, -0.013690710067749023, -0.01297616958618164, -0.012261629104614258, -0.011547088623046875, -0.010832548141479492, -0.01011800765991211, -0.009403467178344727, -0.008688926696777344, -0.007974386215209961, -0.007259845733642578, -0.006545305252075195, -0.0058307647705078125, -0.00511622428894043, -0.004401683807373047, -0.003687143325805664, -0.0029726028442382812, -0.0022580623626708984, -0.0015435218811035156, -0.0008289813995361328, -0.00011444091796875, 0.0006000995635986328, 0.0013146400451660156, 0.0020291805267333984, 0.0027437210083007812, 0.003458261489868164, 0.004172801971435547, 0.00488734245300293, 0.0056018829345703125, 0.006316423416137695, 0.007030963897705078, 0.007745504379272461, 0.008460044860839844, 0.009174585342407227, 0.00988912582397461, 0.010603666305541992, 0.011318206787109375, 0.012032747268676758, 0.01274728775024414, 0.013461828231811523, 0.014176368713378906, 0.014890909194946289, 0.015605449676513672, 0.016319990158081055, 0.017034530639648438, 0.01774907112121582, 0.018463611602783203, 0.019178152084350586, 0.01989269256591797, 0.02060723304748535, 0.021321773529052734, 0.022036314010620117, 0.0227508544921875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 1.0, 4.0, 2.0, 9.0, 5.0, 10.0, 13.0, 11.0, 26.0, 35.0, 51.0, 57.0, 83.0, 112.0, 152.0, 209.0, 320.0, 501.0, 763.0, 1225.0, 2353.0, 5280.0, 15446.0, 130337.0, 3982670.0, 37652.0, 8778.0, 3605.0, 1799.0, 882.0, 630.0, 354.0, 255.0, 193.0, 132.0, 82.0, 62.0, 45.0, 48.0, 30.0, 15.0, 15.0, 11.0, 6.0, 7.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.25244140625, -0.2452831268310547, -0.23812484741210938, -0.23096656799316406, -0.22380828857421875, -0.21665000915527344, -0.20949172973632812, -0.2023334503173828, -0.1951751708984375, -0.1880168914794922, -0.18085861206054688, -0.17370033264160156, -0.16654205322265625, -0.15938377380371094, -0.15222549438476562, -0.1450672149658203, -0.137908935546875, -0.1307506561279297, -0.12359237670898438, -0.11643409729003906, -0.10927581787109375, -0.10211753845214844, -0.09495925903320312, -0.08780097961425781, -0.0806427001953125, -0.07348442077636719, -0.06632614135742188, -0.05916786193847656, -0.05200958251953125, -0.04485130310058594, -0.037693023681640625, -0.030534744262695312, -0.02337646484375, -0.016218185424804688, -0.009059906005859375, -0.0019016265869140625, 0.00525665283203125, 0.012414932250976562, 0.019573211669921875, 0.026731491088867188, 0.0338897705078125, 0.04104804992675781, 0.048206329345703125, 0.05536460876464844, 0.06252288818359375, 0.06968116760253906, 0.07683944702148438, 0.08399772644042969, 0.091156005859375, 0.09831428527832031, 0.10547256469726562, 0.11263084411621094, 0.11978912353515625, 0.12694740295410156, 0.13410568237304688, 0.1412639617919922, 0.1484222412109375, 0.1555805206298828, 0.16273880004882812, 0.16989707946777344, 0.17705535888671875, 0.18421363830566406, 0.19137191772460938, 0.1985301971435547, 0.2056884765625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 2.0, 5.0, 0.0, 12.0, 9.0, 14.0, 34.0, 81.0, 463.0, 3227.0, 123.0, 47.0, 24.0, 10.0, 4.0, 6.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049774169921875, -0.04822492599487305, -0.046675682067871094, -0.04512643814086914, -0.04357719421386719, -0.042027950286865234, -0.04047870635986328, -0.03892946243286133, -0.037380218505859375, -0.03583097457885742, -0.03428173065185547, -0.032732486724853516, -0.031183242797851562, -0.02963399887084961, -0.028084754943847656, -0.026535511016845703, -0.02498626708984375, -0.023437023162841797, -0.021887779235839844, -0.02033853530883789, -0.018789291381835938, -0.017240047454833984, -0.01569080352783203, -0.014141559600830078, -0.012592315673828125, -0.011043071746826172, -0.009493827819824219, -0.007944583892822266, -0.0063953399658203125, -0.004846096038818359, -0.0032968521118164062, -0.0017476081848144531, -0.0001983642578125, 0.0013508796691894531, 0.0029001235961914062, 0.004449367523193359, 0.0059986114501953125, 0.007547855377197266, 0.009097099304199219, 0.010646343231201172, 0.012195587158203125, 0.013744831085205078, 0.015294075012207031, 0.016843318939208984, 0.018392562866210938, 0.01994180679321289, 0.021491050720214844, 0.023040294647216797, 0.02458953857421875, 0.026138782501220703, 0.027688026428222656, 0.02923727035522461, 0.030786514282226562, 0.032335758209228516, 0.03388500213623047, 0.03543424606323242, 0.036983489990234375, 0.03853273391723633, 0.04008197784423828, 0.041631221771240234, 0.04318046569824219, 0.04472970962524414, 0.046278953552246094, 0.04782819747924805, 0.04937744140625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 1.0, 4.0, 4.0, 13.0, 9.0, 12.0, 19.0, 36.0, 38.0, 69.0, 87.0, 101.0, 118.0, 110.0, 109.0, 71.0, 60.0, 59.0, 27.0, 22.0, 15.0, 8.0, 3.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14739945530891418, -0.14217491447925568, -0.13695037364959717, -0.13172583281993866, -0.12650129199028015, -0.12127675861120224, -0.11605222523212433, -0.11082768440246582, -0.10560314357280731, -0.1003786027431488, -0.0951540619134903, -0.08992952853441238, -0.08470498770475388, -0.07948044687509537, -0.07425591349601746, -0.06903137266635895, -0.06380683183670044, -0.05858229100704193, -0.05335775390267372, -0.04813321679830551, -0.042908675968647, -0.037684135138988495, -0.032459598034620285, -0.027235060930252075, -0.022010520100593567, -0.016785981133580208, -0.011561442166566849, -0.00633690319955349, -0.0011123642325401306, 0.0041121747344732285, 0.009336713701486588, 0.014561250805854797, 0.019785791635513306, 0.025010330602526665, 0.030234869569540024, 0.035459406673908234, 0.04068394750356674, 0.04590848833322525, 0.05113302543759346, 0.05635756254196167, 0.06158210337162018, 0.06680664420127869, 0.0720311850309372, 0.0772557184100151, 0.08248025923967361, 0.08770480006933212, 0.09292933344841003, 0.09815387427806854, 0.10337841510772705, 0.10860295593738556, 0.11382749676704407, 0.11905203014612198, 0.12427657097578049, 0.1295011043548584, 0.1347256451845169, 0.13995018601417542, 0.14517472684383392, 0.15039926767349243, 0.15562380850315094, 0.16084834933280945, 0.16607287526130676, 0.17129741609096527, 0.17652195692062378, 0.1817464977502823, 0.1869710385799408]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 6.0, 10.0, 6.0, 5.0, 4.0, 13.0, 15.0, 24.0, 13.0, 23.0, 28.0, 18.0, 26.0, 31.0, 47.0, 43.0, 44.0, 47.0, 50.0, 59.0, 53.0, 49.0, 35.0, 36.0, 52.0, 34.0, 34.0, 26.0, 33.0, 26.0, 26.0, 18.0, 14.0, 11.0, 9.0, 14.0, 10.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.08530747890472412, -0.08259212970733643, -0.07987678050994873, -0.07716142386198044, -0.07444607466459274, -0.07173072546720505, -0.06901536881923676, -0.06630001962184906, -0.06358467042446136, -0.06086932122707367, -0.058153968304395676, -0.05543861538171768, -0.05272326618432999, -0.05000791698694229, -0.0472925640642643, -0.044577211141586304, -0.04186186194419861, -0.03914651274681091, -0.03643115982413292, -0.033715806901454926, -0.03100045770406723, -0.028285106644034386, -0.02556975558400154, -0.022854404523968697, -0.020139053463935852, -0.017423702403903008, -0.014708351343870163, -0.011993000283837318, -0.009277649223804474, -0.006562298163771629, -0.003846947103738785, -0.0011315960437059402, 0.0015837550163269043, 0.004299106076359749, 0.007014457136392593, 0.009729808196425438, 0.012445159256458282, 0.015160510316491127, 0.01787586137652397, 0.020591212436556816, 0.02330656349658966, 0.026021914556622505, 0.02873726561665535, 0.031452618539333344, 0.03416796773672104, 0.036883316934108734, 0.03959866985678673, 0.04231402277946472, 0.04502937197685242, 0.04774472117424011, 0.050460074096918106, 0.0531754270195961, 0.055890776216983795, 0.05860612541437149, 0.061321478337049484, 0.06403683125972748, 0.06675218045711517, 0.06946752965450287, 0.07218287885189056, 0.07489823549985886, 0.07761358469724655, 0.08032893389463425, 0.08304429054260254, 0.08575963973999023, 0.08847498893737793]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 9.0, 11.0, 15.0, 26.0, 37.0, 45.0, 67.0, 102.0, 130.0, 252.0, 356.0, 521.0, 901.0, 1495.0, 2569.0, 4578.0, 8540.0, 16754.0, 34574.0, 71812.0, 147712.0, 249193.0, 239987.0, 137511.0, 66006.0, 31437.0, 15572.0, 7879.0, 4211.0, 2433.0, 1419.0, 868.0, 555.0, 328.0, 212.0, 142.0, 87.0, 66.0, 42.0, 26.0, 20.0, 20.0, 13.0, 3.0, 9.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052032470703125, -0.0501704216003418, -0.048308372497558594, -0.04644632339477539, -0.04458427429199219, -0.042722225189208984, -0.04086017608642578, -0.03899812698364258, -0.037136077880859375, -0.03527402877807617, -0.03341197967529297, -0.031549930572509766, -0.029687881469726562, -0.02782583236694336, -0.025963783264160156, -0.024101734161376953, -0.02223968505859375, -0.020377635955810547, -0.018515586853027344, -0.01665353775024414, -0.014791488647460938, -0.012929439544677734, -0.011067390441894531, -0.009205341339111328, -0.007343292236328125, -0.005481243133544922, -0.0036191940307617188, -0.0017571449279785156, 0.0001049041748046875, 0.0019669532775878906, 0.0038290023803710938, 0.005691051483154297, 0.0075531005859375, 0.009415149688720703, 0.011277198791503906, 0.01313924789428711, 0.015001296997070312, 0.016863346099853516, 0.01872539520263672, 0.020587444305419922, 0.022449493408203125, 0.024311542510986328, 0.02617359161376953, 0.028035640716552734, 0.029897689819335938, 0.03175973892211914, 0.033621788024902344, 0.03548383712768555, 0.03734588623046875, 0.03920793533325195, 0.041069984436035156, 0.04293203353881836, 0.04479408264160156, 0.046656131744384766, 0.04851818084716797, 0.05038022994995117, 0.052242279052734375, 0.05410432815551758, 0.05596637725830078, 0.057828426361083984, 0.05969047546386719, 0.06155252456665039, 0.0634145736694336, 0.0652766227722168, 0.067138671875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 0.0, 6.0, 11.0, 8.0, 6.0, 17.0, 16.0, 13.0, 25.0, 18.0, 21.0, 28.0, 20.0, 30.0, 34.0, 36.0, 38.0, 36.0, 38.0, 44.0, 46.0, 44.0, 53.0, 46.0, 42.0, 38.0, 44.0, 33.0, 27.0, 31.0, 32.0, 18.0, 24.0, 18.0, 15.0, 6.0, 7.0, 12.0, 5.0, 9.0, 6.0, 4.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.021697998046875, -0.020832061767578125, -0.01996612548828125, -0.019100189208984375, -0.0182342529296875, -0.017368316650390625, -0.01650238037109375, -0.015636444091796875, -0.0147705078125, -0.013904571533203125, -0.01303863525390625, -0.012172698974609375, -0.0113067626953125, -0.010440826416015625, -0.00957489013671875, -0.008708953857421875, -0.007843017578125, -0.006977081298828125, -0.00611114501953125, -0.005245208740234375, -0.0043792724609375, -0.003513336181640625, -0.00264739990234375, -0.001781463623046875, -0.00091552734375, -4.9591064453125e-05, 0.00081634521484375, 0.001682281494140625, 0.0025482177734375, 0.003414154052734375, 0.00428009033203125, 0.005146026611328125, 0.006011962890625, 0.006877899169921875, 0.00774383544921875, 0.008609771728515625, 0.0094757080078125, 0.010341644287109375, 0.01120758056640625, 0.012073516845703125, 0.012939453125, 0.013805389404296875, 0.01467132568359375, 0.015537261962890625, 0.0164031982421875, 0.017269134521484375, 0.01813507080078125, 0.019001007080078125, 0.019866943359375, 0.020732879638671875, 0.02159881591796875, 0.022464752197265625, 0.0233306884765625, 0.024196624755859375, 0.02506256103515625, 0.025928497314453125, 0.02679443359375, 0.027660369873046875, 0.02852630615234375, 0.029392242431640625, 0.0302581787109375, 0.031124114990234375, 0.03199005126953125, 0.032855987548828125, 0.033721923828125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 16.0, 8.0, 17.0, 26.0, 46.0, 87.0, 97.0, 175.0, 325.0, 559.0, 1076.0, 2345.0, 6668.0, 24314.0, 124864.0, 585610.0, 243485.0, 42056.0, 10336.0, 3379.0, 1413.0, 718.0, 363.0, 215.0, 126.0, 94.0, 50.0, 30.0, 19.0, 20.0, 8.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.15283203125, -0.14877605438232422, -0.14472007751464844, -0.14066410064697266, -0.13660812377929688, -0.1325521469116211, -0.1284961700439453, -0.12444019317626953, -0.12038421630859375, -0.11632823944091797, -0.11227226257324219, -0.1082162857055664, -0.10416030883789062, -0.10010433197021484, -0.09604835510253906, -0.09199237823486328, -0.0879364013671875, -0.08388042449951172, -0.07982444763183594, -0.07576847076416016, -0.07171249389648438, -0.0676565170288086, -0.06360054016113281, -0.05954456329345703, -0.05548858642578125, -0.05143260955810547, -0.04737663269042969, -0.043320655822753906, -0.039264678955078125, -0.035208702087402344, -0.031152725219726562, -0.02709674835205078, -0.023040771484375, -0.01898479461669922, -0.014928817749023438, -0.010872840881347656, -0.006816864013671875, -0.0027608871459960938, 0.0012950897216796875, 0.005351066589355469, 0.00940704345703125, 0.013463020324707031, 0.017518997192382812, 0.021574974060058594, 0.025630950927734375, 0.029686927795410156, 0.03374290466308594, 0.03779888153076172, 0.0418548583984375, 0.04591083526611328, 0.04996681213378906, 0.054022789001464844, 0.058078765869140625, 0.062134742736816406, 0.06619071960449219, 0.07024669647216797, 0.07430267333984375, 0.07835865020751953, 0.08241462707519531, 0.0864706039428711, 0.09052658081054688, 0.09458255767822266, 0.09863853454589844, 0.10269451141357422, 0.10675048828125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 6.0, 2.0, 6.0, 7.0, 8.0, 10.0, 9.0, 10.0, 10.0, 21.0, 17.0, 22.0, 18.0, 35.0, 33.0, 31.0, 39.0, 31.0, 41.0, 44.0, 51.0, 43.0, 39.0, 48.0, 38.0, 43.0, 33.0, 41.0, 30.0, 30.0, 30.0, 31.0, 19.0, 25.0, 16.0, 13.0, 15.0, 11.0, 8.0, 10.0, 5.0, 7.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.1290283203125, -0.12491607666015625, -0.1208038330078125, -0.11669158935546875, -0.112579345703125, -0.10846710205078125, -0.1043548583984375, -0.10024261474609375, -0.09613037109375, -0.09201812744140625, -0.0879058837890625, -0.08379364013671875, -0.079681396484375, -0.07556915283203125, -0.0714569091796875, -0.06734466552734375, -0.063232421875, -0.05912017822265625, -0.0550079345703125, -0.05089569091796875, -0.046783447265625, -0.04267120361328125, -0.0385589599609375, -0.03444671630859375, -0.03033447265625, -0.02622222900390625, -0.0221099853515625, -0.01799774169921875, -0.013885498046875, -0.00977325439453125, -0.0056610107421875, -0.00154876708984375, 0.0025634765625, 0.00667572021484375, 0.0107879638671875, 0.01490020751953125, 0.019012451171875, 0.02312469482421875, 0.0272369384765625, 0.03134918212890625, 0.03546142578125, 0.03957366943359375, 0.0436859130859375, 0.04779815673828125, 0.051910400390625, 0.05602264404296875, 0.0601348876953125, 0.06424713134765625, 0.068359375, 0.07247161865234375, 0.0765838623046875, 0.08069610595703125, 0.084808349609375, 0.08892059326171875, 0.0930328369140625, 0.09714508056640625, 0.10125732421875, 0.10536956787109375, 0.1094818115234375, 0.11359405517578125, 0.117706298828125, 0.12181854248046875, 0.1259307861328125, 0.13004302978515625, 0.1341552734375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 5.0, 4.0, 4.0, 26.0, 28.0, 40.0, 62.0, 91.0, 231.0, 525.0, 1617.0, 6515.0, 116863.0, 898852.0, 18976.0, 3064.0, 950.0, 320.0, 145.0, 92.0, 48.0, 22.0, 29.0, 12.0, 7.0, 10.0, 7.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.29150390625, -0.28426170349121094, -0.2770195007324219, -0.2697772979736328, -0.26253509521484375, -0.2552928924560547, -0.24805068969726562, -0.24080848693847656, -0.2335662841796875, -0.22632408142089844, -0.21908187866210938, -0.2118396759033203, -0.20459747314453125, -0.1973552703857422, -0.19011306762695312, -0.18287086486816406, -0.175628662109375, -0.16838645935058594, -0.16114425659179688, -0.1539020538330078, -0.14665985107421875, -0.1394176483154297, -0.13217544555664062, -0.12493324279785156, -0.1176910400390625, -0.11044883728027344, -0.10320663452148438, -0.09596443176269531, -0.08872222900390625, -0.08148002624511719, -0.07423782348632812, -0.06699562072753906, -0.05975341796875, -0.05251121520996094, -0.045269012451171875, -0.03802680969238281, -0.03078460693359375, -0.023542404174804688, -0.016300201416015625, -0.009057998657226562, -0.0018157958984375, 0.0054264068603515625, 0.012668609619140625, 0.019910812377929688, 0.02715301513671875, 0.03439521789550781, 0.041637420654296875, 0.04887962341308594, 0.056121826171875, 0.06336402893066406, 0.07060623168945312, 0.07784843444824219, 0.08509063720703125, 0.09233283996582031, 0.09957504272460938, 0.10681724548339844, 0.1140594482421875, 0.12130165100097656, 0.12854385375976562, 0.1357860565185547, 0.14302825927734375, 0.1502704620361328, 0.15751266479492188, 0.16475486755371094, 0.1719970703125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 7.0, 11.0, 12.0, 24.0, 33.0, 56.0, 57.0, 72.0, 101.0, 122.0, 109.0, 94.0, 75.0, 56.0, 48.0, 47.0, 27.0, 22.0, 10.0, 7.0, 5.0, 3.0, 5.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-5.835294723510742e-05, -5.705840885639191e-05, -5.576387047767639e-05, -5.4469332098960876e-05, -5.317479372024536e-05, -5.1880255341529846e-05, -5.058571696281433e-05, -4.9291178584098816e-05, -4.79966402053833e-05, -4.6702101826667786e-05, -4.540756344795227e-05, -4.4113025069236755e-05, -4.281848669052124e-05, -4.1523948311805725e-05, -4.022940993309021e-05, -3.8934871554374695e-05, -3.764033317565918e-05, -3.6345794796943665e-05, -3.505125641822815e-05, -3.3756718039512634e-05, -3.246217966079712e-05, -3.1167641282081604e-05, -2.987310290336609e-05, -2.8578564524650574e-05, -2.728402614593506e-05, -2.5989487767219543e-05, -2.469494938850403e-05, -2.3400411009788513e-05, -2.2105872631072998e-05, -2.0811334252357483e-05, -1.9516795873641968e-05, -1.8222257494926453e-05, -1.6927719116210938e-05, -1.5633180737495422e-05, -1.4338642358779907e-05, -1.3044103980064392e-05, -1.1749565601348877e-05, -1.0455027222633362e-05, -9.160488843917847e-06, -7.865950465202332e-06, -6.571412086486816e-06, -5.276873707771301e-06, -3.982335329055786e-06, -2.687796950340271e-06, -1.3932585716247559e-06, -9.872019290924072e-08, 1.1958181858062744e-06, 2.4903565645217896e-06, 3.7848949432373047e-06, 5.07943332195282e-06, 6.373971700668335e-06, 7.66851007938385e-06, 8.963048458099365e-06, 1.025758683681488e-05, 1.1552125215530396e-05, 1.284666359424591e-05, 1.4141201972961426e-05, 1.543574035167694e-05, 1.6730278730392456e-05, 1.802481710910797e-05, 1.9319355487823486e-05, 2.0613893866539e-05, 2.1908432245254517e-05, 2.3202970623970032e-05, 2.4497509002685547e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 4.0, 7.0, 4.0, 12.0, 17.0, 28.0, 25.0, 52.0, 73.0, 101.0, 153.0, 280.0, 398.0, 742.0, 1358.0, 2971.0, 8143.0, 35933.0, 418088.0, 521092.0, 43359.0, 8981.0, 3221.0, 1498.0, 789.0, 464.0, 256.0, 183.0, 93.0, 61.0, 51.0, 38.0, 32.0, 18.0, 7.0, 6.0, 4.0, 4.0, 1.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1060791015625, -0.1027688980102539, -0.09945869445800781, -0.09614849090576172, -0.09283828735351562, -0.08952808380126953, -0.08621788024902344, -0.08290767669677734, -0.07959747314453125, -0.07628726959228516, -0.07297706604003906, -0.06966686248779297, -0.06635665893554688, -0.06304645538330078, -0.05973625183105469, -0.056426048278808594, -0.0531158447265625, -0.049805641174316406, -0.04649543762207031, -0.04318523406982422, -0.039875030517578125, -0.03656482696533203, -0.03325462341308594, -0.029944419860839844, -0.02663421630859375, -0.023324012756347656, -0.020013809204101562, -0.01670360565185547, -0.013393402099609375, -0.010083198547363281, -0.0067729949951171875, -0.0034627914428710938, -0.000152587890625, 0.0031576156616210938, 0.0064678192138671875, 0.009778022766113281, 0.013088226318359375, 0.01639842987060547, 0.019708633422851562, 0.023018836975097656, 0.02632904052734375, 0.029639244079589844, 0.03294944763183594, 0.03625965118408203, 0.039569854736328125, 0.04288005828857422, 0.04619026184082031, 0.049500465393066406, 0.0528106689453125, 0.056120872497558594, 0.05943107604980469, 0.06274127960205078, 0.06605148315429688, 0.06936168670654297, 0.07267189025878906, 0.07598209381103516, 0.07929229736328125, 0.08260250091552734, 0.08591270446777344, 0.08922290802001953, 0.09253311157226562, 0.09584331512451172, 0.09915351867675781, 0.1024637222290039, 0.10577392578125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 0.0, 2.0, 3.0, 5.0, 9.0, 8.0, 13.0, 5.0, 17.0, 27.0, 26.0, 41.0, 45.0, 66.0, 90.0, 78.0, 84.0, 106.0, 89.0, 67.0, 48.0, 35.0, 33.0, 25.0, 19.0, 15.0, 17.0, 12.0, 5.0, 3.0, 1.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06634521484375, -0.06403923034667969, -0.061733245849609375, -0.05942726135253906, -0.05712127685546875, -0.05481529235839844, -0.052509307861328125, -0.05020332336425781, -0.0478973388671875, -0.04559135437011719, -0.043285369873046875, -0.04097938537597656, -0.03867340087890625, -0.03636741638183594, -0.034061431884765625, -0.03175544738769531, -0.029449462890625, -0.027143478393554688, -0.024837493896484375, -0.022531509399414062, -0.02022552490234375, -0.017919540405273438, -0.015613555908203125, -0.013307571411132812, -0.0110015869140625, -0.008695602416992188, -0.006389617919921875, -0.0040836334228515625, -0.00177764892578125, 0.0005283355712890625, 0.002834320068359375, 0.0051403045654296875, 0.0074462890625, 0.009752273559570312, 0.012058258056640625, 0.014364242553710938, 0.01667022705078125, 0.018976211547851562, 0.021282196044921875, 0.023588180541992188, 0.0258941650390625, 0.028200149536132812, 0.030506134033203125, 0.03281211853027344, 0.03511810302734375, 0.03742408752441406, 0.039730072021484375, 0.04203605651855469, 0.044342041015625, 0.04664802551269531, 0.048954010009765625, 0.05125999450683594, 0.05356597900390625, 0.05587196350097656, 0.058177947998046875, 0.06048393249511719, 0.0627899169921875, 0.06509590148925781, 0.06740188598632812, 0.06970787048339844, 0.07201385498046875, 0.07431983947753906, 0.07662582397460938, 0.07893180847167969, 0.08123779296875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 10.0, 10.0, 21.0, 46.0, 80.0, 117.0, 148.0, 149.0, 141.0, 110.0, 77.0, 45.0, 20.0, 13.0, 11.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0901665687561035, -1.0443147420883179, -0.9984630346298218, -0.9526112079620361, -0.9067594408988953, -0.8609076738357544, -0.8150558471679688, -0.7692040801048279, -0.723352313041687, -0.6775005459785461, -0.6316487789154053, -0.5857969522476196, -0.5399451851844788, -0.4940934181213379, -0.44824162125587463, -0.4023898243904114, -0.3565380573272705, -0.31068629026412964, -0.2648344933986664, -0.21898271143436432, -0.17313092947006226, -0.1272791475057602, -0.08142736554145813, -0.03557556867599487, 0.010276198387145996, 0.05612798035144806, 0.10197976231575012, 0.14783154428005219, 0.19368332624435425, 0.2395351082086563, 0.2853868901729584, 0.33123868703842163, 0.3770904541015625, 0.42294222116470337, 0.4687940180301666, 0.5146458148956299, 0.5604975819587708, 0.6063493490219116, 0.6522011756896973, 0.6980529427528381, 0.743904709815979, 0.7897564768791199, 0.8356082439422607, 0.8814600706100464, 0.9273118376731873, 0.9731636047363281, 1.0190154314041138, 1.0648672580718994, 1.1107189655303955, 1.1565707921981812, 1.2024224996566772, 1.248274326324463, 1.294126033782959, 1.3399778604507446, 1.3858296871185303, 1.4316813945770264, 1.477533221244812, 1.5233850479125977, 1.5692367553710938, 1.6150885820388794, 1.660940408706665, 1.7067921161651611, 1.7526439428329468, 1.7984957695007324, 1.8443474769592285]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 7.0, 8.0, 11.0, 9.0, 11.0, 14.0, 15.0, 30.0, 28.0, 28.0, 32.0, 54.0, 48.0, 52.0, 47.0, 61.0, 56.0, 66.0, 67.0, 49.0, 45.0, 37.0, 36.0, 30.0, 32.0, 26.0, 14.0, 18.0, 21.0, 15.0, 7.0, 17.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.1282103061676025, -1.0989480018615723, -1.0696858167648315, -1.0404235124588013, -1.0111613273620605, -0.9818990230560303, -0.9526367783546448, -0.9233745336532593, -0.894112229347229, -0.8648499846458435, -0.835587739944458, -0.8063254356384277, -0.7770631909370422, -0.7478009462356567, -0.7185387015342712, -0.6892764568328857, -0.6600141525268555, -0.63075190782547, -0.6014896631240845, -0.5722273588180542, -0.5429651141166687, -0.5137028694152832, -0.4844406247138977, -0.4551783502101898, -0.4259161353111267, -0.3966538906097412, -0.3673916161060333, -0.3381293714046478, -0.30886709690093994, -0.27960485219955444, -0.25034260749816895, -0.22108033299446106, -0.19181805849075317, -0.16255579888820648, -0.1332935392856598, -0.1040312871336937, -0.074769027531147, -0.04550677537918091, -0.016244515776634216, 0.013017743825912476, 0.04228000342845917, 0.07154226303100586, 0.10080452263355255, 0.13006678223609924, 0.15932902693748474, 0.18859128654003143, 0.21785354614257812, 0.24711580574512482, 0.2763780653476715, 0.305640310049057, 0.3349025845527649, 0.3641648292541504, 0.3934271037578583, 0.4226893484592438, 0.45195162296295166, 0.48121386766433716, 0.5104761123657227, 0.5397383570671082, 0.5690006017684937, 0.5982629060745239, 0.6275251507759094, 0.6567873954772949, 0.6860496401786804, 0.7153118848800659, 0.7445741891860962]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 12.0, 8.0, 9.0, 10.0, 23.0, 30.0, 46.0, 47.0, 76.0, 118.0, 167.0, 254.0, 401.0, 786.0, 1629.0, 4176.0, 18943.0, 4070729.0, 83403.0, 8365.0, 2461.0, 1055.0, 548.0, 346.0, 206.0, 128.0, 86.0, 66.0, 44.0, 31.0, 20.0, 17.0, 12.0, 9.0, 4.0, 5.0, 6.0, 2.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.315185546875, -0.30556488037109375, -0.2959442138671875, -0.28632354736328125, -0.276702880859375, -0.26708221435546875, -0.2574615478515625, -0.24784088134765625, -0.23822021484375, -0.22859954833984375, -0.2189788818359375, -0.20935821533203125, -0.199737548828125, -0.19011688232421875, -0.1804962158203125, -0.17087554931640625, -0.1612548828125, -0.15163421630859375, -0.1420135498046875, -0.13239288330078125, -0.122772216796875, -0.11315155029296875, -0.1035308837890625, -0.09391021728515625, -0.08428955078125, -0.07466888427734375, -0.0650482177734375, -0.05542755126953125, -0.045806884765625, -0.03618621826171875, -0.0265655517578125, -0.01694488525390625, -0.00732421875, 0.00229644775390625, 0.0119171142578125, 0.02153778076171875, 0.031158447265625, 0.04077911376953125, 0.0503997802734375, 0.06002044677734375, 0.06964111328125, 0.07926177978515625, 0.0888824462890625, 0.09850311279296875, 0.108123779296875, 0.11774444580078125, 0.1273651123046875, 0.13698577880859375, 0.1466064453125, 0.15622711181640625, 0.1658477783203125, 0.17546844482421875, 0.185089111328125, 0.19470977783203125, 0.2043304443359375, 0.21395111083984375, 0.22357177734375, 0.23319244384765625, 0.2428131103515625, 0.25243377685546875, 0.262054443359375, 0.27167510986328125, 0.2812957763671875, 0.29091644287109375, 0.300537109375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 6.0, 4.0, 5.0, 3.0, 8.0, 9.0, 13.0, 11.0, 25.0, 16.0, 26.0, 30.0, 43.0, 27.0, 41.0, 50.0, 53.0, 54.0, 46.0, 65.0, 57.0, 50.0, 43.0, 45.0, 43.0, 29.0, 41.0, 38.0, 20.0, 20.0, 18.0, 15.0, 13.0, 11.0, 10.0, 4.0, 5.0, 5.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.038726806640625, -0.037693023681640625, -0.03665924072265625, -0.035625457763671875, -0.0345916748046875, -0.033557891845703125, -0.03252410888671875, -0.031490325927734375, -0.03045654296875, -0.029422760009765625, -0.02838897705078125, -0.027355194091796875, -0.0263214111328125, -0.025287628173828125, -0.02425384521484375, -0.023220062255859375, -0.022186279296875, -0.021152496337890625, -0.02011871337890625, -0.019084930419921875, -0.0180511474609375, -0.017017364501953125, -0.01598358154296875, -0.014949798583984375, -0.013916015625, -0.012882232666015625, -0.01184844970703125, -0.010814666748046875, -0.0097808837890625, -0.008747100830078125, -0.00771331787109375, -0.006679534912109375, -0.005645751953125, -0.004611968994140625, -0.00357818603515625, -0.002544403076171875, -0.0015106201171875, -0.000476837158203125, 0.00055694580078125, 0.001590728759765625, 0.00262451171875, 0.003658294677734375, 0.00469207763671875, 0.005725860595703125, 0.0067596435546875, 0.007793426513671875, 0.00882720947265625, 0.009860992431640625, 0.010894775390625, 0.011928558349609375, 0.01296234130859375, 0.013996124267578125, 0.0150299072265625, 0.016063690185546875, 0.01709747314453125, 0.018131256103515625, 0.0191650390625, 0.020198822021484375, 0.02123260498046875, 0.022266387939453125, 0.0233001708984375, 0.024333953857421875, 0.02536773681640625, 0.026401519775390625, 0.027435302734375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 8.0, 9.0, 8.0, 10.0, 17.0, 20.0, 28.0, 42.0, 70.0, 98.0, 106.0, 133.0, 197.0, 328.0, 529.0, 832.0, 1451.0, 3059.0, 8172.0, 36818.0, 4028192.0, 93184.0, 12246.0, 4097.0, 1800.0, 963.0, 597.0, 372.0, 260.0, 185.0, 120.0, 83.0, 90.0, 60.0, 20.0, 21.0, 18.0, 17.0, 3.0, 8.0, 5.0, 5.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.270751953125, -0.261627197265625, -0.25250244140625, -0.243377685546875, -0.2342529296875, -0.225128173828125, -0.21600341796875, -0.206878662109375, -0.19775390625, -0.188629150390625, -0.17950439453125, -0.170379638671875, -0.1612548828125, -0.152130126953125, -0.14300537109375, -0.133880615234375, -0.124755859375, -0.115631103515625, -0.10650634765625, -0.097381591796875, -0.0882568359375, -0.079132080078125, -0.07000732421875, -0.060882568359375, -0.0517578125, -0.042633056640625, -0.03350830078125, -0.024383544921875, -0.0152587890625, -0.006134033203125, 0.00299072265625, 0.012115478515625, 0.021240234375, 0.030364990234375, 0.03948974609375, 0.048614501953125, 0.0577392578125, 0.066864013671875, 0.07598876953125, 0.085113525390625, 0.09423828125, 0.103363037109375, 0.11248779296875, 0.121612548828125, 0.1307373046875, 0.139862060546875, 0.14898681640625, 0.158111572265625, 0.167236328125, 0.176361083984375, 0.18548583984375, 0.194610595703125, 0.2037353515625, 0.212860107421875, 0.22198486328125, 0.231109619140625, 0.240234375, 0.249359130859375, 0.25848388671875, 0.267608642578125, 0.2767333984375, 0.285858154296875, 0.29498291015625, 0.304107666015625, 0.313232421875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 9.0, 2.0, 8.0, 13.0, 39.0, 95.0, 3152.0, 589.0, 77.0, 34.0, 15.0, 14.0, 11.0, 3.0, 3.0, 5.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0899658203125, -0.08759450912475586, -0.08522319793701172, -0.08285188674926758, -0.08048057556152344, -0.0781092643737793, -0.07573795318603516, -0.07336664199829102, -0.07099533081054688, -0.06862401962280273, -0.0662527084350586, -0.06388139724731445, -0.06151008605957031, -0.05913877487182617, -0.05676746368408203, -0.05439615249633789, -0.05202484130859375, -0.04965353012084961, -0.04728221893310547, -0.04491090774536133, -0.04253959655761719, -0.04016828536987305, -0.037796974182128906, -0.035425662994384766, -0.033054351806640625, -0.030683040618896484, -0.028311729431152344, -0.025940418243408203, -0.023569107055664062, -0.021197795867919922, -0.01882648468017578, -0.01645517349243164, -0.0140838623046875, -0.01171255111694336, -0.009341239929199219, -0.006969928741455078, -0.0045986175537109375, -0.002227306365966797, 0.00014400482177734375, 0.0025153160095214844, 0.004886627197265625, 0.007257938385009766, 0.009629249572753906, 0.012000560760498047, 0.014371871948242188, 0.016743183135986328, 0.01911449432373047, 0.02148580551147461, 0.02385711669921875, 0.02622842788696289, 0.02859973907470703, 0.030971050262451172, 0.03334236145019531, 0.03571367263793945, 0.038084983825683594, 0.040456295013427734, 0.042827606201171875, 0.045198917388916016, 0.047570228576660156, 0.0499415397644043, 0.05231285095214844, 0.05468416213989258, 0.05705547332763672, 0.05942678451538086, 0.061798095703125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 7.0, 10.0, 14.0, 18.0, 30.0, 43.0, 74.0, 103.0, 116.0, 143.0, 133.0, 84.0, 79.0, 49.0, 29.0, 29.0, 11.0, 7.0, 8.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18322843313217163, -0.17545722424983978, -0.16768601536750793, -0.15991482138633728, -0.15214361250400543, -0.14437240362167358, -0.13660119473934174, -0.1288299858570099, -0.12105877697467804, -0.11328756809234619, -0.10551636666059494, -0.09774515777826309, -0.08997394889593124, -0.08220274746417999, -0.07443153858184814, -0.0666603296995163, -0.058889128267765045, -0.051117923110723495, -0.04334671422839165, -0.0355755090713501, -0.0278043020516634, -0.0200330950319767, -0.01226188987493515, -0.004490680992603302, 0.0032805241644382477, 0.011051731184124947, 0.018822938203811646, 0.026594143360853195, 0.034365348517894745, 0.04213655740022659, 0.04990776255726814, 0.05767897143959999, 0.06545017659664154, 0.07322138547897339, 0.08099258691072464, 0.08876379579305649, 0.09653500467538834, 0.10430620610713959, 0.11207741498947144, 0.11984862387180328, 0.12761983275413513, 0.13539104163646698, 0.14316225051879883, 0.15093344449996948, 0.15870465338230133, 0.16647586226463318, 0.17424707114696503, 0.18201828002929688, 0.18978947401046753, 0.19756068289279938, 0.20533189177513123, 0.21310308575630188, 0.22087429463863373, 0.22864550352096558, 0.23641671240329742, 0.24418792128562927, 0.2519591450691223, 0.25973033905029297, 0.267501562833786, 0.27527275681495667, 0.2830439805984497, 0.29081517457962036, 0.298586368560791, 0.30635759234428406, 0.3141287863254547]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 11.0, 7.0, 12.0, 8.0, 13.0, 19.0, 18.0, 17.0, 19.0, 27.0, 28.0, 29.0, 33.0, 28.0, 34.0, 31.0, 41.0, 37.0, 36.0, 51.0, 40.0, 29.0, 33.0, 31.0, 31.0, 36.0, 35.0, 34.0, 29.0, 23.0, 23.0, 25.0, 21.0, 20.0, 14.0, 12.0, 16.0, 11.0, 6.0, 6.0, 6.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09320485591888428, -0.08998407423496246, -0.08676329255104065, -0.08354251086711884, -0.08032172918319702, -0.07710094749927521, -0.0738801583647728, -0.07065937668085098, -0.06743859499692917, -0.06421781331300735, -0.06099703162908554, -0.05777624621987343, -0.054555464535951614, -0.0513346828520298, -0.04811389744281769, -0.044893115758895874, -0.04167233407497406, -0.038451552391052246, -0.03523077070713043, -0.03200998529791832, -0.028789203613996506, -0.025568421930074692, -0.02234763838350773, -0.019126854836940765, -0.01590607315301895, -0.012685290537774563, -0.009464507922530174, -0.006243725307285786, -0.003022942692041397, 0.00019783899188041687, 0.00341862253844738, 0.006639406085014343, 0.009860187768936157, 0.013080970384180546, 0.016301752999424934, 0.019522536545991898, 0.02274331822991371, 0.025964099913835526, 0.02918488346040249, 0.03240566700696945, 0.035626448690891266, 0.03884723037481308, 0.042068012058734894, 0.045288797467947006, 0.04850957915186882, 0.051730360835790634, 0.05495114624500275, 0.05817192792892456, 0.061392709612846375, 0.06461349129676819, 0.06783427298069, 0.07105505466461182, 0.07427583634853363, 0.07749661803245544, 0.08071740716695786, 0.08393818885087967, 0.08715897053480148, 0.0903797522187233, 0.09360053390264511, 0.09682131558656693, 0.10004210472106934, 0.10326288640499115, 0.10648366808891296, 0.10970444977283478, 0.11292523145675659]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 4.0, 6.0, 3.0, 9.0, 14.0, 17.0, 31.0, 53.0, 69.0, 111.0, 220.0, 274.0, 510.0, 860.0, 1686.0, 3472.0, 6996.0, 15422.0, 34762.0, 81852.0, 181734.0, 294416.0, 229716.0, 110074.0, 47607.0, 20221.0, 9254.0, 4292.0, 2162.0, 1162.0, 582.0, 369.0, 207.0, 140.0, 89.0, 56.0, 37.0, 29.0, 5.0, 17.0, 10.0, 4.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0704345703125, -0.0683431625366211, -0.06625175476074219, -0.06416034698486328, -0.062068939208984375, -0.05997753143310547, -0.05788612365722656, -0.055794715881347656, -0.05370330810546875, -0.051611900329589844, -0.04952049255371094, -0.04742908477783203, -0.045337677001953125, -0.04324626922607422, -0.04115486145019531, -0.039063453674316406, -0.0369720458984375, -0.034880638122558594, -0.03278923034667969, -0.03069782257080078, -0.028606414794921875, -0.02651500701904297, -0.024423599243164062, -0.022332191467285156, -0.02024078369140625, -0.018149375915527344, -0.016057968139648438, -0.013966560363769531, -0.011875152587890625, -0.009783744812011719, -0.0076923370361328125, -0.005600929260253906, -0.003509521484375, -0.0014181137084960938, 0.0006732940673828125, 0.0027647018432617188, 0.004856109619140625, 0.006947517395019531, 0.009038925170898438, 0.011130332946777344, 0.01322174072265625, 0.015313148498535156, 0.017404556274414062, 0.01949596405029297, 0.021587371826171875, 0.02367877960205078, 0.025770187377929688, 0.027861595153808594, 0.0299530029296875, 0.032044410705566406, 0.03413581848144531, 0.03622722625732422, 0.038318634033203125, 0.04041004180908203, 0.04250144958496094, 0.044592857360839844, 0.04668426513671875, 0.048775672912597656, 0.05086708068847656, 0.05295848846435547, 0.055049896240234375, 0.05714130401611328, 0.05923271179199219, 0.061324119567871094, 0.06341552734375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 5.0, 11.0, 6.0, 16.0, 11.0, 15.0, 18.0, 14.0, 14.0, 18.0, 32.0, 32.0, 41.0, 28.0, 40.0, 48.0, 41.0, 59.0, 44.0, 38.0, 33.0, 39.0, 50.0, 42.0, 40.0, 43.0, 30.0, 27.0, 26.0, 31.0, 16.0, 13.0, 13.0, 18.0, 10.0, 10.0, 4.0, 2.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0290374755859375, -0.028041601181030273, -0.027045726776123047, -0.02604985237121582, -0.025053977966308594, -0.024058103561401367, -0.02306222915649414, -0.022066354751586914, -0.021070480346679688, -0.02007460594177246, -0.019078731536865234, -0.018082857131958008, -0.01708698272705078, -0.016091108322143555, -0.015095233917236328, -0.014099359512329102, -0.013103485107421875, -0.012107610702514648, -0.011111736297607422, -0.010115861892700195, -0.009119987487792969, -0.008124113082885742, -0.007128238677978516, -0.006132364273071289, -0.0051364898681640625, -0.004140615463256836, -0.0031447410583496094, -0.002148866653442383, -0.0011529922485351562, -0.0001571178436279297, 0.0008387565612792969, 0.0018346309661865234, 0.00283050537109375, 0.0038263797760009766, 0.004822254180908203, 0.00581812858581543, 0.006814002990722656, 0.007809877395629883, 0.00880575180053711, 0.009801626205444336, 0.010797500610351562, 0.011793375015258789, 0.012789249420166016, 0.013785123825073242, 0.014780998229980469, 0.015776872634887695, 0.016772747039794922, 0.01776862144470215, 0.018764495849609375, 0.0197603702545166, 0.020756244659423828, 0.021752119064331055, 0.02274799346923828, 0.023743867874145508, 0.024739742279052734, 0.02573561668395996, 0.026731491088867188, 0.027727365493774414, 0.02872323989868164, 0.029719114303588867, 0.030714988708496094, 0.03171086311340332, 0.03270673751831055, 0.03370261192321777, 0.034698486328125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 2.0, 2.0, 5.0, 6.0, 3.0, 7.0, 13.0, 15.0, 28.0, 30.0, 73.0, 79.0, 133.0, 191.0, 297.0, 473.0, 921.0, 1932.0, 5059.0, 17124.0, 83425.0, 495341.0, 364175.0, 58743.0, 12624.0, 4112.0, 1655.0, 800.0, 442.0, 272.0, 188.0, 101.0, 89.0, 49.0, 33.0, 28.0, 25.0, 12.0, 20.0, 7.0, 5.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.141357421875, -0.1374197006225586, -0.1334819793701172, -0.12954425811767578, -0.12560653686523438, -0.12166881561279297, -0.11773109436035156, -0.11379337310791016, -0.10985565185546875, -0.10591793060302734, -0.10198020935058594, -0.09804248809814453, -0.09410476684570312, -0.09016704559326172, -0.08622932434082031, -0.0822916030883789, -0.0783538818359375, -0.0744161605834961, -0.07047843933105469, -0.06654071807861328, -0.06260299682617188, -0.05866527557373047, -0.05472755432128906, -0.050789833068847656, -0.04685211181640625, -0.042914390563964844, -0.03897666931152344, -0.03503894805908203, -0.031101226806640625, -0.02716350555419922, -0.023225784301757812, -0.019288063049316406, -0.015350341796875, -0.011412620544433594, -0.0074748992919921875, -0.0035371780395507812, 0.000400543212890625, 0.004338264465332031, 0.008275985717773438, 0.012213706970214844, 0.01615142822265625, 0.020089149475097656, 0.024026870727539062, 0.02796459197998047, 0.031902313232421875, 0.03584003448486328, 0.03977775573730469, 0.043715476989746094, 0.0476531982421875, 0.051590919494628906, 0.05552864074707031, 0.05946636199951172, 0.06340408325195312, 0.06734180450439453, 0.07127952575683594, 0.07521724700927734, 0.07915496826171875, 0.08309268951416016, 0.08703041076660156, 0.09096813201904297, 0.09490585327148438, 0.09884357452392578, 0.10278129577636719, 0.1067190170288086, 0.11065673828125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 2.0, 6.0, 3.0, 8.0, 3.0, 12.0, 10.0, 13.0, 14.0, 13.0, 22.0, 33.0, 28.0, 32.0, 21.0, 34.0, 47.0, 31.0, 48.0, 60.0, 60.0, 50.0, 45.0, 58.0, 36.0, 35.0, 23.0, 33.0, 31.0, 32.0, 25.0, 29.0, 18.0, 15.0, 17.0, 12.0, 13.0, 9.0, 4.0, 5.0, 4.0, 5.0, 2.0, 1.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1376953125, -0.13295745849609375, -0.1282196044921875, -0.12348175048828125, -0.118743896484375, -0.11400604248046875, -0.1092681884765625, -0.10453033447265625, -0.09979248046875, -0.09505462646484375, -0.0903167724609375, -0.08557891845703125, -0.080841064453125, -0.07610321044921875, -0.0713653564453125, -0.06662750244140625, -0.0618896484375, -0.05715179443359375, -0.0524139404296875, -0.04767608642578125, -0.042938232421875, -0.03820037841796875, -0.0334625244140625, -0.02872467041015625, -0.02398681640625, -0.01924896240234375, -0.0145111083984375, -0.00977325439453125, -0.005035400390625, -0.00029754638671875, 0.0044403076171875, 0.00917816162109375, 0.013916015625, 0.01865386962890625, 0.0233917236328125, 0.02812957763671875, 0.032867431640625, 0.03760528564453125, 0.0423431396484375, 0.04708099365234375, 0.05181884765625, 0.05655670166015625, 0.0612945556640625, 0.06603240966796875, 0.070770263671875, 0.07550811767578125, 0.0802459716796875, 0.08498382568359375, 0.0897216796875, 0.09445953369140625, 0.0991973876953125, 0.10393524169921875, 0.108673095703125, 0.11341094970703125, 0.1181488037109375, 0.12288665771484375, 0.12762451171875, 0.13236236572265625, 0.1371002197265625, 0.14183807373046875, 0.146575927734375, 0.15131378173828125, 0.1560516357421875, 0.16078948974609375, 0.16552734375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 6.0, 3.0, 5.0, 9.0, 9.0, 15.0, 20.0, 28.0, 48.0, 74.0, 149.0, 301.0, 781.0, 3271.0, 27469.0, 858417.0, 148013.0, 7556.0, 1449.0, 439.0, 213.0, 112.0, 53.0, 29.0, 21.0, 13.0, 13.0, 8.0, 5.0, 4.0, 9.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1849365234375, -0.1801614761352539, -0.1753864288330078, -0.17061138153076172, -0.16583633422851562, -0.16106128692626953, -0.15628623962402344, -0.15151119232177734, -0.14673614501953125, -0.14196109771728516, -0.13718605041503906, -0.13241100311279297, -0.12763595581054688, -0.12286090850830078, -0.11808586120605469, -0.1133108139038086, -0.1085357666015625, -0.1037607192993164, -0.09898567199707031, -0.09421062469482422, -0.08943557739257812, -0.08466053009033203, -0.07988548278808594, -0.07511043548583984, -0.07033538818359375, -0.06556034088134766, -0.06078529357910156, -0.05601024627685547, -0.051235198974609375, -0.04646015167236328, -0.04168510437011719, -0.036910057067871094, -0.032135009765625, -0.027359962463378906, -0.022584915161132812, -0.01780986785888672, -0.013034820556640625, -0.008259773254394531, -0.0034847259521484375, 0.0012903213500976562, 0.00606536865234375, 0.010840415954589844, 0.015615463256835938, 0.02039051055908203, 0.025165557861328125, 0.02994060516357422, 0.03471565246582031, 0.039490699768066406, 0.0442657470703125, 0.049040794372558594, 0.05381584167480469, 0.05859088897705078, 0.06336593627929688, 0.06814098358154297, 0.07291603088378906, 0.07769107818603516, 0.08246612548828125, 0.08724117279052734, 0.09201622009277344, 0.09679126739501953, 0.10156631469726562, 0.10634136199951172, 0.11111640930175781, 0.1158914566040039, 0.12066650390625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 7.0, 16.0, 13.0, 24.0, 29.0, 26.0, 50.0, 51.0, 77.0, 73.0, 93.0, 76.0, 78.0, 67.0, 69.0, 39.0, 34.0, 37.0, 22.0, 24.0, 13.0, 25.0, 11.0, 13.0, 9.0, 3.0, 5.0, 5.0, 2.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.300739288330078e-05, -2.2184103727340698e-05, -2.1360814571380615e-05, -2.0537525415420532e-05, -1.971423625946045e-05, -1.8890947103500366e-05, -1.8067657947540283e-05, -1.72443687915802e-05, -1.6421079635620117e-05, -1.5597790479660034e-05, -1.4774501323699951e-05, -1.3951212167739868e-05, -1.3127923011779785e-05, -1.2304633855819702e-05, -1.1481344699859619e-05, -1.0658055543899536e-05, -9.834766387939453e-06, -9.01147723197937e-06, -8.188188076019287e-06, -7.364898920059204e-06, -6.541609764099121e-06, -5.718320608139038e-06, -4.895031452178955e-06, -4.071742296218872e-06, -3.248453140258789e-06, -2.425163984298706e-06, -1.601874828338623e-06, -7.7858567237854e-07, 4.470348358154297e-08, 8.67992639541626e-07, 1.691281795501709e-06, 2.514570951461792e-06, 3.337860107421875e-06, 4.161149263381958e-06, 4.984438419342041e-06, 5.807727575302124e-06, 6.631016731262207e-06, 7.45430588722229e-06, 8.277595043182373e-06, 9.100884199142456e-06, 9.924173355102539e-06, 1.0747462511062622e-05, 1.1570751667022705e-05, 1.2394040822982788e-05, 1.3217329978942871e-05, 1.4040619134902954e-05, 1.4863908290863037e-05, 1.568719744682312e-05, 1.6510486602783203e-05, 1.7333775758743286e-05, 1.815706491470337e-05, 1.8980354070663452e-05, 1.9803643226623535e-05, 2.0626932382583618e-05, 2.14502215385437e-05, 2.2273510694503784e-05, 2.3096799850463867e-05, 2.392008900642395e-05, 2.4743378162384033e-05, 2.5566667318344116e-05, 2.63899564743042e-05, 2.7213245630264282e-05, 2.8036534786224365e-05, 2.8859823942184448e-05, 2.968311309814453e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 7.0, 6.0, 7.0, 8.0, 19.0, 28.0, 30.0, 38.0, 76.0, 135.0, 202.0, 345.0, 725.0, 1524.0, 3858.0, 12858.0, 83399.0, 687958.0, 223287.0, 23869.0, 5943.0, 2121.0, 974.0, 470.0, 234.0, 126.0, 90.0, 78.0, 33.0, 31.0, 16.0, 8.0, 17.0, 8.0, 7.0, 5.0, 4.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.08917236328125, -0.08635902404785156, -0.08354568481445312, -0.08073234558105469, -0.07791900634765625, -0.07510566711425781, -0.07229232788085938, -0.06947898864746094, -0.0666656494140625, -0.06385231018066406, -0.061038970947265625, -0.05822563171386719, -0.05541229248046875, -0.05259895324707031, -0.049785614013671875, -0.04697227478027344, -0.044158935546875, -0.04134559631347656, -0.038532257080078125, -0.03571891784667969, -0.03290557861328125, -0.030092239379882812, -0.027278900146484375, -0.024465560913085938, -0.0216522216796875, -0.018838882446289062, -0.016025543212890625, -0.013212203979492188, -0.01039886474609375, -0.0075855255126953125, -0.004772186279296875, -0.0019588470458984375, 0.0008544921875, 0.0036678314208984375, 0.006481170654296875, 0.009294509887695312, 0.01210784912109375, 0.014921188354492188, 0.017734527587890625, 0.020547866821289062, 0.0233612060546875, 0.026174545288085938, 0.028987884521484375, 0.03180122375488281, 0.03461456298828125, 0.03742790222167969, 0.040241241455078125, 0.04305458068847656, 0.045867919921875, 0.04868125915527344, 0.051494598388671875, 0.05430793762207031, 0.05712127685546875, 0.05993461608886719, 0.06274795532226562, 0.06556129455566406, 0.0683746337890625, 0.07118797302246094, 0.07400131225585938, 0.07681465148925781, 0.07962799072265625, 0.08244132995605469, 0.08525466918945312, 0.08806800842285156, 0.09088134765625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 1.0, 3.0, 5.0, 6.0, 7.0, 9.0, 23.0, 36.0, 67.0, 116.0, 134.0, 150.0, 162.0, 104.0, 69.0, 45.0, 27.0, 13.0, 12.0, 7.0, 3.0, 5.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1597900390625, -0.15594959259033203, -0.15210914611816406, -0.1482686996459961, -0.14442825317382812, -0.14058780670166016, -0.1367473602294922, -0.13290691375732422, -0.12906646728515625, -0.12522602081298828, -0.12138557434082031, -0.11754512786865234, -0.11370468139648438, -0.1098642349243164, -0.10602378845214844, -0.10218334197998047, -0.0983428955078125, -0.09450244903564453, -0.09066200256347656, -0.0868215560913086, -0.08298110961914062, -0.07914066314697266, -0.07530021667480469, -0.07145977020263672, -0.06761932373046875, -0.06377887725830078, -0.05993843078613281, -0.056097984313964844, -0.052257537841796875, -0.048417091369628906, -0.04457664489746094, -0.04073619842529297, -0.036895751953125, -0.03305530548095703, -0.029214859008789062, -0.025374412536621094, -0.021533966064453125, -0.017693519592285156, -0.013853073120117188, -0.010012626647949219, -0.00617218017578125, -0.0023317337036132812, 0.0015087127685546875, 0.005349159240722656, 0.009189605712890625, 0.013030052185058594, 0.016870498657226562, 0.02071094512939453, 0.0245513916015625, 0.02839183807373047, 0.03223228454589844, 0.036072731018066406, 0.039913177490234375, 0.043753623962402344, 0.04759407043457031, 0.05143451690673828, 0.05527496337890625, 0.05911540985107422, 0.06295585632324219, 0.06679630279541016, 0.07063674926757812, 0.0744771957397461, 0.07831764221191406, 0.08215808868408203, 0.08599853515625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 7.0, 25.0, 60.0, 186.0, 271.0, 257.0, 143.0, 31.0, 15.0, 6.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0014524459838867, -0.9235528111457825, -0.8456531763076782, -0.7677536010742188, -0.6898539662361145, -0.6119543313980103, -0.5340547561645508, -0.45615512132644653, -0.3782554864883423, -0.30035585165023804, -0.22245624661445618, -0.14455662667751312, -0.06665700674057007, 0.01124262809753418, 0.08914223313331604, 0.1670418381690979, 0.24494147300720215, 0.3228411078453064, 0.40074071288108826, 0.4786403179168701, 0.5565399527549744, 0.6344395875930786, 0.7123391628265381, 0.7902387976646423, 0.8681384325027466, 0.9460380673408508, 1.023937702178955, 1.1018372774124146, 1.179736852645874, 1.257636547088623, 1.3355361223220825, 1.413435697555542, 1.491335153579712, 1.5692347288131714, 1.6471344232559204, 1.7250339984893799, 1.802933692932129, 1.8808332681655884, 1.9587328433990479, 2.036632537841797, 2.114531993865967, 2.192431688308716, 2.2703311443328857, 2.3482308387756348, 2.426130533218384, 2.504030227661133, 2.5819296836853027, 2.6598293781280518, 2.737729072570801, 2.81562876701355, 2.8935282230377197, 2.9714279174804688, 3.0493276119232178, 3.127227306365967, 3.2051267623901367, 3.2830264568328857, 3.3609261512756348, 3.438825845718384, 3.5167253017425537, 3.5946249961853027, 3.6725246906280518, 3.750424385070801, 3.8283238410949707, 3.9062235355377197, 3.9841229915618896]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 7.0, 11.0, 8.0, 13.0, 13.0, 14.0, 15.0, 22.0, 32.0, 34.0, 32.0, 34.0, 42.0, 42.0, 47.0, 55.0, 59.0, 49.0, 44.0, 48.0, 55.0, 38.0, 38.0, 41.0, 34.0, 33.0, 33.0, 13.0, 18.0, 11.0, 19.0, 9.0, 9.0, 8.0, 7.0, 6.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8185887336730957, -0.794086217880249, -0.7695837616920471, -0.7450812458992004, -0.7205787897109985, -0.6960762739181519, -0.6715737581253052, -0.6470712423324585, -0.6225687861442566, -0.5980662703514099, -0.573563814163208, -0.5490612983703613, -0.5245587825775146, -0.5000563263893127, -0.47555381059646606, -0.4510513246059418, -0.4265488386154175, -0.4020463526248932, -0.3775438666343689, -0.3530413508415222, -0.3285388648509979, -0.30403637886047363, -0.27953386306762695, -0.25503137707710266, -0.23052889108657837, -0.20602640509605408, -0.1815239042043686, -0.1570214033126831, -0.1325189173221588, -0.10801642388105392, -0.08351393043994904, -0.05901142954826355, -0.03450888395309448, -0.010006390511989594, 0.014496102929115295, 0.038998596370220184, 0.06350108981132507, 0.08800358325242996, 0.11250607669353485, 0.13700857758522034, 0.16151106357574463, 0.18601354956626892, 0.2105160504579544, 0.2350185513496399, 0.2595210373401642, 0.2840235233306885, 0.30852603912353516, 0.33302852511405945, 0.35753101110458374, 0.38203349709510803, 0.4065359830856323, 0.431038498878479, 0.4555409848690033, 0.4800434708595276, 0.5045459866523743, 0.5290484428405762, 0.5535509586334229, 0.5780534744262695, 0.6025559306144714, 0.6270584464073181, 0.65156090259552, 0.6760634183883667, 0.7005659341812134, 0.7250684499740601, 0.749570906162262]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 2.0, 6.0, 5.0, 5.0, 8.0, 23.0, 29.0, 50.0, 49.0, 104.0, 150.0, 274.0, 354.0, 684.0, 1150.0, 2496.0, 6454.0, 44672.0, 4113567.0, 15875.0, 4160.0, 1798.0, 940.0, 526.0, 332.0, 174.0, 120.0, 105.0, 61.0, 42.0, 24.0, 12.0, 11.0, 10.0, 7.0, 7.0, 5.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.185546875, -0.17722702026367188, -0.16890716552734375, -0.16058731079101562, -0.1522674560546875, -0.14394760131835938, -0.13562774658203125, -0.12730789184570312, -0.118988037109375, -0.11066818237304688, -0.10234832763671875, -0.09402847290039062, -0.0857086181640625, -0.07738876342773438, -0.06906890869140625, -0.060749053955078125, -0.05242919921875, -0.044109344482421875, -0.03578948974609375, -0.027469635009765625, -0.0191497802734375, -0.010829925537109375, -0.00251007080078125, 0.005809783935546875, 0.014129638671875, 0.022449493408203125, 0.03076934814453125, 0.039089202880859375, 0.0474090576171875, 0.055728912353515625, 0.06404876708984375, 0.07236862182617188, 0.0806884765625, 0.08900833129882812, 0.09732818603515625, 0.10564804077148438, 0.1139678955078125, 0.12228775024414062, 0.13060760498046875, 0.13892745971679688, 0.147247314453125, 0.15556716918945312, 0.16388702392578125, 0.17220687866210938, 0.1805267333984375, 0.18884658813476562, 0.19716644287109375, 0.20548629760742188, 0.21380615234375, 0.22212600708007812, 0.23044586181640625, 0.23876571655273438, 0.2470855712890625, 0.2554054260253906, 0.26372528076171875, 0.2720451354980469, 0.280364990234375, 0.2886848449707031, 0.29700469970703125, 0.3053245544433594, 0.3136444091796875, 0.3219642639160156, 0.33028411865234375, 0.3386039733886719, 0.346923828125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 7.0, 10.0, 15.0, 15.0, 21.0, 23.0, 27.0, 35.0, 31.0, 33.0, 39.0, 42.0, 54.0, 48.0, 45.0, 44.0, 49.0, 40.0, 49.0, 49.0, 46.0, 36.0, 34.0, 34.0, 30.0, 26.0, 22.0, 10.0, 12.0, 9.0, 18.0, 7.0, 6.0, 6.0, 9.0, 0.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.038330078125, -0.03719615936279297, -0.03606224060058594, -0.034928321838378906, -0.033794403076171875, -0.032660484313964844, -0.03152656555175781, -0.03039264678955078, -0.02925872802734375, -0.02812480926513672, -0.026990890502929688, -0.025856971740722656, -0.024723052978515625, -0.023589134216308594, -0.022455215454101562, -0.02132129669189453, -0.0201873779296875, -0.01905345916748047, -0.017919540405273438, -0.016785621643066406, -0.015651702880859375, -0.014517784118652344, -0.013383865356445312, -0.012249946594238281, -0.01111602783203125, -0.009982109069824219, -0.008848190307617188, -0.007714271545410156, -0.006580352783203125, -0.005446434020996094, -0.0043125152587890625, -0.0031785964965820312, -0.002044677734375, -0.0009107589721679688, 0.0002231597900390625, 0.0013570785522460938, 0.002490997314453125, 0.0036249160766601562, 0.0047588348388671875, 0.005892753601074219, 0.00702667236328125, 0.008160591125488281, 0.009294509887695312, 0.010428428649902344, 0.011562347412109375, 0.012696266174316406, 0.013830184936523438, 0.014964103698730469, 0.0160980224609375, 0.01723194122314453, 0.018365859985351562, 0.019499778747558594, 0.020633697509765625, 0.021767616271972656, 0.022901535034179688, 0.02403545379638672, 0.02516937255859375, 0.02630329132080078, 0.027437210083007812, 0.028571128845214844, 0.029705047607421875, 0.030838966369628906, 0.03197288513183594, 0.03310680389404297, 0.03424072265625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 5.0, 8.0, 7.0, 6.0, 9.0, 12.0, 27.0, 20.0, 22.0, 42.0, 61.0, 80.0, 110.0, 143.0, 180.0, 308.0, 546.0, 998.0, 3132.0, 100561.0, 4081016.0, 4114.0, 1182.0, 603.0, 315.0, 223.0, 148.0, 101.0, 76.0, 60.0, 36.0, 42.0, 23.0, 14.0, 8.0, 9.0, 10.0, 9.0, 2.0, 2.0, 2.0, 1.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.79296875, -0.7697067260742188, -0.7464447021484375, -0.7231826782226562, -0.699920654296875, -0.6766586303710938, -0.6533966064453125, -0.6301345825195312, -0.60687255859375, -0.5836105346679688, -0.5603485107421875, -0.5370864868164062, -0.513824462890625, -0.49056243896484375, -0.4673004150390625, -0.44403839111328125, -0.4207763671875, -0.39751434326171875, -0.3742523193359375, -0.35099029541015625, -0.327728271484375, -0.30446624755859375, -0.2812042236328125, -0.25794219970703125, -0.23468017578125, -0.21141815185546875, -0.1881561279296875, -0.16489410400390625, -0.141632080078125, -0.11837005615234375, -0.0951080322265625, -0.07184600830078125, -0.048583984375, -0.02532196044921875, -0.0020599365234375, 0.02120208740234375, 0.044464111328125, 0.06772613525390625, 0.0909881591796875, 0.11425018310546875, 0.13751220703125, 0.16077423095703125, 0.1840362548828125, 0.20729827880859375, 0.230560302734375, 0.25382232666015625, 0.2770843505859375, 0.30034637451171875, 0.3236083984375, 0.34687042236328125, 0.3701324462890625, 0.39339447021484375, 0.416656494140625, 0.43991851806640625, 0.4631805419921875, 0.48644256591796875, 0.50970458984375, 0.5329666137695312, 0.5562286376953125, 0.5794906616210938, 0.602752685546875, 0.6260147094726562, 0.6492767333984375, 0.6725387573242188, 0.69580078125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 8.0, 15.0, 102.0, 3884.0, 52.0, 11.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.169921875, -0.16414642333984375, -0.1583709716796875, -0.15259552001953125, -0.146820068359375, -0.14104461669921875, -0.1352691650390625, -0.12949371337890625, -0.12371826171875, -0.11794281005859375, -0.1121673583984375, -0.10639190673828125, -0.100616455078125, -0.09484100341796875, -0.0890655517578125, -0.08329010009765625, -0.0775146484375, -0.07173919677734375, -0.0659637451171875, -0.06018829345703125, -0.054412841796875, -0.04863739013671875, -0.0428619384765625, -0.03708648681640625, -0.03131103515625, -0.02553558349609375, -0.0197601318359375, -0.01398468017578125, -0.008209228515625, -0.00243377685546875, 0.0033416748046875, 0.00911712646484375, 0.014892578125, 0.02066802978515625, 0.0264434814453125, 0.03221893310546875, 0.037994384765625, 0.04376983642578125, 0.0495452880859375, 0.05532073974609375, 0.06109619140625, 0.06687164306640625, 0.0726470947265625, 0.07842254638671875, 0.084197998046875, 0.08997344970703125, 0.0957489013671875, 0.10152435302734375, 0.1072998046875, 0.11307525634765625, 0.1188507080078125, 0.12462615966796875, 0.130401611328125, 0.13617706298828125, 0.1419525146484375, 0.14772796630859375, 0.15350341796875, 0.15927886962890625, 0.1650543212890625, 0.17082977294921875, 0.176605224609375, 0.18238067626953125, 0.1881561279296875, 0.19393157958984375, 0.19970703125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 6.0, 8.0, 13.0, 20.0, 19.0, 19.0, 36.0, 53.0, 76.0, 81.0, 108.0, 108.0, 102.0, 96.0, 75.0, 47.0, 31.0, 29.0, 22.0, 14.0, 6.0, 10.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2450229972600937, -0.23755328357219696, -0.23008356988430023, -0.2226138710975647, -0.21514415740966797, -0.20767444372177124, -0.2002047300338745, -0.19273501634597778, -0.18526530265808105, -0.17779558897018433, -0.1703258752822876, -0.16285616159439087, -0.15538646280765533, -0.1479167491197586, -0.14044703543186188, -0.13297732174396515, -0.12550762295722961, -0.11803790926933289, -0.11056820303201675, -0.10309848934412003, -0.0956287831068039, -0.08815906941890717, -0.08068935573101044, -0.07321964204311371, -0.06574993580579758, -0.05828022584319115, -0.05081051588058472, -0.04334080219268799, -0.03587109223008156, -0.028401382267475128, -0.0209316685795784, -0.01346195861697197, -0.005992233753204346, 0.001477477140724659, 0.008947188034653664, 0.016416899859905243, 0.023886609822511673, 0.0313563197851181, 0.03882603347301483, 0.04629574343562126, 0.05376545339822769, 0.06123516336083412, 0.06870487332344055, 0.07617458701133728, 0.08364430069923401, 0.09111400693655014, 0.09858372062444687, 0.106053426861763, 0.11352314054965973, 0.12099285423755646, 0.12846256792545319, 0.13593226671218872, 0.14340198040008545, 0.15087169408798218, 0.1583414077758789, 0.16581112146377563, 0.17328083515167236, 0.1807505488395691, 0.18822026252746582, 0.19568997621536255, 0.20315967500209808, 0.2106293886899948, 0.21809910237789154, 0.22556881606578827, 0.2330385148525238]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 4.0, 2.0, 3.0, 4.0, 9.0, 7.0, 9.0, 10.0, 13.0, 18.0, 17.0, 20.0, 22.0, 28.0, 27.0, 28.0, 34.0, 33.0, 39.0, 41.0, 30.0, 34.0, 50.0, 36.0, 37.0, 44.0, 25.0, 33.0, 28.0, 43.0, 34.0, 27.0, 45.0, 17.0, 14.0, 15.0, 23.0, 19.0, 16.0, 15.0, 11.0, 6.0, 7.0, 5.0, 4.0, 5.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.1370716094970703, -0.1327364295721054, -0.1284012496471405, -0.1240660548210144, -0.1197308748960495, -0.1153956949710846, -0.11106050759553909, -0.10672532021999359, -0.10239014029502869, -0.09805496037006378, -0.09371977299451828, -0.08938458561897278, -0.08504940569400787, -0.08071422576904297, -0.07637903839349747, -0.07204385101795197, -0.06770867109298706, -0.06337349116802216, -0.059038303792476654, -0.05470312014222145, -0.05036793649196625, -0.046032752841711044, -0.04169756919145584, -0.03736238554120064, -0.033027201890945435, -0.02869201824069023, -0.024356834590435028, -0.020021650940179825, -0.01568646728992462, -0.011351283639669418, -0.007016099989414215, -0.002680916339159012, 0.0016542673110961914, 0.005989450961351395, 0.010324634611606598, 0.014659818261861801, 0.018995001912117004, 0.023330185562372208, 0.02766536921262741, 0.032000552862882614, 0.03633573651313782, 0.04067092016339302, 0.045006103813648224, 0.04934128746390343, 0.05367647111415863, 0.058011654764413834, 0.06234683841466904, 0.06668202579021454, 0.07101720571517944, 0.07535238564014435, 0.07968757301568985, 0.08402276039123535, 0.08835794031620026, 0.09269312024116516, 0.09702830761671066, 0.10136349499225616, 0.10569867491722107, 0.11003385484218597, 0.11436904221773148, 0.11870422959327698, 0.12303940951824188, 0.1273745894432068, 0.13170978426933289, 0.1360449641942978, 0.1403801441192627]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 9.0, 7.0, 4.0, 12.0, 10.0, 16.0, 30.0, 27.0, 41.0, 68.0, 100.0, 111.0, 227.0, 307.0, 444.0, 737.0, 1164.0, 2096.0, 3855.0, 7274.0, 15459.0, 35350.0, 88218.0, 227783.0, 354865.0, 183161.0, 70951.0, 29045.0, 12859.0, 6291.0, 3163.0, 1853.0, 1048.0, 693.0, 416.0, 284.0, 167.0, 109.0, 77.0, 56.0, 50.0, 30.0, 33.0, 16.0, 7.0, 8.0, 7.0, 2.0, 3.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 3.0], "bins": [-0.07763671875, -0.07516288757324219, -0.07268905639648438, -0.07021522521972656, -0.06774139404296875, -0.06526756286621094, -0.06279373168945312, -0.06031990051269531, -0.0578460693359375, -0.05537223815917969, -0.052898406982421875, -0.05042457580566406, -0.04795074462890625, -0.04547691345214844, -0.043003082275390625, -0.04052925109863281, -0.038055419921875, -0.03558158874511719, -0.033107757568359375, -0.030633926391601562, -0.02816009521484375, -0.025686264038085938, -0.023212432861328125, -0.020738601684570312, -0.0182647705078125, -0.015790939331054688, -0.013317108154296875, -0.010843276977539062, -0.00836944580078125, -0.0058956146240234375, -0.003421783447265625, -0.0009479522705078125, 0.00152587890625, 0.0039997100830078125, 0.006473541259765625, 0.008947372436523438, 0.01142120361328125, 0.013895034790039062, 0.016368865966796875, 0.018842697143554688, 0.0213165283203125, 0.023790359497070312, 0.026264190673828125, 0.028738021850585938, 0.03121185302734375, 0.03368568420410156, 0.036159515380859375, 0.03863334655761719, 0.041107177734375, 0.04358100891113281, 0.046054840087890625, 0.04852867126464844, 0.05100250244140625, 0.05347633361816406, 0.055950164794921875, 0.05842399597167969, 0.0608978271484375, 0.06337165832519531, 0.06584548950195312, 0.06831932067871094, 0.07079315185546875, 0.07326698303222656, 0.07574081420898438, 0.07821464538574219, 0.0806884765625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 7.0, 0.0, 6.0, 6.0, 5.0, 6.0, 9.0, 15.0, 15.0, 12.0, 16.0, 16.0, 20.0, 12.0, 28.0, 36.0, 41.0, 33.0, 32.0, 39.0, 29.0, 49.0, 47.0, 31.0, 53.0, 46.0, 49.0, 43.0, 46.0, 35.0, 28.0, 23.0, 27.0, 19.0, 16.0, 19.0, 12.0, 12.0, 14.0, 12.0, 10.0, 9.0, 4.0, 8.0, 4.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.040313720703125, -0.03911113739013672, -0.03790855407714844, -0.036705970764160156, -0.035503387451171875, -0.034300804138183594, -0.03309822082519531, -0.03189563751220703, -0.03069305419921875, -0.02949047088623047, -0.028287887573242188, -0.027085304260253906, -0.025882720947265625, -0.024680137634277344, -0.023477554321289062, -0.02227497100830078, -0.0210723876953125, -0.01986980438232422, -0.018667221069335938, -0.017464637756347656, -0.016262054443359375, -0.015059471130371094, -0.013856887817382812, -0.012654304504394531, -0.01145172119140625, -0.010249137878417969, -0.009046554565429688, -0.007843971252441406, -0.006641387939453125, -0.005438804626464844, -0.0042362213134765625, -0.0030336380004882812, -0.0018310546875, -0.0006284713745117188, 0.0005741119384765625, 0.0017766952514648438, 0.002979278564453125, 0.004181861877441406, 0.0053844451904296875, 0.006587028503417969, 0.00778961181640625, 0.008992195129394531, 0.010194778442382812, 0.011397361755371094, 0.012599945068359375, 0.013802528381347656, 0.015005111694335938, 0.01620769500732422, 0.0174102783203125, 0.01861286163330078, 0.019815444946289062, 0.021018028259277344, 0.022220611572265625, 0.023423194885253906, 0.024625778198242188, 0.02582836151123047, 0.02703094482421875, 0.02823352813720703, 0.029436111450195312, 0.030638694763183594, 0.031841278076171875, 0.033043861389160156, 0.03424644470214844, 0.03544902801513672, 0.036651611328125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 2.0, 3.0, 3.0, 11.0, 8.0, 14.0, 14.0, 27.0, 32.0, 39.0, 69.0, 89.0, 118.0, 198.0, 242.0, 443.0, 796.0, 1635.0, 4440.0, 16215.0, 95027.0, 684233.0, 206016.0, 27455.0, 6563.0, 2296.0, 1015.0, 526.0, 327.0, 215.0, 157.0, 98.0, 68.0, 49.0, 36.0, 27.0, 14.0, 11.0, 9.0, 7.0, 4.0, 1.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1624755859375, -0.1577892303466797, -0.15310287475585938, -0.14841651916503906, -0.14373016357421875, -0.13904380798339844, -0.13435745239257812, -0.1296710968017578, -0.1249847412109375, -0.12029838562011719, -0.11561203002929688, -0.11092567443847656, -0.10623931884765625, -0.10155296325683594, -0.09686660766601562, -0.09218025207519531, -0.087493896484375, -0.08280754089355469, -0.07812118530273438, -0.07343482971191406, -0.06874847412109375, -0.06406211853027344, -0.059375762939453125, -0.05468940734863281, -0.0500030517578125, -0.04531669616699219, -0.040630340576171875, -0.03594398498535156, -0.03125762939453125, -0.026571273803710938, -0.021884918212890625, -0.017198562622070312, -0.01251220703125, -0.007825851440429688, -0.003139495849609375, 0.0015468597412109375, 0.00623321533203125, 0.010919570922851562, 0.015605926513671875, 0.020292282104492188, 0.0249786376953125, 0.029664993286132812, 0.034351348876953125, 0.03903770446777344, 0.04372406005859375, 0.04841041564941406, 0.053096771240234375, 0.05778312683105469, 0.062469482421875, 0.06715583801269531, 0.07184219360351562, 0.07652854919433594, 0.08121490478515625, 0.08590126037597656, 0.09058761596679688, 0.09527397155761719, 0.0999603271484375, 0.10464668273925781, 0.10933303833007812, 0.11401939392089844, 0.11870574951171875, 0.12339210510253906, 0.12807846069335938, 0.1327648162841797, 0.137451171875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 8.0, 5.0, 14.0, 9.0, 8.0, 25.0, 17.0, 39.0, 18.0, 39.0, 33.0, 50.0, 31.0, 43.0, 48.0, 55.0, 55.0, 60.0, 42.0, 46.0, 59.0, 35.0, 43.0, 40.0, 39.0, 21.0, 34.0, 24.0, 9.0, 10.0, 7.0, 11.0, 7.0, 7.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2349853515625, -0.22806930541992188, -0.22115325927734375, -0.21423721313476562, -0.2073211669921875, -0.20040512084960938, -0.19348907470703125, -0.18657302856445312, -0.179656982421875, -0.17274093627929688, -0.16582489013671875, -0.15890884399414062, -0.1519927978515625, -0.14507675170898438, -0.13816070556640625, -0.13124465942382812, -0.12432861328125, -0.11741256713867188, -0.11049652099609375, -0.10358047485351562, -0.0966644287109375, -0.08974838256835938, -0.08283233642578125, -0.07591629028320312, -0.069000244140625, -0.062084197998046875, -0.05516815185546875, -0.048252105712890625, -0.0413360595703125, -0.034420013427734375, -0.02750396728515625, -0.020587921142578125, -0.013671875, -0.006755828857421875, 0.00016021728515625, 0.007076263427734375, 0.0139923095703125, 0.020908355712890625, 0.02782440185546875, 0.034740447998046875, 0.041656494140625, 0.048572540283203125, 0.05548858642578125, 0.062404632568359375, 0.0693206787109375, 0.07623672485351562, 0.08315277099609375, 0.09006881713867188, 0.09698486328125, 0.10390090942382812, 0.11081695556640625, 0.11773300170898438, 0.1246490478515625, 0.13156509399414062, 0.13848114013671875, 0.14539718627929688, 0.152313232421875, 0.15922927856445312, 0.16614532470703125, 0.17306137084960938, 0.1799774169921875, 0.18689346313476562, 0.19380950927734375, 0.20072555541992188, 0.2076416015625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 2.0, 5.0, 8.0, 3.0, 12.0, 22.0, 32.0, 56.0, 91.0, 196.0, 445.0, 1383.0, 11594.0, 842199.0, 186035.0, 4843.0, 908.0, 334.0, 144.0, 64.0, 62.0, 41.0, 24.0, 19.0, 8.0, 7.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.2646484375, -0.25832176208496094, -0.2519950866699219, -0.2456684112548828, -0.23934173583984375, -0.2330150604248047, -0.22668838500976562, -0.22036170959472656, -0.2140350341796875, -0.20770835876464844, -0.20138168334960938, -0.1950550079345703, -0.18872833251953125, -0.1824016571044922, -0.17607498168945312, -0.16974830627441406, -0.163421630859375, -0.15709495544433594, -0.15076828002929688, -0.1444416046142578, -0.13811492919921875, -0.1317882537841797, -0.12546157836914062, -0.11913490295410156, -0.1128082275390625, -0.10648155212402344, -0.10015487670898438, -0.09382820129394531, -0.08750152587890625, -0.08117485046386719, -0.07484817504882812, -0.06852149963378906, -0.06219482421875, -0.05586814880371094, -0.049541473388671875, -0.04321479797363281, -0.03688812255859375, -0.030561447143554688, -0.024234771728515625, -0.017908096313476562, -0.0115814208984375, -0.0052547454833984375, 0.001071929931640625, 0.0073986053466796875, 0.01372528076171875, 0.020051956176757812, 0.026378631591796875, 0.03270530700683594, 0.039031982421875, 0.04535865783691406, 0.051685333251953125, 0.05801200866699219, 0.06433868408203125, 0.07066535949707031, 0.07699203491210938, 0.08331871032714844, 0.0896453857421875, 0.09597206115722656, 0.10229873657226562, 0.10862541198730469, 0.11495208740234375, 0.12127876281738281, 0.12760543823242188, 0.13393211364746094, 0.1402587890625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 5.0, 8.0, 7.0, 10.0, 10.0, 15.0, 11.0, 18.0, 18.0, 37.0, 42.0, 48.0, 46.0, 86.0, 71.0, 78.0, 80.0, 65.0, 71.0, 49.0, 49.0, 45.0, 25.0, 20.0, 23.0, 10.0, 11.0, 10.0, 8.0, 10.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1278858184814453e-05, -2.0585954189300537e-05, -1.989305019378662e-05, -1.9200146198272705e-05, -1.850724220275879e-05, -1.7814338207244873e-05, -1.7121434211730957e-05, -1.642853021621704e-05, -1.5735626220703125e-05, -1.5042722225189209e-05, -1.4349818229675293e-05, -1.3656914234161377e-05, -1.2964010238647461e-05, -1.2271106243133545e-05, -1.1578202247619629e-05, -1.0885298252105713e-05, -1.0192394256591797e-05, -9.499490261077881e-06, -8.806586265563965e-06, -8.113682270050049e-06, -7.420778274536133e-06, -6.727874279022217e-06, -6.034970283508301e-06, -5.342066287994385e-06, -4.649162292480469e-06, -3.956258296966553e-06, -3.2633543014526367e-06, -2.5704503059387207e-06, -1.8775463104248047e-06, -1.1846423149108887e-06, -4.917383193969727e-07, 2.0116567611694336e-07, 8.940696716308594e-07, 1.5869736671447754e-06, 2.2798776626586914e-06, 2.9727816581726074e-06, 3.6656856536865234e-06, 4.3585896492004395e-06, 5.0514936447143555e-06, 5.7443976402282715e-06, 6.4373016357421875e-06, 7.1302056312561035e-06, 7.82310962677002e-06, 8.516013622283936e-06, 9.208917617797852e-06, 9.901821613311768e-06, 1.0594725608825684e-05, 1.12876296043396e-05, 1.1980533599853516e-05, 1.2673437595367432e-05, 1.3366341590881348e-05, 1.4059245586395264e-05, 1.475214958190918e-05, 1.5445053577423096e-05, 1.6137957572937012e-05, 1.6830861568450928e-05, 1.7523765563964844e-05, 1.821666955947876e-05, 1.8909573554992676e-05, 1.9602477550506592e-05, 2.0295381546020508e-05, 2.0988285541534424e-05, 2.168118953704834e-05, 2.2374093532562256e-05, 2.3066997528076172e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 12.0, 15.0, 31.0, 56.0, 82.0, 159.0, 280.0, 585.0, 1422.0, 5051.0, 39584.0, 832005.0, 155469.0, 9882.0, 2254.0, 790.0, 395.0, 202.0, 106.0, 67.0, 28.0, 22.0, 15.0, 9.0, 6.0, 5.0, 8.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.174072265625, -0.16945552825927734, -0.1648387908935547, -0.16022205352783203, -0.15560531616210938, -0.15098857879638672, -0.14637184143066406, -0.1417551040649414, -0.13713836669921875, -0.1325216293334961, -0.12790489196777344, -0.12328815460205078, -0.11867141723632812, -0.11405467987060547, -0.10943794250488281, -0.10482120513916016, -0.1002044677734375, -0.09558773040771484, -0.09097099304199219, -0.08635425567626953, -0.08173751831054688, -0.07712078094482422, -0.07250404357910156, -0.0678873062133789, -0.06327056884765625, -0.058653831481933594, -0.05403709411621094, -0.04942035675048828, -0.044803619384765625, -0.04018688201904297, -0.03557014465332031, -0.030953407287597656, -0.026336669921875, -0.021719932556152344, -0.017103195190429688, -0.012486457824707031, -0.007869720458984375, -0.0032529830932617188, 0.0013637542724609375, 0.005980491638183594, 0.01059722900390625, 0.015213966369628906, 0.019830703735351562, 0.02444744110107422, 0.029064178466796875, 0.03368091583251953, 0.03829765319824219, 0.042914390563964844, 0.0475311279296875, 0.052147865295410156, 0.05676460266113281, 0.06138134002685547, 0.06599807739257812, 0.07061481475830078, 0.07523155212402344, 0.0798482894897461, 0.08446502685546875, 0.0890817642211914, 0.09369850158691406, 0.09831523895263672, 0.10293197631835938, 0.10754871368408203, 0.11216545104980469, 0.11678218841552734, 0.12139892578125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 8.0, 9.0, 12.0, 27.0, 49.0, 83.0, 122.0, 164.0, 161.0, 139.0, 85.0, 55.0, 36.0, 24.0, 7.0, 9.0, 7.0, 7.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1910400390625, -0.1868114471435547, -0.18258285522460938, -0.17835426330566406, -0.17412567138671875, -0.16989707946777344, -0.16566848754882812, -0.1614398956298828, -0.1572113037109375, -0.1529827117919922, -0.14875411987304688, -0.14452552795410156, -0.14029693603515625, -0.13606834411621094, -0.13183975219726562, -0.1276111602783203, -0.123382568359375, -0.11915397644042969, -0.11492538452148438, -0.11069679260253906, -0.10646820068359375, -0.10223960876464844, -0.09801101684570312, -0.09378242492675781, -0.0895538330078125, -0.08532524108886719, -0.08109664916992188, -0.07686805725097656, -0.07263946533203125, -0.06841087341308594, -0.06418228149414062, -0.05995368957519531, -0.05572509765625, -0.05149650573730469, -0.047267913818359375, -0.04303932189941406, -0.03881072998046875, -0.03458213806152344, -0.030353546142578125, -0.026124954223632812, -0.0218963623046875, -0.017667770385742188, -0.013439178466796875, -0.009210586547851562, -0.00498199462890625, -0.0007534027099609375, 0.003475189208984375, 0.0077037811279296875, 0.011932373046875, 0.016160964965820312, 0.020389556884765625, 0.024618148803710938, 0.02884674072265625, 0.03307533264160156, 0.037303924560546875, 0.04153251647949219, 0.0457611083984375, 0.04998970031738281, 0.054218292236328125, 0.05844688415527344, 0.06267547607421875, 0.06690406799316406, 0.07113265991210938, 0.07536125183105469, 0.07958984375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 9.0, 4.0, 33.0, 85.0, 234.0, 276.0, 200.0, 102.0, 32.0, 16.0, 9.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9702353477478027, -2.891038179397583, -2.8118410110473633, -2.7326440811157227, -2.653446912765503, -2.574249744415283, -2.4950528144836426, -2.415855646133423, -2.336658477783203, -2.2574613094329834, -2.1782641410827637, -2.099067211151123, -2.0198700428009033, -1.9406728744506836, -1.8614758253097534, -1.7822787761688232, -1.7030816078186035, -1.6238844394683838, -1.5446873903274536, -1.4654903411865234, -1.3862931728363037, -1.307096004486084, -1.2278989553451538, -1.1487019062042236, -1.069504737854004, -0.990307629108429, -0.911110520362854, -0.831913411617279, -0.7527163028717041, -0.6735191941261292, -0.5943220853805542, -0.5151249766349792, -0.4359278678894043, -0.35673075914382935, -0.2775336503982544, -0.19833654165267944, -0.11913943290710449, -0.03994232416152954, 0.03925478458404541, 0.11845189332962036, 0.1976490020751953, 0.27684611082077026, 0.3560432195663452, 0.43524032831192017, 0.5144374370574951, 0.5936345458030701, 0.672831654548645, 0.75202876329422, 0.8312258720397949, 0.9104229807853699, 0.9896200895309448, 1.068817138671875, 1.1480143070220947, 1.2272114753723145, 1.3064085245132446, 1.3856055736541748, 1.4648027420043945, 1.5439999103546143, 1.6231969594955444, 1.7023940086364746, 1.7815911769866943, 1.860788345336914, 1.9399853944778442, 2.0191824436187744, 2.098379611968994]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 4.0, 10.0, 16.0, 16.0, 23.0, 21.0, 18.0, 34.0, 42.0, 46.0, 53.0, 59.0, 69.0, 87.0, 74.0, 76.0, 66.0, 61.0, 36.0, 50.0, 29.0, 24.0, 23.0, 19.0, 14.0, 8.0, 9.0, 2.0, 6.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0803883075714111, -1.0384495258331299, -0.9965108036994934, -0.9545720815658569, -0.9126332998275757, -0.8706945180892944, -0.828755795955658, -0.7868170738220215, -0.7448782920837402, -0.702939510345459, -0.6610007882118225, -0.619062066078186, -0.5771232843399048, -0.5351845026016235, -0.49324578046798706, -0.4513070285320282, -0.40936827659606934, -0.3674295246601105, -0.3254907727241516, -0.28355202078819275, -0.2416132688522339, -0.19967451691627502, -0.15773576498031616, -0.1157970130443573, -0.07385826110839844, -0.031919509172439575, 0.010019242763519287, 0.05195799469947815, 0.09389674663543701, 0.13583549857139587, 0.17777425050735474, 0.2197130024433136, 0.26165175437927246, 0.3035905063152313, 0.3455292582511902, 0.38746801018714905, 0.4294067621231079, 0.4713455140590668, 0.5132842659950256, 0.5552229881286621, 0.5971617698669434, 0.6391005516052246, 0.6810392737388611, 0.7229779958724976, 0.7649167776107788, 0.8068555593490601, 0.8487942814826965, 0.890733003616333, 0.9326717853546143, 0.9746105670928955, 1.0165493488311768, 1.0584880113601685, 1.1004267930984497, 1.142365574836731, 1.1843042373657227, 1.226243019104004, 1.2681818008422852, 1.3101205825805664, 1.3520593643188477, 1.3939980268478394, 1.4359368085861206, 1.4778755903244019, 1.5198142528533936, 1.5617530345916748, 1.603691816329956]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 5.0, 10.0, 11.0, 13.0, 19.0, 21.0, 25.0, 51.0, 55.0, 86.0, 123.0, 173.0, 233.0, 335.0, 527.0, 991.0, 2199.0, 6888.0, 31969.0, 4041324.0, 90522.0, 11805.0, 3402.0, 1392.0, 698.0, 406.0, 281.0, 189.0, 144.0, 96.0, 66.0, 68.0, 48.0, 30.0, 20.0, 21.0, 10.0, 11.0, 2.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.22705078125, -0.2201080322265625, -0.213165283203125, -0.2062225341796875, -0.19927978515625, -0.1923370361328125, -0.185394287109375, -0.1784515380859375, -0.1715087890625, -0.1645660400390625, -0.157623291015625, -0.1506805419921875, -0.14373779296875, -0.1367950439453125, -0.129852294921875, -0.1229095458984375, -0.115966796875, -0.1090240478515625, -0.102081298828125, -0.0951385498046875, -0.08819580078125, -0.0812530517578125, -0.074310302734375, -0.0673675537109375, -0.0604248046875, -0.0534820556640625, -0.046539306640625, -0.0395965576171875, -0.03265380859375, -0.0257110595703125, -0.018768310546875, -0.0118255615234375, -0.0048828125, 0.0020599365234375, 0.009002685546875, 0.0159454345703125, 0.02288818359375, 0.0298309326171875, 0.036773681640625, 0.0437164306640625, 0.0506591796875, 0.0576019287109375, 0.064544677734375, 0.0714874267578125, 0.07843017578125, 0.0853729248046875, 0.092315673828125, 0.0992584228515625, 0.106201171875, 0.1131439208984375, 0.120086669921875, 0.1270294189453125, 0.13397216796875, 0.1409149169921875, 0.147857666015625, 0.1548004150390625, 0.1617431640625, 0.1686859130859375, 0.175628662109375, 0.1825714111328125, 0.18951416015625, 0.1964569091796875, 0.203399658203125, 0.2103424072265625, 0.21728515625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 7.0, 10.0, 12.0, 19.0, 26.0, 28.0, 50.0, 65.0, 77.0, 98.0, 99.0, 105.0, 118.0, 75.0, 57.0, 47.0, 41.0, 36.0, 17.0, 9.0, 3.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.087890625, -0.08505630493164062, -0.08222198486328125, -0.07938766479492188, -0.0765533447265625, -0.07371902465820312, -0.07088470458984375, -0.06805038452148438, -0.065216064453125, -0.062381744384765625, -0.05954742431640625, -0.056713104248046875, -0.0538787841796875, -0.051044464111328125, -0.04821014404296875, -0.045375823974609375, -0.04254150390625, -0.039707183837890625, -0.03687286376953125, -0.034038543701171875, -0.0312042236328125, -0.028369903564453125, -0.02553558349609375, -0.022701263427734375, -0.019866943359375, -0.017032623291015625, -0.01419830322265625, -0.011363983154296875, -0.0085296630859375, -0.005695343017578125, -0.00286102294921875, -2.6702880859375e-05, 0.0028076171875, 0.005641937255859375, 0.00847625732421875, 0.011310577392578125, 0.0141448974609375, 0.016979217529296875, 0.01981353759765625, 0.022647857666015625, 0.025482177734375, 0.028316497802734375, 0.03115081787109375, 0.033985137939453125, 0.0368194580078125, 0.039653778076171875, 0.04248809814453125, 0.045322418212890625, 0.04815673828125, 0.050991058349609375, 0.05382537841796875, 0.056659698486328125, 0.0594940185546875, 0.062328338623046875, 0.06516265869140625, 0.06799697875976562, 0.070831298828125, 0.07366561889648438, 0.07649993896484375, 0.07933425903320312, 0.0821685791015625, 0.08500289916992188, 0.08783721923828125, 0.09067153930664062, 0.093505859375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 2.0, 2.0, 4.0, 6.0, 11.0, 12.0, 17.0, 23.0, 23.0, 46.0, 47.0, 66.0, 102.0, 140.0, 211.0, 290.0, 456.0, 640.0, 1057.0, 1825.0, 3581.0, 8641.0, 31241.0, 3330202.0, 770759.0, 28403.0, 8147.0, 3509.0, 1794.0, 1019.0, 638.0, 414.0, 269.0, 189.0, 151.0, 99.0, 70.0, 53.0, 29.0, 23.0, 23.0, 15.0, 10.0, 9.0, 4.0, 1.0, 3.0, 5.0, 6.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.2103271484375, -0.20413589477539062, -0.19794464111328125, -0.19175338745117188, -0.1855621337890625, -0.17937088012695312, -0.17317962646484375, -0.16698837280273438, -0.160797119140625, -0.15460586547851562, -0.14841461181640625, -0.14222335815429688, -0.1360321044921875, -0.12984085083007812, -0.12364959716796875, -0.11745834350585938, -0.11126708984375, -0.10507583618164062, -0.09888458251953125, -0.09269332885742188, -0.0865020751953125, -0.08031082153320312, -0.07411956787109375, -0.06792831420898438, -0.061737060546875, -0.055545806884765625, -0.04935455322265625, -0.043163299560546875, -0.0369720458984375, -0.030780792236328125, -0.02458953857421875, -0.018398284912109375, -0.01220703125, -0.006015777587890625, 0.00017547607421875, 0.006366729736328125, 0.0125579833984375, 0.018749237060546875, 0.02494049072265625, 0.031131744384765625, 0.037322998046875, 0.043514251708984375, 0.04970550537109375, 0.055896759033203125, 0.0620880126953125, 0.06827926635742188, 0.07447052001953125, 0.08066177368164062, 0.08685302734375, 0.09304428100585938, 0.09923553466796875, 0.10542678833007812, 0.1116180419921875, 0.11780929565429688, 0.12400054931640625, 0.13019180297851562, 0.136383056640625, 0.14257431030273438, 0.14876556396484375, 0.15495681762695312, 0.1611480712890625, 0.16733932495117188, 0.17353057861328125, 0.17972183227539062, 0.1859130859375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 5.0, 6.0, 8.0, 11.0, 14.0, 28.0, 36.0, 109.0, 728.0, 2829.0, 161.0, 48.0, 37.0, 13.0, 5.0, 8.0, 10.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09521484375, -0.09224796295166016, -0.08928108215332031, -0.08631420135498047, -0.08334732055664062, -0.08038043975830078, -0.07741355895996094, -0.0744466781616211, -0.07147979736328125, -0.0685129165649414, -0.06554603576660156, -0.06257915496826172, -0.059612274169921875, -0.05664539337158203, -0.05367851257324219, -0.050711631774902344, -0.0477447509765625, -0.044777870178222656, -0.04181098937988281, -0.03884410858154297, -0.035877227783203125, -0.03291034698486328, -0.029943466186523438, -0.026976585388183594, -0.02400970458984375, -0.021042823791503906, -0.018075942993164062, -0.015109062194824219, -0.012142181396484375, -0.009175300598144531, -0.0062084197998046875, -0.0032415390014648438, -0.000274658203125, 0.0026922225952148438, 0.0056591033935546875, 0.008625984191894531, 0.011592864990234375, 0.014559745788574219, 0.017526626586914062, 0.020493507385253906, 0.02346038818359375, 0.026427268981933594, 0.029394149780273438, 0.03236103057861328, 0.035327911376953125, 0.03829479217529297, 0.04126167297363281, 0.044228553771972656, 0.0471954345703125, 0.050162315368652344, 0.05312919616699219, 0.05609607696533203, 0.059062957763671875, 0.06202983856201172, 0.06499671936035156, 0.0679636001586914, 0.07093048095703125, 0.0738973617553711, 0.07686424255371094, 0.07983112335205078, 0.08279800415039062, 0.08576488494873047, 0.08873176574707031, 0.09169864654541016, 0.09466552734375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 2.0, 2.0, 8.0, 16.0, 14.0, 10.0, 15.0, 29.0, 35.0, 42.0, 61.0, 92.0, 98.0, 100.0, 102.0, 82.0, 84.0, 62.0, 38.0, 39.0, 25.0, 11.0, 10.0, 6.0, 8.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3083820044994354, -0.29975780844688416, -0.2911336123943329, -0.2825094163417816, -0.27388522028923035, -0.2652610242366791, -0.2566368281841278, -0.24801264703273773, -0.23938845098018646, -0.2307642549276352, -0.22214005887508392, -0.21351586282253265, -0.20489168167114258, -0.1962674856185913, -0.18764328956604004, -0.17901909351348877, -0.1703948974609375, -0.16177070140838623, -0.15314650535583496, -0.1445223093032837, -0.13589811325073242, -0.12727391719818115, -0.11864973604679108, -0.11002553999423981, -0.10140134394168854, -0.09277714788913727, -0.084152951836586, -0.07552876323461533, -0.06690456718206406, -0.05828037112951279, -0.049656178802251816, -0.041031986474990845, -0.03240780532360077, -0.02378361113369465, -0.015159416943788528, -0.006535222753882408, 0.002088971436023712, 0.010713167488574982, 0.019337359815835953, 0.027961552143096924, 0.03658574819564819, 0.04520994424819946, 0.053834136575460434, 0.062458328902721405, 0.07108252495527267, 0.07970672100782394, 0.08833090960979462, 0.09695510566234589, 0.10557930171489716, 0.11420349776744843, 0.1228276938199997, 0.13145188987255096, 0.14007607102394104, 0.1487002670764923, 0.15732446312904358, 0.16594865918159485, 0.17457285523414612, 0.1831970512866974, 0.19182124733924866, 0.20044544339179993, 0.2090696394443512, 0.21769383549690247, 0.22631801664829254, 0.2349422127008438, 0.24356640875339508]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 10.0, 3.0, 6.0, 18.0, 14.0, 14.0, 20.0, 18.0, 28.0, 30.0, 37.0, 28.0, 33.0, 51.0, 43.0, 50.0, 36.0, 49.0, 34.0, 52.0, 41.0, 53.0, 46.0, 31.0, 47.0, 36.0, 22.0, 26.0, 25.0, 21.0, 10.0, 19.0, 12.0, 12.0, 3.0, 6.0, 6.0, 2.0, 4.0, 0.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.18508309125900269, -0.17879697680473328, -0.17251084744930267, -0.16622473299503326, -0.15993860363960266, -0.15365248918533325, -0.14736637473106384, -0.14108026027679443, -0.13479413092136383, -0.12850801646709442, -0.12222188711166382, -0.11593577265739441, -0.1096496507525444, -0.1033635288476944, -0.09707741439342499, -0.09079129248857498, -0.08450517058372498, -0.07821904867887497, -0.07193292677402496, -0.06564681231975555, -0.05936069041490555, -0.05307456851005554, -0.046788450330495834, -0.04050233215093613, -0.03421621024608612, -0.027930090203881264, -0.021643970161676407, -0.01535785011947155, -0.009071730077266693, -0.002785608172416687, 0.0035005100071430206, 0.009786628186702728, 0.016072750091552734, 0.02235887013375759, 0.028644990175962448, 0.034931108355522156, 0.04121723026037216, 0.04750335216522217, 0.053789470344781876, 0.06007558852434158, 0.06636171042919159, 0.0726478323340416, 0.0789339542388916, 0.08522006869316101, 0.09150619059801102, 0.09779231250286102, 0.10407842695713043, 0.11036454886198044, 0.11665067076683044, 0.12293679267168045, 0.12922291457653046, 0.13550902903079987, 0.14179515838623047, 0.14808127284049988, 0.1543673872947693, 0.1606535017490387, 0.1669396311044693, 0.1732257455587387, 0.1795118749141693, 0.18579798936843872, 0.19208410382270813, 0.19837023317813873, 0.20465634763240814, 0.21094247698783875, 0.21722859144210815]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 8.0, 10.0, 29.0, 39.0, 41.0, 89.0, 154.0, 230.0, 458.0, 851.0, 1650.0, 3693.0, 10066.0, 32596.0, 131757.0, 509375.0, 269181.0, 60745.0, 16936.0, 5818.0, 2379.0, 1099.0, 585.0, 309.0, 182.0, 101.0, 64.0, 42.0, 24.0, 10.0, 14.0, 7.0, 3.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1624755859375, -0.1570110321044922, -0.15154647827148438, -0.14608192443847656, -0.14061737060546875, -0.13515281677246094, -0.12968826293945312, -0.12422370910644531, -0.1187591552734375, -0.11329460144042969, -0.10783004760742188, -0.10236549377441406, -0.09690093994140625, -0.09143638610839844, -0.08597183227539062, -0.08050727844238281, -0.075042724609375, -0.06957817077636719, -0.06411361694335938, -0.05864906311035156, -0.05318450927734375, -0.04771995544433594, -0.042255401611328125, -0.03679084777832031, -0.0313262939453125, -0.025861740112304688, -0.020397186279296875, -0.014932632446289062, -0.00946807861328125, -0.0040035247802734375, 0.001461029052734375, 0.0069255828857421875, 0.01239013671875, 0.017854690551757812, 0.023319244384765625, 0.028783798217773438, 0.03424835205078125, 0.03971290588378906, 0.045177459716796875, 0.05064201354980469, 0.0561065673828125, 0.06157112121582031, 0.06703567504882812, 0.07250022888183594, 0.07796478271484375, 0.08342933654785156, 0.08889389038085938, 0.09435844421386719, 0.099822998046875, 0.10528755187988281, 0.11075210571289062, 0.11621665954589844, 0.12168121337890625, 0.12714576721191406, 0.13261032104492188, 0.1380748748779297, 0.1435394287109375, 0.1490039825439453, 0.15446853637695312, 0.15993309020996094, 0.16539764404296875, 0.17086219787597656, 0.17632675170898438, 0.1817913055419922, 0.187255859375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 8.0, 10.0, 21.0, 23.0, 29.0, 49.0, 56.0, 81.0, 85.0, 103.0, 85.0, 107.0, 94.0, 80.0, 50.0, 42.0, 25.0, 18.0, 18.0, 11.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10992431640625, -0.1069021224975586, -0.10387992858886719, -0.10085773468017578, -0.09783554077148438, -0.09481334686279297, -0.09179115295410156, -0.08876895904541016, -0.08574676513671875, -0.08272457122802734, -0.07970237731933594, -0.07668018341064453, -0.07365798950195312, -0.07063579559326172, -0.06761360168457031, -0.0645914077758789, -0.0615692138671875, -0.058547019958496094, -0.05552482604980469, -0.05250263214111328, -0.049480438232421875, -0.04645824432373047, -0.04343605041503906, -0.040413856506347656, -0.03739166259765625, -0.034369468688964844, -0.03134727478027344, -0.02832508087158203, -0.025302886962890625, -0.02228069305419922, -0.019258499145507812, -0.016236305236816406, -0.013214111328125, -0.010191917419433594, -0.0071697235107421875, -0.004147529602050781, -0.001125335693359375, 0.0018968582153320312, 0.0049190521240234375, 0.007941246032714844, 0.01096343994140625, 0.013985633850097656, 0.017007827758789062, 0.02003002166748047, 0.023052215576171875, 0.02607440948486328, 0.029096603393554688, 0.032118797302246094, 0.0351409912109375, 0.038163185119628906, 0.04118537902832031, 0.04420757293701172, 0.047229766845703125, 0.05025196075439453, 0.05327415466308594, 0.056296348571777344, 0.05931854248046875, 0.062340736389160156, 0.06536293029785156, 0.06838512420654297, 0.07140731811523438, 0.07442951202392578, 0.07745170593261719, 0.0804738998413086, 0.08349609375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 7.0, 4.0, 6.0, 10.0, 8.0, 13.0, 12.0, 23.0, 45.0, 49.0, 60.0, 78.0, 99.0, 168.0, 234.0, 323.0, 492.0, 843.0, 1583.0, 3161.0, 7710.0, 24385.0, 120487.0, 620478.0, 211181.0, 37533.0, 10607.0, 4096.0, 1963.0, 1004.0, 614.0, 363.0, 288.0, 164.0, 117.0, 90.0, 73.0, 53.0, 33.0, 27.0, 25.0, 11.0, 11.0, 10.0, 4.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.16943359375, -0.164398193359375, -0.15936279296875, -0.154327392578125, -0.1492919921875, -0.144256591796875, -0.13922119140625, -0.134185791015625, -0.129150390625, -0.124114990234375, -0.11907958984375, -0.114044189453125, -0.1090087890625, -0.103973388671875, -0.09893798828125, -0.093902587890625, -0.0888671875, -0.083831787109375, -0.07879638671875, -0.073760986328125, -0.0687255859375, -0.063690185546875, -0.05865478515625, -0.053619384765625, -0.048583984375, -0.043548583984375, -0.03851318359375, -0.033477783203125, -0.0284423828125, -0.023406982421875, -0.01837158203125, -0.013336181640625, -0.00830078125, -0.003265380859375, 0.00177001953125, 0.006805419921875, 0.0118408203125, 0.016876220703125, 0.02191162109375, 0.026947021484375, 0.031982421875, 0.037017822265625, 0.04205322265625, 0.047088623046875, 0.0521240234375, 0.057159423828125, 0.06219482421875, 0.067230224609375, 0.072265625, 0.077301025390625, 0.08233642578125, 0.087371826171875, 0.0924072265625, 0.097442626953125, 0.10247802734375, 0.107513427734375, 0.112548828125, 0.117584228515625, 0.12261962890625, 0.127655029296875, 0.1326904296875, 0.137725830078125, 0.14276123046875, 0.147796630859375, 0.15283203125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 7.0, 3.0, 7.0, 5.0, 5.0, 16.0, 13.0, 13.0, 16.0, 26.0, 32.0, 21.0, 29.0, 44.0, 36.0, 31.0, 40.0, 34.0, 33.0, 44.0, 39.0, 40.0, 29.0, 38.0, 38.0, 37.0, 31.0, 32.0, 35.0, 34.0, 19.0, 24.0, 22.0, 21.0, 13.0, 15.0, 16.0, 17.0, 7.0, 5.0, 7.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.1904296875, -0.1849346160888672, -0.17943954467773438, -0.17394447326660156, -0.16844940185546875, -0.16295433044433594, -0.15745925903320312, -0.1519641876220703, -0.1464691162109375, -0.1409740447998047, -0.13547897338867188, -0.12998390197753906, -0.12448883056640625, -0.11899375915527344, -0.11349868774414062, -0.10800361633300781, -0.102508544921875, -0.09701347351074219, -0.09151840209960938, -0.08602333068847656, -0.08052825927734375, -0.07503318786621094, -0.06953811645507812, -0.06404304504394531, -0.0585479736328125, -0.05305290222167969, -0.047557830810546875, -0.04206275939941406, -0.03656768798828125, -0.031072616577148438, -0.025577545166015625, -0.020082473754882812, -0.01458740234375, -0.009092330932617188, -0.003597259521484375, 0.0018978118896484375, 0.00739288330078125, 0.012887954711914062, 0.018383026123046875, 0.023878097534179688, 0.0293731689453125, 0.03486824035644531, 0.040363311767578125, 0.04585838317871094, 0.05135345458984375, 0.05684852600097656, 0.062343597412109375, 0.06783866882324219, 0.073333740234375, 0.07882881164550781, 0.08432388305664062, 0.08981895446777344, 0.09531402587890625, 0.10080909729003906, 0.10630416870117188, 0.11179924011230469, 0.1172943115234375, 0.12278938293457031, 0.12828445434570312, 0.13377952575683594, 0.13927459716796875, 0.14476966857910156, 0.15026473999023438, 0.1557598114013672, 0.1612548828125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 4.0, 6.0, 6.0, 5.0, 4.0, 6.0, 5.0, 11.0, 12.0, 27.0, 31.0, 34.0, 64.0, 115.0, 154.0, 230.0, 349.0, 626.0, 1251.0, 2620.0, 6578.0, 22242.0, 148853.0, 698580.0, 134285.0, 20900.0, 6173.0, 2480.0, 1218.0, 634.0, 377.0, 241.0, 130.0, 99.0, 57.0, 48.0, 26.0, 19.0, 18.0, 9.0, 7.0, 5.0, 7.0, 3.0, 2.0, 4.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06658935546875, -0.06440448760986328, -0.06221961975097656, -0.060034751892089844, -0.057849884033203125, -0.055665016174316406, -0.05348014831542969, -0.05129528045654297, -0.04911041259765625, -0.04692554473876953, -0.04474067687988281, -0.042555809020996094, -0.040370941162109375, -0.038186073303222656, -0.03600120544433594, -0.03381633758544922, -0.0316314697265625, -0.02944660186767578, -0.027261734008789062, -0.025076866149902344, -0.022891998291015625, -0.020707130432128906, -0.018522262573242188, -0.01633739471435547, -0.01415252685546875, -0.011967658996582031, -0.009782791137695312, -0.007597923278808594, -0.005413055419921875, -0.0032281875610351562, -0.0010433197021484375, 0.0011415481567382812, 0.003326416015625, 0.005511283874511719, 0.0076961517333984375, 0.009881019592285156, 0.012065887451171875, 0.014250755310058594, 0.016435623168945312, 0.01862049102783203, 0.02080535888671875, 0.02299022674560547, 0.025175094604492188, 0.027359962463378906, 0.029544830322265625, 0.031729698181152344, 0.03391456604003906, 0.03609943389892578, 0.0382843017578125, 0.04046916961669922, 0.04265403747558594, 0.044838905334472656, 0.047023773193359375, 0.049208641052246094, 0.05139350891113281, 0.05357837677001953, 0.05576324462890625, 0.05794811248779297, 0.06013298034667969, 0.062317848205566406, 0.06450271606445312, 0.06668758392333984, 0.06887245178222656, 0.07105731964111328, 0.0732421875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 7.0, 10.0, 10.0, 15.0, 19.0, 45.0, 42.0, 57.0, 66.0, 100.0, 162.0, 122.0, 95.0, 73.0, 61.0, 24.0, 31.0, 15.0, 12.0, 12.0, 10.0, 5.0, 5.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.500150680541992e-05, -4.3623149394989014e-05, -4.2244791984558105e-05, -4.08664345741272e-05, -3.948807716369629e-05, -3.810971975326538e-05, -3.673136234283447e-05, -3.5353004932403564e-05, -3.3974647521972656e-05, -3.259629011154175e-05, -3.121793270111084e-05, -2.983957529067993e-05, -2.8461217880249023e-05, -2.7082860469818115e-05, -2.5704503059387207e-05, -2.43261456489563e-05, -2.294778823852539e-05, -2.1569430828094482e-05, -2.0191073417663574e-05, -1.8812716007232666e-05, -1.7434358596801758e-05, -1.605600118637085e-05, -1.4677643775939941e-05, -1.3299286365509033e-05, -1.1920928955078125e-05, -1.0542571544647217e-05, -9.164214134216309e-06, -7.7858567237854e-06, -6.407499313354492e-06, -5.029141902923584e-06, -3.6507844924926758e-06, -2.2724270820617676e-06, -8.940696716308594e-07, 4.842877388000488e-07, 1.862645149230957e-06, 3.2410025596618652e-06, 4.6193599700927734e-06, 5.997717380523682e-06, 7.37607479095459e-06, 8.754432201385498e-06, 1.0132789611816406e-05, 1.1511147022247314e-05, 1.2889504432678223e-05, 1.4267861843109131e-05, 1.564621925354004e-05, 1.7024576663970947e-05, 1.8402934074401855e-05, 1.9781291484832764e-05, 2.1159648895263672e-05, 2.253800630569458e-05, 2.3916363716125488e-05, 2.5294721126556396e-05, 2.6673078536987305e-05, 2.8051435947418213e-05, 2.942979335784912e-05, 3.080815076828003e-05, 3.218650817871094e-05, 3.3564865589141846e-05, 3.4943222999572754e-05, 3.632158041000366e-05, 3.769993782043457e-05, 3.907829523086548e-05, 4.045665264129639e-05, 4.1835010051727295e-05, 4.32133674621582e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 6.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 4.0, 10.0, 13.0, 19.0, 46.0, 62.0, 128.0, 225.0, 495.0, 1216.0, 4059.0, 21049.0, 417327.0, 571089.0, 25811.0, 4508.0, 1387.0, 516.0, 247.0, 132.0, 69.0, 57.0, 26.0, 13.0, 12.0, 7.0, 10.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08404541015625, -0.0805501937866211, -0.07705497741699219, -0.07355976104736328, -0.07006454467773438, -0.06656932830810547, -0.06307411193847656, -0.059578895568847656, -0.05608367919921875, -0.052588462829589844, -0.04909324645996094, -0.04559803009033203, -0.042102813720703125, -0.03860759735107422, -0.03511238098144531, -0.031617164611816406, -0.0281219482421875, -0.024626731872558594, -0.021131515502929688, -0.01763629913330078, -0.014141082763671875, -0.010645866394042969, -0.0071506500244140625, -0.0036554336547851562, -0.00016021728515625, 0.0033349990844726562, 0.0068302154541015625, 0.010325431823730469, 0.013820648193359375, 0.01731586456298828, 0.020811080932617188, 0.024306297302246094, 0.027801513671875, 0.031296730041503906, 0.03479194641113281, 0.03828716278076172, 0.041782379150390625, 0.04527759552001953, 0.04877281188964844, 0.052268028259277344, 0.05576324462890625, 0.059258460998535156, 0.06275367736816406, 0.06624889373779297, 0.06974411010742188, 0.07323932647705078, 0.07673454284667969, 0.0802297592163086, 0.0837249755859375, 0.0872201919555664, 0.09071540832519531, 0.09421062469482422, 0.09770584106445312, 0.10120105743408203, 0.10469627380371094, 0.10819149017333984, 0.11168670654296875, 0.11518192291259766, 0.11867713928222656, 0.12217235565185547, 0.12566757202148438, 0.12916278839111328, 0.1326580047607422, 0.1361532211303711, 0.1396484375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 3.0, 6.0, 14.0, 15.0, 22.0, 34.0, 50.0, 70.0, 95.0, 123.0, 125.0, 110.0, 78.0, 76.0, 43.0, 38.0, 23.0, 17.0, 16.0, 8.0, 4.0, 5.0, 5.0, 9.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08782958984375, -0.0852804183959961, -0.08273124694824219, -0.08018207550048828, -0.07763290405273438, -0.07508373260498047, -0.07253456115722656, -0.06998538970947266, -0.06743621826171875, -0.06488704681396484, -0.06233787536621094, -0.05978870391845703, -0.057239532470703125, -0.05469036102294922, -0.05214118957519531, -0.049592018127441406, -0.0470428466796875, -0.044493675231933594, -0.04194450378417969, -0.03939533233642578, -0.036846160888671875, -0.03429698944091797, -0.03174781799316406, -0.029198646545410156, -0.02664947509765625, -0.024100303649902344, -0.021551132202148438, -0.01900196075439453, -0.016452789306640625, -0.013903617858886719, -0.011354446411132812, -0.008805274963378906, -0.006256103515625, -0.0037069320678710938, -0.0011577606201171875, 0.0013914108276367188, 0.003940582275390625, 0.006489753723144531, 0.009038925170898438, 0.011588096618652344, 0.01413726806640625, 0.016686439514160156, 0.019235610961914062, 0.02178478240966797, 0.024333953857421875, 0.02688312530517578, 0.029432296752929688, 0.031981468200683594, 0.0345306396484375, 0.037079811096191406, 0.03962898254394531, 0.04217815399169922, 0.044727325439453125, 0.04727649688720703, 0.04982566833496094, 0.052374839782714844, 0.05492401123046875, 0.057473182678222656, 0.06002235412597656, 0.06257152557373047, 0.06512069702148438, 0.06766986846923828, 0.07021903991699219, 0.0727682113647461, 0.0753173828125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 8.0, 6.0, 31.0, 38.0, 109.0, 185.0, 242.0, 197.0, 113.0, 45.0, 20.0, 4.0, 1.0, 6.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.017937660217285, -2.946852922439575, -2.8757681846618652, -2.8046836853027344, -2.7335989475250244, -2.6625142097473145, -2.5914294719696045, -2.5203447341918945, -2.4492602348327637, -2.3781754970550537, -2.3070907592773438, -2.236006259918213, -2.164921522140503, -2.093836784362793, -2.022752046585083, -1.9516674280166626, -1.8805826902389526, -1.8094979524612427, -1.7384133338928223, -1.6673285961151123, -1.596243977546692, -1.525159239768982, -1.4540746212005615, -1.3829898834228516, -1.3119051456451416, -1.2408204078674316, -1.1697357892990112, -1.0986510515213013, -1.0275664329528809, -0.9564816951751709, -0.8853970170021057, -0.8143123388290405, -0.7432276010513306, -0.6721429228782654, -0.6010582447052002, -0.5299735069274902, -0.45888885855674744, -0.38780418038368225, -0.3167194724082947, -0.2456347942352295, -0.1745501160621643, -0.10346543043851852, -0.03238074481487274, 0.03870394825935364, 0.10978862643241882, 0.180873304605484, 0.2519580125808716, 0.32304269075393677, 0.39412736892700195, 0.46521204710006714, 0.5362967252731323, 0.6073814630508423, 0.6784660816192627, 0.7495508193969727, 0.8206354975700378, 0.891720175743103, 0.9628048539161682, 1.0338895320892334, 1.1049742698669434, 1.1760588884353638, 1.2471436262130737, 1.3182282447814941, 1.389312982559204, 1.460397720336914, 1.5314823389053345]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 3.0, 3.0, 1.0, 6.0, 3.0, 9.0, 5.0, 11.0, 6.0, 14.0, 13.0, 15.0, 21.0, 34.0, 34.0, 27.0, 23.0, 39.0, 50.0, 39.0, 53.0, 48.0, 60.0, 67.0, 37.0, 58.0, 48.0, 41.0, 28.0, 34.0, 27.0, 33.0, 17.0, 13.0, 25.0, 11.0, 16.0, 5.0, 5.0, 7.0, 7.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9634849429130554, -0.9339351654052734, -0.9043853282928467, -0.8748355507850647, -0.8452857732772827, -0.815735936164856, -0.786186158657074, -0.756636381149292, -0.72708660364151, -0.697536826133728, -0.6679869890213013, -0.6384372115135193, -0.6088874340057373, -0.5793375968933105, -0.5497878193855286, -0.5202380418777466, -0.4906882345676422, -0.46113842725753784, -0.43158864974975586, -0.4020388424396515, -0.3724890649318695, -0.34293925762176514, -0.31338948011398315, -0.2838396728038788, -0.2542898654937744, -0.22474007308483124, -0.19519028067588806, -0.1656404733657837, -0.1360906958580017, -0.10654088854789734, -0.07699109613895416, -0.047441303730010986, -0.017891526222229004, 0.011658268049359322, 0.04120806232094765, 0.07075785845518112, 0.1003076508641243, 0.12985745072364807, 0.15940724313259125, 0.18895703554153442, 0.2185068279504776, 0.24805662035942078, 0.27760642766952515, 0.30715620517730713, 0.3367060124874115, 0.36625581979751587, 0.39580559730529785, 0.42535537481307983, 0.4549051821231842, 0.4844549894332886, 0.5140047669410706, 0.5435545444488525, 0.5731043815612793, 0.6026541590690613, 0.6322039365768433, 0.66175377368927, 0.691303551197052, 0.720853328704834, 0.7504031658172607, 0.7799529433250427, 0.8095027208328247, 0.8390525579452515, 0.8686023354530334, 0.8981521129608154, 0.9277018904685974]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 6.0, 2.0, 5.0, 9.0, 11.0, 13.0, 26.0, 25.0, 36.0, 49.0, 67.0, 92.0, 113.0, 150.0, 273.0, 346.0, 499.0, 781.0, 1244.0, 2184.0, 3952.0, 7744.0, 16949.0, 46525.0, 209098.0, 2639896.0, 1088449.0, 116696.0, 31916.0, 12832.0, 6083.0, 3243.0, 1764.0, 1113.0, 665.0, 446.0, 275.0, 187.0, 149.0, 84.0, 86.0, 46.0, 42.0, 22.0, 27.0, 18.0, 15.0, 12.0, 4.0, 7.0, 4.0, 2.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08306884765625, -0.08018779754638672, -0.07730674743652344, -0.07442569732666016, -0.07154464721679688, -0.0686635971069336, -0.06578254699707031, -0.06290149688720703, -0.06002044677734375, -0.05713939666748047, -0.05425834655761719, -0.051377296447753906, -0.048496246337890625, -0.045615196228027344, -0.04273414611816406, -0.03985309600830078, -0.0369720458984375, -0.03409099578857422, -0.031209945678710938, -0.028328895568847656, -0.025447845458984375, -0.022566795349121094, -0.019685745239257812, -0.01680469512939453, -0.01392364501953125, -0.011042594909667969, -0.008161544799804688, -0.005280494689941406, -0.002399444580078125, 0.00048160552978515625, 0.0033626556396484375, 0.006243705749511719, 0.009124755859375, 0.012005805969238281, 0.014886856079101562, 0.017767906188964844, 0.020648956298828125, 0.023530006408691406, 0.026411056518554688, 0.02929210662841797, 0.03217315673828125, 0.03505420684814453, 0.03793525695800781, 0.040816307067871094, 0.043697357177734375, 0.046578407287597656, 0.04945945739746094, 0.05234050750732422, 0.0552215576171875, 0.05810260772705078, 0.06098365783691406, 0.06386470794677734, 0.06674575805664062, 0.0696268081665039, 0.07250785827636719, 0.07538890838623047, 0.07826995849609375, 0.08115100860595703, 0.08403205871582031, 0.0869131088256836, 0.08979415893554688, 0.09267520904541016, 0.09555625915527344, 0.09843730926513672, 0.101318359375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 1.0, 4.0, 3.0, 3.0, 6.0, 8.0, 7.0, 12.0, 8.0, 12.0, 9.0, 14.0, 19.0, 25.0, 17.0, 26.0, 22.0, 22.0, 25.0, 32.0, 31.0, 28.0, 38.0, 39.0, 36.0, 35.0, 51.0, 20.0, 44.0, 43.0, 33.0, 42.0, 40.0, 22.0, 28.0, 20.0, 30.0, 23.0, 18.0, 15.0, 17.0, 15.0, 11.0, 12.0, 9.0, 10.0, 4.0, 3.0, 4.0, 4.0, 5.0, 2.0, 1.0, 3.0], "bins": [-0.03936767578125, -0.03827214241027832, -0.03717660903930664, -0.03608107566833496, -0.03498554229736328, -0.0338900089263916, -0.03279447555541992, -0.03169894218444824, -0.030603408813476562, -0.029507875442504883, -0.028412342071533203, -0.027316808700561523, -0.026221275329589844, -0.025125741958618164, -0.024030208587646484, -0.022934675216674805, -0.021839141845703125, -0.020743608474731445, -0.019648075103759766, -0.018552541732788086, -0.017457008361816406, -0.016361474990844727, -0.015265941619873047, -0.014170408248901367, -0.013074874877929688, -0.011979341506958008, -0.010883808135986328, -0.009788274765014648, -0.008692741394042969, -0.007597208023071289, -0.006501674652099609, -0.00540614128112793, -0.00431060791015625, -0.0032150745391845703, -0.0021195411682128906, -0.001024007797241211, 7.152557373046875e-05, 0.0011670589447021484, 0.002262592315673828, 0.003358125686645508, 0.0044536590576171875, 0.005549192428588867, 0.006644725799560547, 0.0077402591705322266, 0.008835792541503906, 0.009931325912475586, 0.011026859283447266, 0.012122392654418945, 0.013217926025390625, 0.014313459396362305, 0.015408992767333984, 0.016504526138305664, 0.017600059509277344, 0.018695592880249023, 0.019791126251220703, 0.020886659622192383, 0.021982192993164062, 0.023077726364135742, 0.024173259735107422, 0.0252687931060791, 0.02636432647705078, 0.02745985984802246, 0.02855539321899414, 0.02965092658996582, 0.0307464599609375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 16.0, 19.0, 20.0, 35.0, 59.0, 94.0, 128.0, 223.0, 410.0, 770.0, 1651.0, 3865.0, 11646.0, 47609.0, 518028.0, 3424480.0, 147959.0, 24850.0, 7170.0, 2714.0, 1160.0, 556.0, 330.0, 169.0, 117.0, 73.0, 36.0, 20.0, 18.0, 14.0, 15.0, 2.0, 10.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.156494140625, -0.15132713317871094, -0.14616012573242188, -0.1409931182861328, -0.13582611083984375, -0.1306591033935547, -0.12549209594726562, -0.12032508850097656, -0.1151580810546875, -0.10999107360839844, -0.10482406616210938, -0.09965705871582031, -0.09449005126953125, -0.08932304382324219, -0.08415603637695312, -0.07898902893066406, -0.073822021484375, -0.06865501403808594, -0.06348800659179688, -0.05832099914550781, -0.05315399169921875, -0.04798698425292969, -0.042819976806640625, -0.03765296936035156, -0.0324859619140625, -0.027318954467773438, -0.022151947021484375, -0.016984939575195312, -0.01181793212890625, -0.0066509246826171875, -0.001483917236328125, 0.0036830902099609375, 0.00885009765625, 0.014017105102539062, 0.019184112548828125, 0.024351119995117188, 0.02951812744140625, 0.03468513488769531, 0.039852142333984375, 0.04501914978027344, 0.0501861572265625, 0.05535316467285156, 0.060520172119140625, 0.06568717956542969, 0.07085418701171875, 0.07602119445800781, 0.08118820190429688, 0.08635520935058594, 0.091522216796875, 0.09668922424316406, 0.10185623168945312, 0.10702323913574219, 0.11219024658203125, 0.11735725402832031, 0.12252426147460938, 0.12769126892089844, 0.1328582763671875, 0.13802528381347656, 0.14319229125976562, 0.1483592987060547, 0.15352630615234375, 0.1586933135986328, 0.16386032104492188, 0.16902732849121094, 0.1741943359375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 13.0, 12.0, 17.0, 10.0, 18.0, 40.0, 65.0, 113.0, 186.0, 323.0, 756.0, 1196.0, 599.0, 287.0, 144.0, 82.0, 54.0, 41.0, 25.0, 20.0, 13.0, 14.0, 11.0, 3.0, 6.0, 2.0, 2.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1390380859375, -0.1339569091796875, -0.128875732421875, -0.1237945556640625, -0.11871337890625, -0.1136322021484375, -0.108551025390625, -0.1034698486328125, -0.098388671875, -0.0933074951171875, -0.088226318359375, -0.0831451416015625, -0.07806396484375, -0.0729827880859375, -0.067901611328125, -0.0628204345703125, -0.0577392578125, -0.0526580810546875, -0.047576904296875, -0.0424957275390625, -0.03741455078125, -0.0323333740234375, -0.027252197265625, -0.0221710205078125, -0.01708984375, -0.0120086669921875, -0.006927490234375, -0.0018463134765625, 0.00323486328125, 0.0083160400390625, 0.013397216796875, 0.0184783935546875, 0.0235595703125, 0.0286407470703125, 0.033721923828125, 0.0388031005859375, 0.04388427734375, 0.0489654541015625, 0.054046630859375, 0.0591278076171875, 0.064208984375, 0.0692901611328125, 0.074371337890625, 0.0794525146484375, 0.08453369140625, 0.0896148681640625, 0.094696044921875, 0.0997772216796875, 0.1048583984375, 0.1099395751953125, 0.115020751953125, 0.1201019287109375, 0.12518310546875, 0.1302642822265625, 0.135345458984375, 0.1404266357421875, 0.1455078125, 0.1505889892578125, 0.155670166015625, 0.1607513427734375, 0.16583251953125, 0.1709136962890625, 0.175994873046875, 0.1810760498046875, 0.1861572265625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 12.0, 24.0, 84.0, 291.0, 355.0, 151.0, 49.0, 17.0, 12.0, 7.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9909154772758484, -0.9020388126373291, -0.8131622076034546, -0.7242856025695801, -0.6354089379310608, -0.5465322732925415, -0.457655668258667, -0.3687790036201477, -0.2799023985862732, -0.1910257637500763, -0.1021491289138794, -0.013272494077682495, 0.0756041407585144, 0.1644807755947113, 0.2533574104309082, 0.3422340750694275, 0.431110680103302, 0.5199873447418213, 0.6088639497756958, 0.6977405548095703, 0.7866172194480896, 0.8754938840866089, 0.9643704891204834, 1.0532472133636475, 1.1421236991882324, 1.231000304222107, 1.3198769092559814, 1.4087536334991455, 1.49763023853302, 1.5865068435668945, 1.6753835678100586, 1.764260172843933, 1.8531370162963867, 1.9420136213302612, 2.0308902263641357, 2.1197669506073, 2.2086434364318848, 2.297520160675049, 2.386396884918213, 2.475273609161377, 2.564150094985962, 2.653026819229126, 2.741903305053711, 2.830780029296875, 2.919656753540039, 3.008533239364624, 3.097409963607788, 3.186286449432373, 3.275163173675537, 3.364039897918701, 3.452916383743286, 3.54179310798645, 3.630669593811035, 3.719546318054199, 3.8084230422973633, 3.8972997665405273, 3.9861762523651123, 4.075052738189697, 4.163929462432861, 4.252806186676025, 4.3416829109191895, 4.4305596351623535, 4.519435882568359, 4.608312606811523, 4.6971893310546875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 7.0, 4.0, 6.0, 5.0, 11.0, 14.0, 22.0, 26.0, 25.0, 36.0, 33.0, 45.0, 47.0, 58.0, 49.0, 50.0, 77.0, 64.0, 50.0, 51.0, 52.0, 55.0, 41.0, 39.0, 32.0, 20.0, 22.0, 20.0, 12.0, 14.0, 8.0, 4.0, 1.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6463693380355835, -0.6231992840766907, -0.6000292897224426, -0.5768592357635498, -0.553689181804657, -0.5305191278457642, -0.5073491334915161, -0.4841790795326233, -0.46100902557373047, -0.43783900141716003, -0.4146689474582672, -0.3914989233016968, -0.36832886934280396, -0.3451588451862335, -0.3219888210296631, -0.29881876707077026, -0.27564874291419983, -0.2524787187576294, -0.22930866479873657, -0.20613864064216614, -0.18296858668327332, -0.15979856252670288, -0.13662852346897125, -0.11345848441123962, -0.090288445353508, -0.06711840629577637, -0.04394837096333504, -0.020778335630893707, 0.002391703426837921, 0.02556174248456955, 0.04873177409172058, 0.07190181314945221, 0.09507185220718384, 0.11824189126491547, 0.1414119303226471, 0.16458195447921753, 0.18775200843811035, 0.2109220325946808, 0.23409207165241241, 0.25726211071014404, 0.28043216466903687, 0.3036021888256073, 0.3267722427845001, 0.34994226694107056, 0.3731123208999634, 0.3962823450565338, 0.41945236921310425, 0.44262242317199707, 0.4657924473285675, 0.48896247148513794, 0.5121325254440308, 0.5353025794029236, 0.5584725737571716, 0.5816426277160645, 0.6048126816749573, 0.6279827356338501, 0.6511527299880981, 0.674322783946991, 0.697492778301239, 0.7206628322601318, 0.7438328862190247, 0.7670029401779175, 0.7901729345321655, 0.8133429884910583, 0.8365130424499512]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 10.0, 10.0, 19.0, 24.0, 34.0, 39.0, 70.0, 90.0, 165.0, 234.0, 440.0, 783.0, 1521.0, 2917.0, 5558.0, 12210.0, 29696.0, 84013.0, 305158.0, 413463.0, 121500.0, 40010.0, 15791.0, 7275.0, 3478.0, 1731.0, 952.0, 523.0, 314.0, 180.0, 112.0, 78.0, 40.0, 31.0, 23.0, 18.0, 14.0, 10.0, 7.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.1337890625, -0.13018798828125, -0.1265869140625, -0.12298583984375, -0.119384765625, -0.11578369140625, -0.1121826171875, -0.10858154296875, -0.10498046875, -0.10137939453125, -0.0977783203125, -0.09417724609375, -0.090576171875, -0.08697509765625, -0.0833740234375, -0.07977294921875, -0.076171875, -0.07257080078125, -0.0689697265625, -0.06536865234375, -0.061767578125, -0.05816650390625, -0.0545654296875, -0.05096435546875, -0.04736328125, -0.04376220703125, -0.0401611328125, -0.03656005859375, -0.032958984375, -0.02935791015625, -0.0257568359375, -0.02215576171875, -0.0185546875, -0.01495361328125, -0.0113525390625, -0.00775146484375, -0.004150390625, -0.00054931640625, 0.0030517578125, 0.00665283203125, 0.01025390625, 0.01385498046875, 0.0174560546875, 0.02105712890625, 0.024658203125, 0.02825927734375, 0.0318603515625, 0.03546142578125, 0.0390625, 0.04266357421875, 0.0462646484375, 0.04986572265625, 0.053466796875, 0.05706787109375, 0.0606689453125, 0.06427001953125, 0.06787109375, 0.07147216796875, 0.0750732421875, 0.07867431640625, 0.082275390625, 0.08587646484375, 0.0894775390625, 0.09307861328125, 0.0966796875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 3.0, 2.0, 7.0, 14.0, 9.0, 19.0, 15.0, 25.0, 23.0, 21.0, 30.0, 27.0, 41.0, 33.0, 50.0, 52.0, 60.0, 40.0, 44.0, 59.0, 58.0, 37.0, 51.0, 39.0, 43.0, 30.0, 26.0, 21.0, 29.0, 14.0, 16.0, 15.0, 10.0, 11.0, 9.0, 6.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039093017578125, -0.03761863708496094, -0.036144256591796875, -0.03466987609863281, -0.03319549560546875, -0.03172111511230469, -0.030246734619140625, -0.028772354125976562, -0.0272979736328125, -0.025823593139648438, -0.024349212646484375, -0.022874832153320312, -0.02140045166015625, -0.019926071166992188, -0.018451690673828125, -0.016977310180664062, -0.0155029296875, -0.014028549194335938, -0.012554168701171875, -0.011079788208007812, -0.00960540771484375, -0.008131027221679688, -0.006656646728515625, -0.0051822662353515625, -0.0037078857421875, -0.0022335052490234375, -0.000759124755859375, 0.0007152557373046875, 0.00218963623046875, 0.0036640167236328125, 0.005138397216796875, 0.0066127777099609375, 0.008087158203125, 0.009561538696289062, 0.011035919189453125, 0.012510299682617188, 0.01398468017578125, 0.015459060668945312, 0.016933441162109375, 0.018407821655273438, 0.0198822021484375, 0.021356582641601562, 0.022830963134765625, 0.024305343627929688, 0.02577972412109375, 0.027254104614257812, 0.028728485107421875, 0.030202865600585938, 0.03167724609375, 0.03315162658691406, 0.034626007080078125, 0.03610038757324219, 0.03757476806640625, 0.03904914855957031, 0.040523529052734375, 0.04199790954589844, 0.0434722900390625, 0.04494667053222656, 0.046421051025390625, 0.04789543151855469, 0.04936981201171875, 0.05084419250488281, 0.052318572998046875, 0.05379295349121094, 0.055267333984375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 8.0, 8.0, 7.0, 12.0, 15.0, 31.0, 54.0, 86.0, 110.0, 192.0, 311.0, 522.0, 1045.0, 2342.0, 7103.0, 37704.0, 661829.0, 303899.0, 23954.0, 5345.0, 1886.0, 925.0, 465.0, 256.0, 162.0, 92.0, 51.0, 54.0, 28.0, 23.0, 15.0, 9.0, 9.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2493896484375, -0.24224090576171875, -0.2350921630859375, -0.22794342041015625, -0.220794677734375, -0.21364593505859375, -0.2064971923828125, -0.19934844970703125, -0.19219970703125, -0.18505096435546875, -0.1779022216796875, -0.17075347900390625, -0.163604736328125, -0.15645599365234375, -0.1493072509765625, -0.14215850830078125, -0.135009765625, -0.12786102294921875, -0.1207122802734375, -0.11356353759765625, -0.106414794921875, -0.09926605224609375, -0.0921173095703125, -0.08496856689453125, -0.07781982421875, -0.07067108154296875, -0.0635223388671875, -0.05637359619140625, -0.049224853515625, -0.04207611083984375, -0.0349273681640625, -0.02777862548828125, -0.0206298828125, -0.01348114013671875, -0.0063323974609375, 0.00081634521484375, 0.007965087890625, 0.01511383056640625, 0.0222625732421875, 0.02941131591796875, 0.03656005859375, 0.04370880126953125, 0.0508575439453125, 0.05800628662109375, 0.065155029296875, 0.07230377197265625, 0.0794525146484375, 0.08660125732421875, 0.09375, 0.10089874267578125, 0.1080474853515625, 0.11519622802734375, 0.122344970703125, 0.12949371337890625, 0.1366424560546875, 0.14379119873046875, 0.15093994140625, 0.15808868408203125, 0.1652374267578125, 0.17238616943359375, 0.179534912109375, 0.18668365478515625, 0.1938323974609375, 0.20098114013671875, 0.2081298828125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 2.0, 3.0, 6.0, 8.0, 7.0, 17.0, 16.0, 7.0, 22.0, 25.0, 20.0, 29.0, 44.0, 45.0, 62.0, 58.0, 78.0, 62.0, 67.0, 54.0, 50.0, 57.0, 37.0, 51.0, 36.0, 22.0, 38.0, 23.0, 16.0, 13.0, 10.0, 10.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2310791015625, -0.2233448028564453, -0.21561050415039062, -0.20787620544433594, -0.20014190673828125, -0.19240760803222656, -0.18467330932617188, -0.1769390106201172, -0.1692047119140625, -0.1614704132080078, -0.15373611450195312, -0.14600181579589844, -0.13826751708984375, -0.13053321838378906, -0.12279891967773438, -0.11506462097167969, -0.107330322265625, -0.09959602355957031, -0.09186172485351562, -0.08412742614746094, -0.07639312744140625, -0.06865882873535156, -0.060924530029296875, -0.05319023132324219, -0.0454559326171875, -0.03772163391113281, -0.029987335205078125, -0.022253036499023438, -0.01451873779296875, -0.0067844390869140625, 0.000949859619140625, 0.008684158325195312, 0.01641845703125, 0.024152755737304688, 0.031887054443359375, 0.03962135314941406, 0.04735565185546875, 0.05508995056152344, 0.06282424926757812, 0.07055854797363281, 0.0782928466796875, 0.08602714538574219, 0.09376144409179688, 0.10149574279785156, 0.10923004150390625, 0.11696434020996094, 0.12469863891601562, 0.1324329376220703, 0.140167236328125, 0.1479015350341797, 0.15563583374023438, 0.16337013244628906, 0.17110443115234375, 0.17883872985839844, 0.18657302856445312, 0.1943073272705078, 0.2020416259765625, 0.2097759246826172, 0.21751022338867188, 0.22524452209472656, 0.23297882080078125, 0.24071311950683594, 0.24844741821289062, 0.2561817169189453, 0.263916015625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 3.0, 5.0, 9.0, 17.0, 22.0, 47.0, 64.0, 96.0, 174.0, 340.0, 650.0, 1448.0, 3890.0, 13165.0, 81819.0, 820644.0, 103727.0, 15203.0, 4216.0, 1558.0, 648.0, 312.0, 176.0, 135.0, 60.0, 40.0, 28.0, 14.0, 12.0, 9.0, 3.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.11456298828125, -0.11114788055419922, -0.10773277282714844, -0.10431766510009766, -0.10090255737304688, -0.0974874496459961, -0.09407234191894531, -0.09065723419189453, -0.08724212646484375, -0.08382701873779297, -0.08041191101074219, -0.0769968032836914, -0.07358169555664062, -0.07016658782958984, -0.06675148010253906, -0.06333637237548828, -0.0599212646484375, -0.05650615692138672, -0.05309104919433594, -0.049675941467285156, -0.046260833740234375, -0.042845726013183594, -0.03943061828613281, -0.03601551055908203, -0.03260040283203125, -0.02918529510498047, -0.025770187377929688, -0.022355079650878906, -0.018939971923828125, -0.015524864196777344, -0.012109756469726562, -0.008694648742675781, -0.005279541015625, -0.0018644332885742188, 0.0015506744384765625, 0.004965782165527344, 0.008380889892578125, 0.011795997619628906, 0.015211105346679688, 0.01862621307373047, 0.02204132080078125, 0.02545642852783203, 0.028871536254882812, 0.032286643981933594, 0.035701751708984375, 0.039116859436035156, 0.04253196716308594, 0.04594707489013672, 0.0493621826171875, 0.05277729034423828, 0.05619239807128906, 0.059607505798339844, 0.06302261352539062, 0.0664377212524414, 0.06985282897949219, 0.07326793670654297, 0.07668304443359375, 0.08009815216064453, 0.08351325988769531, 0.0869283676147461, 0.09034347534179688, 0.09375858306884766, 0.09717369079589844, 0.10058879852294922, 0.10400390625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 5.0, 2.0, 5.0, 2.0, 7.0, 7.0, 14.0, 9.0, 18.0, 33.0, 34.0, 45.0, 80.0, 134.0, 145.0, 140.0, 100.0, 61.0, 35.0, 37.0, 20.0, 19.0, 10.0, 8.0, 10.0, 6.0, 7.0, 3.0, 9.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.334615707397461e-05, -5.212612450122833e-05, -5.0906091928482056e-05, -4.968605935573578e-05, -4.84660267829895e-05, -4.7245994210243225e-05, -4.602596163749695e-05, -4.480592906475067e-05, -4.3585896492004395e-05, -4.236586391925812e-05, -4.114583134651184e-05, -3.9925798773765564e-05, -3.870576620101929e-05, -3.748573362827301e-05, -3.6265701055526733e-05, -3.5045668482780457e-05, -3.382563591003418e-05, -3.26056033372879e-05, -3.1385570764541626e-05, -3.016553819179535e-05, -2.8945505619049072e-05, -2.7725473046302795e-05, -2.650544047355652e-05, -2.5285407900810242e-05, -2.4065375328063965e-05, -2.2845342755317688e-05, -2.162531018257141e-05, -2.0405277609825134e-05, -1.9185245037078857e-05, -1.796521246433258e-05, -1.6745179891586304e-05, -1.5525147318840027e-05, -1.430511474609375e-05, -1.3085082173347473e-05, -1.1865049600601196e-05, -1.064501702785492e-05, -9.424984455108643e-06, -8.204951882362366e-06, -6.984919309616089e-06, -5.764886736869812e-06, -4.544854164123535e-06, -3.3248215913772583e-06, -2.1047890186309814e-06, -8.847564458847046e-07, 3.3527612686157227e-07, 1.5553086996078491e-06, 2.775341272354126e-06, 3.995373845100403e-06, 5.21540641784668e-06, 6.4354389905929565e-06, 7.655471563339233e-06, 8.87550413608551e-06, 1.0095536708831787e-05, 1.1315569281578064e-05, 1.253560185432434e-05, 1.3755634427070618e-05, 1.4975666999816895e-05, 1.619569957256317e-05, 1.7415732145309448e-05, 1.8635764718055725e-05, 1.9855797290802002e-05, 2.107582986354828e-05, 2.2295862436294556e-05, 2.3515895009040833e-05, 2.473592758178711e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 4.0, 5.0, 2.0, 5.0, 4.0, 2.0, 11.0, 12.0, 14.0, 24.0, 36.0, 43.0, 45.0, 79.0, 174.0, 244.0, 467.0, 946.0, 2280.0, 7245.0, 39671.0, 702855.0, 265547.0, 20588.0, 4805.0, 1698.0, 789.0, 373.0, 189.0, 123.0, 88.0, 53.0, 34.0, 30.0, 19.0, 13.0, 11.0, 6.0, 9.0, 4.0, 6.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.12548828125, -0.12208175659179688, -0.11867523193359375, -0.11526870727539062, -0.1118621826171875, -0.10845565795898438, -0.10504913330078125, -0.10164260864257812, -0.098236083984375, -0.09482955932617188, -0.09142303466796875, -0.08801651000976562, -0.0846099853515625, -0.08120346069335938, -0.07779693603515625, -0.07439041137695312, -0.07098388671875, -0.06757736206054688, -0.06417083740234375, -0.060764312744140625, -0.0573577880859375, -0.053951263427734375, -0.05054473876953125, -0.047138214111328125, -0.043731689453125, -0.040325164794921875, -0.03691864013671875, -0.033512115478515625, -0.0301055908203125, -0.026699066162109375, -0.02329254150390625, -0.019886016845703125, -0.0164794921875, -0.013072967529296875, -0.00966644287109375, -0.006259918212890625, -0.0028533935546875, 0.000553131103515625, 0.00395965576171875, 0.007366180419921875, 0.010772705078125, 0.014179229736328125, 0.01758575439453125, 0.020992279052734375, 0.0243988037109375, 0.027805328369140625, 0.03121185302734375, 0.034618377685546875, 0.03802490234375, 0.041431427001953125, 0.04483795166015625, 0.048244476318359375, 0.0516510009765625, 0.055057525634765625, 0.05846405029296875, 0.061870574951171875, 0.065277099609375, 0.06868362426757812, 0.07209014892578125, 0.07549667358398438, 0.0789031982421875, 0.08230972290039062, 0.08571624755859375, 0.08912277221679688, 0.092529296875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 2.0, 6.0, 7.0, 6.0, 11.0, 8.0, 10.0, 13.0, 26.0, 34.0, 36.0, 56.0, 73.0, 77.0, 91.0, 96.0, 89.0, 86.0, 71.0, 53.0, 20.0, 28.0, 22.0, 12.0, 15.0, 9.0, 5.0, 11.0, 2.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.07025146484375, -0.06768798828125, -0.06512451171875, -0.06256103515625, -0.05999755859375, -0.05743408203125, -0.05487060546875, -0.05230712890625, -0.04974365234375, -0.04718017578125, -0.04461669921875, -0.04205322265625, -0.03948974609375, -0.03692626953125, -0.03436279296875, -0.03179931640625, -0.02923583984375, -0.02667236328125, -0.02410888671875, -0.02154541015625, -0.01898193359375, -0.01641845703125, -0.01385498046875, -0.01129150390625, -0.00872802734375, -0.00616455078125, -0.00360107421875, -0.00103759765625, 0.00152587890625, 0.00408935546875, 0.00665283203125, 0.00921630859375, 0.01177978515625, 0.01434326171875, 0.01690673828125, 0.01947021484375, 0.02203369140625, 0.02459716796875, 0.02716064453125, 0.02972412109375, 0.03228759765625, 0.03485107421875, 0.03741455078125, 0.03997802734375, 0.04254150390625, 0.04510498046875, 0.04766845703125, 0.05023193359375, 0.05279541015625, 0.05535888671875, 0.05792236328125, 0.06048583984375, 0.06304931640625, 0.06561279296875, 0.06817626953125, 0.07073974609375, 0.07330322265625, 0.07586669921875, 0.07843017578125, 0.08099365234375, 0.08355712890625, 0.08612060546875, 0.08868408203125, 0.09124755859375, 0.09381103515625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 19.0, 76.0, 279.0, 420.0, 147.0, 37.0, 7.0, 6.0, 3.0, 2.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.326026201248169, -3.212735891342163, -3.0994455814361572, -2.9861555099487305, -2.8728652000427246, -2.7595748901367188, -2.646284580230713, -2.532994270324707, -2.419703960418701, -2.3064136505126953, -2.1931233406066895, -2.0798330307006836, -1.9665428400039673, -1.853252649307251, -1.7399623394012451, -1.6266720294952393, -1.513381838798523, -1.400091528892517, -1.2868013381958008, -1.173511028289795, -1.060220718383789, -0.946930468082428, -0.8336402177810669, -0.720349907875061, -0.6070596575737, -0.4937693774700165, -0.380479097366333, -0.2671888470649719, -0.15389856696128845, -0.04060828685760498, 0.0726819634437561, 0.18597227334976196, 0.29926252365112305, 0.4125528037548065, 0.52584308385849, 0.6391333341598511, 0.7524236440658569, 0.865713894367218, 0.9790041446685791, 1.092294454574585, 1.2055847644805908, 1.3188750743865967, 1.432165265083313, 1.5454555749893188, 1.6587458848953247, 1.772036075592041, 1.8853263854980469, 1.9986166954040527, 2.1119070053100586, 2.2251973152160645, 2.3384876251220703, 2.451777935028076, 2.565068006515503, 2.678358316421509, 2.7916486263275146, 2.9049389362335205, 3.0182290077209473, 3.131519317626953, 3.244809627532959, 3.358099937438965, 3.4713900089263916, 3.5846803188323975, 3.6979706287384033, 3.811260938644409, 3.924551248550415]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 6.0, 6.0, 8.0, 22.0, 20.0, 25.0, 41.0, 45.0, 45.0, 58.0, 62.0, 72.0, 86.0, 92.0, 82.0, 60.0, 74.0, 51.0, 37.0, 23.0, 29.0, 19.0, 8.0, 12.0, 9.0, 4.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.7596783638000488, -1.7197473049163818, -1.6798162460327148, -1.6398853063583374, -1.5999542474746704, -1.5600231885910034, -1.520092248916626, -1.480161190032959, -1.440230131149292, -1.400299072265625, -1.360368013381958, -1.3204370737075806, -1.2805060148239136, -1.2405749559402466, -1.2006440162658691, -1.1607129573822021, -1.1207818984985352, -1.0808508396148682, -1.0409197807312012, -1.0009888410568237, -0.9610577821731567, -0.9211267232894897, -0.8811957240104675, -0.8412647247314453, -0.8013336658477783, -0.7614026069641113, -0.7214716076850891, -0.6815406084060669, -0.6416095495223999, -0.6016784906387329, -0.5617474913597107, -0.5218164920806885, -0.4818854331970215, -0.4419544041156769, -0.4020233750343323, -0.36209234595298767, -0.32216131687164307, -0.28223028779029846, -0.24229925870895386, -0.20236822962760925, -0.16243720054626465, -0.12250617146492004, -0.08257514238357544, -0.042644113302230835, -0.0027130842208862305, 0.037217944860458374, 0.07714897394180298, 0.11708000302314758, 0.1570110321044922, 0.1969420611858368, 0.2368730902671814, 0.276804119348526, 0.3167351484298706, 0.3566661775112152, 0.3965972065925598, 0.4365282356739044, 0.476459264755249, 0.516390323638916, 0.5563213229179382, 0.5962523221969604, 0.6361833810806274, 0.6761144399642944, 0.7160454392433167, 0.7559764385223389, 0.7959074974060059]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 6.0, 9.0, 5.0, 3.0, 15.0, 14.0, 21.0, 18.0, 23.0, 45.0, 70.0, 112.0, 191.0, 375.0, 747.0, 1634.0, 4933.0, 21573.0, 368006.0, 3702071.0, 78213.0, 10886.0, 3121.0, 1087.0, 480.0, 251.0, 133.0, 71.0, 50.0, 31.0, 13.0, 13.0, 15.0, 6.0, 13.0, 9.0, 6.0, 4.0, 2.0, 0.0, 4.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1695556640625, -0.1635608673095703, -0.15756607055664062, -0.15157127380371094, -0.14557647705078125, -0.13958168029785156, -0.13358688354492188, -0.1275920867919922, -0.1215972900390625, -0.11560249328613281, -0.10960769653320312, -0.10361289978027344, -0.09761810302734375, -0.09162330627441406, -0.08562850952148438, -0.07963371276855469, -0.073638916015625, -0.06764411926269531, -0.061649322509765625, -0.05565452575683594, -0.04965972900390625, -0.04366493225097656, -0.037670135498046875, -0.03167533874511719, -0.0256805419921875, -0.019685745239257812, -0.013690948486328125, -0.0076961517333984375, -0.00170135498046875, 0.0042934417724609375, 0.010288238525390625, 0.016283035278320312, 0.02227783203125, 0.028272628784179688, 0.034267425537109375, 0.04026222229003906, 0.04625701904296875, 0.05225181579589844, 0.058246612548828125, 0.06424140930175781, 0.0702362060546875, 0.07623100280761719, 0.08222579956054688, 0.08822059631347656, 0.09421539306640625, 0.10021018981933594, 0.10620498657226562, 0.11219978332519531, 0.118194580078125, 0.12418937683105469, 0.13018417358398438, 0.13617897033691406, 0.14217376708984375, 0.14816856384277344, 0.15416336059570312, 0.1601581573486328, 0.1661529541015625, 0.1721477508544922, 0.17814254760742188, 0.18413734436035156, 0.19013214111328125, 0.19612693786621094, 0.20212173461914062, 0.2081165313720703, 0.214111328125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 8.0, 14.0, 24.0, 27.0, 28.0, 49.0, 53.0, 59.0, 73.0, 67.0, 75.0, 68.0, 84.0, 80.0, 74.0, 56.0, 31.0, 31.0, 40.0, 26.0, 11.0, 10.0, 4.0, 10.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09393310546875, -0.09165096282958984, -0.08936882019042969, -0.08708667755126953, -0.08480453491210938, -0.08252239227294922, -0.08024024963378906, -0.0779581069946289, -0.07567596435546875, -0.0733938217163086, -0.07111167907714844, -0.06882953643798828, -0.06654739379882812, -0.06426525115966797, -0.06198310852050781, -0.059700965881347656, -0.0574188232421875, -0.055136680603027344, -0.05285453796386719, -0.05057239532470703, -0.048290252685546875, -0.04600811004638672, -0.04372596740722656, -0.041443824768066406, -0.03916168212890625, -0.036879539489746094, -0.03459739685058594, -0.03231525421142578, -0.030033111572265625, -0.02775096893310547, -0.025468826293945312, -0.023186683654785156, -0.020904541015625, -0.018622398376464844, -0.016340255737304688, -0.014058113098144531, -0.011775970458984375, -0.009493827819824219, -0.0072116851806640625, -0.004929542541503906, -0.00264739990234375, -0.00036525726318359375, 0.0019168853759765625, 0.004199028015136719, 0.006481170654296875, 0.008763313293457031, 0.011045455932617188, 0.013327598571777344, 0.0156097412109375, 0.017891883850097656, 0.020174026489257812, 0.02245616912841797, 0.024738311767578125, 0.02702045440673828, 0.029302597045898438, 0.031584739685058594, 0.03386688232421875, 0.036149024963378906, 0.03843116760253906, 0.04071331024169922, 0.042995452880859375, 0.04527759552001953, 0.04755973815917969, 0.049841880798339844, 0.0521240234375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 7.0, 10.0, 21.0, 23.0, 33.0, 56.0, 96.0, 159.0, 293.0, 604.0, 1361.0, 3579.0, 11957.0, 50433.0, 444832.0, 3413794.0, 216734.0, 35075.0, 9344.0, 3152.0, 1268.0, 615.0, 318.0, 185.0, 124.0, 64.0, 48.0, 30.0, 29.0, 15.0, 7.0, 7.0, 2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.173095703125, -0.1683368682861328, -0.16357803344726562, -0.15881919860839844, -0.15406036376953125, -0.14930152893066406, -0.14454269409179688, -0.1397838592529297, -0.1350250244140625, -0.1302661895751953, -0.12550735473632812, -0.12074851989746094, -0.11598968505859375, -0.11123085021972656, -0.10647201538085938, -0.10171318054199219, -0.096954345703125, -0.09219551086425781, -0.08743667602539062, -0.08267784118652344, -0.07791900634765625, -0.07316017150878906, -0.06840133666992188, -0.06364250183105469, -0.0588836669921875, -0.05412483215332031, -0.049365997314453125, -0.04460716247558594, -0.03984832763671875, -0.03508949279785156, -0.030330657958984375, -0.025571823120117188, -0.02081298828125, -0.016054153442382812, -0.011295318603515625, -0.0065364837646484375, -0.00177764892578125, 0.0029811859130859375, 0.007740020751953125, 0.012498855590820312, 0.0172576904296875, 0.022016525268554688, 0.026775360107421875, 0.03153419494628906, 0.03629302978515625, 0.04105186462402344, 0.045810699462890625, 0.05056953430175781, 0.055328369140625, 0.06008720397949219, 0.06484603881835938, 0.06960487365722656, 0.07436370849609375, 0.07912254333496094, 0.08388137817382812, 0.08864021301269531, 0.0933990478515625, 0.09815788269042969, 0.10291671752929688, 0.10767555236816406, 0.11243438720703125, 0.11719322204589844, 0.12195205688476562, 0.1267108917236328, 0.1314697265625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 6.0, 2.0, 1.0, 4.0, 6.0, 4.0, 8.0, 10.0, 13.0, 12.0, 22.0, 32.0, 43.0, 68.0, 93.0, 163.0, 319.0, 581.0, 996.0, 726.0, 375.0, 204.0, 111.0, 76.0, 51.0, 28.0, 30.0, 22.0, 21.0, 11.0, 7.0, 15.0, 6.0, 5.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08795166015625, -0.08370304107666016, -0.07945442199707031, -0.07520580291748047, -0.07095718383789062, -0.06670856475830078, -0.06245994567871094, -0.058211326599121094, -0.05396270751953125, -0.049714088439941406, -0.04546546936035156, -0.04121685028076172, -0.036968231201171875, -0.03271961212158203, -0.028470993041992188, -0.024222373962402344, -0.0199737548828125, -0.015725135803222656, -0.011476516723632812, -0.007227897644042969, -0.002979278564453125, 0.0012693405151367188, 0.0055179595947265625, 0.009766578674316406, 0.01401519775390625, 0.018263816833496094, 0.022512435913085938, 0.02676105499267578, 0.031009674072265625, 0.03525829315185547, 0.03950691223144531, 0.043755531311035156, 0.048004150390625, 0.052252769470214844, 0.05650138854980469, 0.06075000762939453, 0.06499862670898438, 0.06924724578857422, 0.07349586486816406, 0.0777444839477539, 0.08199310302734375, 0.0862417221069336, 0.09049034118652344, 0.09473896026611328, 0.09898757934570312, 0.10323619842529297, 0.10748481750488281, 0.11173343658447266, 0.1159820556640625, 0.12023067474365234, 0.12447929382324219, 0.12872791290283203, 0.13297653198242188, 0.13722515106201172, 0.14147377014160156, 0.1457223892211914, 0.14997100830078125, 0.1542196273803711, 0.15846824645996094, 0.16271686553955078, 0.16696548461914062, 0.17121410369873047, 0.1754627227783203, 0.17971134185791016, 0.1839599609375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 5.0, 19.0, 32.0, 67.0, 177.0, 249.0, 218.0, 111.0, 48.0, 32.0, 17.0, 5.0, 9.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.702487051486969, -0.6507090926170349, -0.598931074142456, -0.547153115272522, -0.4953750967979431, -0.44359713792800903, -0.39181914925575256, -0.3400411605834961, -0.2882631719112396, -0.23648518323898315, -0.18470719456672668, -0.1329292207956314, -0.08115123212337494, -0.029373258352279663, 0.022404730319976807, 0.07418271899223328, 0.12596070766448975, 0.17773869633674622, 0.22951668500900269, 0.28129464387893677, 0.3330726623535156, 0.3848506212234497, 0.4366286098957062, 0.48840659856796265, 0.5401846170425415, 0.5919625759124756, 0.6437405943870544, 0.6955185532569885, 0.7472965717315674, 0.7990745306015015, 0.8508524894714355, 0.9026305079460144, 0.9544085264205933, 1.0061864852905273, 1.0579644441604614, 1.109742522239685, 1.1615204811096191, 1.2132984399795532, 1.2650763988494873, 1.316854476928711, 1.368632435798645, 1.420410394668579, 1.4721883535385132, 1.5239664316177368, 1.575744390487671, 1.627522349357605, 1.679300308227539, 1.7310783863067627, 1.7828562259674072, 1.8346341848373413, 1.8864121437072754, 1.938190221786499, 1.989968180656433, 2.041746139526367, 2.093524217605591, 2.1453020572662354, 2.197080135345459, 2.2488582134246826, 2.300636053085327, 2.352414131164551, 2.4041919708251953, 2.455970048904419, 2.5077481269836426, 2.559525966644287, 2.6113040447235107]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 2.0, 3.0, 5.0, 9.0, 9.0, 8.0, 9.0, 12.0, 17.0, 21.0, 23.0, 26.0, 29.0, 40.0, 33.0, 27.0, 47.0, 47.0, 42.0, 40.0, 50.0, 52.0, 42.0, 34.0, 38.0, 43.0, 37.0, 34.0, 31.0, 28.0, 26.0, 24.0, 16.0, 11.0, 17.0, 10.0, 10.0, 15.0, 13.0, 11.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5210294723510742, -0.5037463307380676, -0.48646318912506104, -0.46918004751205444, -0.45189690589904785, -0.43461376428604126, -0.41733065247535706, -0.40004751086235046, -0.38276436924934387, -0.3654812276363373, -0.3481980860233307, -0.3309149444103241, -0.3136318325996399, -0.2963486909866333, -0.2790655493736267, -0.2617824077606201, -0.24449926614761353, -0.22721612453460693, -0.20993298292160034, -0.19264985620975494, -0.17536671459674835, -0.15808357298374176, -0.14080044627189636, -0.12351730465888977, -0.10623416304588318, -0.08895102143287659, -0.07166788727045059, -0.0543847493827343, -0.037101611495018005, -0.019818469882011414, -0.0025353357195854187, 0.014747798442840576, 0.03203094005584717, 0.04931407794356346, 0.06659721583127975, 0.08388034999370575, 0.10116349160671234, 0.11844663321971893, 0.13572975993156433, 0.15301290154457092, 0.17029604315757751, 0.1875791847705841, 0.2048623263835907, 0.2221454530954361, 0.2394285947084427, 0.2567117214202881, 0.2739948630332947, 0.29127800464630127, 0.30856114625930786, 0.32584428787231445, 0.34312742948532104, 0.36041057109832764, 0.37769371271133423, 0.3949768543243408, 0.412259966135025, 0.4295431077480316, 0.4468262493610382, 0.4641093909740448, 0.4813925325870514, 0.498675674200058, 0.5159587860107422, 0.5332419276237488, 0.5505250692367554, 0.567808210849762, 0.5850913524627686]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 8.0, 6.0, 9.0, 13.0, 19.0, 34.0, 39.0, 57.0, 83.0, 130.0, 194.0, 288.0, 474.0, 758.0, 1418.0, 2457.0, 4791.0, 9855.0, 22748.0, 62084.0, 225608.0, 474771.0, 159532.0, 47371.0, 18277.0, 8219.0, 4033.0, 2201.0, 1233.0, 679.0, 391.0, 268.0, 142.0, 104.0, 75.0, 47.0, 50.0, 28.0, 19.0, 13.0, 9.0, 5.0, 4.0, 3.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.11395263671875, -0.11053848266601562, -0.10712432861328125, -0.10371017456054688, -0.1002960205078125, -0.09688186645507812, -0.09346771240234375, -0.09005355834960938, -0.086639404296875, -0.08322525024414062, -0.07981109619140625, -0.07639694213867188, -0.0729827880859375, -0.06956863403320312, -0.06615447998046875, -0.06274032592773438, -0.059326171875, -0.055912017822265625, -0.05249786376953125, -0.049083709716796875, -0.0456695556640625, -0.042255401611328125, -0.03884124755859375, -0.035427093505859375, -0.032012939453125, -0.028598785400390625, -0.02518463134765625, -0.021770477294921875, -0.0183563232421875, -0.014942169189453125, -0.01152801513671875, -0.008113861083984375, -0.00469970703125, -0.001285552978515625, 0.00212860107421875, 0.005542755126953125, 0.0089569091796875, 0.012371063232421875, 0.01578521728515625, 0.019199371337890625, 0.022613525390625, 0.026027679443359375, 0.02944183349609375, 0.032855987548828125, 0.0362701416015625, 0.039684295654296875, 0.04309844970703125, 0.046512603759765625, 0.0499267578125, 0.053340911865234375, 0.05675506591796875, 0.060169219970703125, 0.0635833740234375, 0.06699752807617188, 0.07041168212890625, 0.07382583618164062, 0.077239990234375, 0.08065414428710938, 0.08406829833984375, 0.08748245239257812, 0.0908966064453125, 0.09431076049804688, 0.09772491455078125, 0.10113906860351562, 0.10455322265625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 4.0, 6.0, 9.0, 8.0, 9.0, 15.0, 19.0, 15.0, 28.0, 35.0, 29.0, 39.0, 37.0, 38.0, 36.0, 45.0, 59.0, 52.0, 58.0, 48.0, 55.0, 45.0, 32.0, 42.0, 44.0, 35.0, 39.0, 37.0, 23.0, 15.0, 12.0, 4.0, 4.0, 7.0, 9.0, 3.0, 2.0, 5.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.058685302734375, -0.057065486907958984, -0.05544567108154297, -0.05382585525512695, -0.05220603942871094, -0.05058622360229492, -0.048966407775878906, -0.04734659194946289, -0.045726776123046875, -0.04410696029663086, -0.042487144470214844, -0.04086732864379883, -0.03924751281738281, -0.0376276969909668, -0.03600788116455078, -0.034388065338134766, -0.03276824951171875, -0.031148433685302734, -0.02952861785888672, -0.027908802032470703, -0.026288986206054688, -0.024669170379638672, -0.023049354553222656, -0.02142953872680664, -0.019809722900390625, -0.01818990707397461, -0.016570091247558594, -0.014950275421142578, -0.013330459594726562, -0.011710643768310547, -0.010090827941894531, -0.008471012115478516, -0.0068511962890625, -0.005231380462646484, -0.0036115646362304688, -0.001991748809814453, -0.0003719329833984375, 0.0012478828430175781, 0.0028676986694335938, 0.004487514495849609, 0.006107330322265625, 0.007727146148681641, 0.009346961975097656, 0.010966777801513672, 0.012586593627929688, 0.014206409454345703, 0.01582622528076172, 0.017446041107177734, 0.01906585693359375, 0.020685672760009766, 0.02230548858642578, 0.023925304412841797, 0.025545120239257812, 0.027164936065673828, 0.028784751892089844, 0.03040456771850586, 0.032024383544921875, 0.03364419937133789, 0.035264015197753906, 0.03688383102416992, 0.03850364685058594, 0.04012346267700195, 0.04174327850341797, 0.043363094329833984, 0.04498291015625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 1.0, 1.0, 9.0, 8.0, 13.0, 9.0, 11.0, 28.0, 36.0, 69.0, 102.0, 170.0, 310.0, 620.0, 1480.0, 4276.0, 19362.0, 174885.0, 773766.0, 59410.0, 9295.0, 2609.0, 1025.0, 451.0, 252.0, 128.0, 70.0, 48.0, 36.0, 23.0, 16.0, 15.0, 6.0, 6.0, 7.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2423095703125, -0.2348041534423828, -0.22729873657226562, -0.21979331970214844, -0.21228790283203125, -0.20478248596191406, -0.19727706909179688, -0.1897716522216797, -0.1822662353515625, -0.1747608184814453, -0.16725540161132812, -0.15974998474121094, -0.15224456787109375, -0.14473915100097656, -0.13723373413085938, -0.1297283172607422, -0.122222900390625, -0.11471748352050781, -0.10721206665039062, -0.09970664978027344, -0.09220123291015625, -0.08469581604003906, -0.07719039916992188, -0.06968498229980469, -0.0621795654296875, -0.05467414855957031, -0.047168731689453125, -0.03966331481933594, -0.03215789794921875, -0.024652481079101562, -0.017147064208984375, -0.009641647338867188, -0.00213623046875, 0.0053691864013671875, 0.012874603271484375, 0.020380020141601562, 0.02788543701171875, 0.03539085388183594, 0.042896270751953125, 0.05040168762207031, 0.0579071044921875, 0.06541252136230469, 0.07291793823242188, 0.08042335510253906, 0.08792877197265625, 0.09543418884277344, 0.10293960571289062, 0.11044502258300781, 0.117950439453125, 0.1254558563232422, 0.13296127319335938, 0.14046669006347656, 0.14797210693359375, 0.15547752380371094, 0.16298294067382812, 0.1704883575439453, 0.1779937744140625, 0.1854991912841797, 0.19300460815429688, 0.20051002502441406, 0.20801544189453125, 0.21552085876464844, 0.22302627563476562, 0.2305316925048828, 0.238037109375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 3.0, 6.0, 5.0, 4.0, 9.0, 10.0, 14.0, 14.0, 23.0, 22.0, 29.0, 34.0, 36.0, 48.0, 42.0, 40.0, 44.0, 44.0, 59.0, 54.0, 55.0, 56.0, 52.0, 48.0, 36.0, 36.0, 35.0, 18.0, 21.0, 18.0, 18.0, 13.0, 10.0, 7.0, 8.0, 7.0, 5.0, 8.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.2470703125, -0.2401905059814453, -0.23331069946289062, -0.22643089294433594, -0.21955108642578125, -0.21267127990722656, -0.20579147338867188, -0.1989116668701172, -0.1920318603515625, -0.1851520538330078, -0.17827224731445312, -0.17139244079589844, -0.16451263427734375, -0.15763282775878906, -0.15075302124023438, -0.1438732147216797, -0.136993408203125, -0.1301136016845703, -0.12323379516601562, -0.11635398864746094, -0.10947418212890625, -0.10259437561035156, -0.09571456909179688, -0.08883476257324219, -0.0819549560546875, -0.07507514953613281, -0.06819534301757812, -0.06131553649902344, -0.05443572998046875, -0.04755592346191406, -0.040676116943359375, -0.03379631042480469, -0.02691650390625, -0.020036697387695312, -0.013156890869140625, -0.0062770843505859375, 0.00060272216796875, 0.0074825286865234375, 0.014362335205078125, 0.021242141723632812, 0.0281219482421875, 0.03500175476074219, 0.041881561279296875, 0.04876136779785156, 0.05564117431640625, 0.06252098083496094, 0.06940078735351562, 0.07628059387207031, 0.083160400390625, 0.09004020690917969, 0.09692001342773438, 0.10379981994628906, 0.11067962646484375, 0.11755943298339844, 0.12443923950195312, 0.1313190460205078, 0.1381988525390625, 0.1450786590576172, 0.15195846557617188, 0.15883827209472656, 0.16571807861328125, 0.17259788513183594, 0.17947769165039062, 0.1863574981689453, 0.1932373046875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 12.0, 13.0, 18.0, 23.0, 38.0, 65.0, 88.0, 174.0, 401.0, 919.0, 2859.0, 12238.0, 95501.0, 780448.0, 135027.0, 15459.0, 3290.0, 1023.0, 470.0, 203.0, 109.0, 66.0, 35.0, 19.0, 14.0, 10.0, 8.0, 1.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1107177734375, -0.10709571838378906, -0.10347366333007812, -0.09985160827636719, -0.09622955322265625, -0.09260749816894531, -0.08898544311523438, -0.08536338806152344, -0.0817413330078125, -0.07811927795410156, -0.07449722290039062, -0.07087516784667969, -0.06725311279296875, -0.06363105773925781, -0.060009002685546875, -0.05638694763183594, -0.052764892578125, -0.04914283752441406, -0.045520782470703125, -0.04189872741699219, -0.03827667236328125, -0.03465461730957031, -0.031032562255859375, -0.027410507202148438, -0.0237884521484375, -0.020166397094726562, -0.016544342041015625, -0.012922286987304688, -0.00930023193359375, -0.0056781768798828125, -0.002056121826171875, 0.0015659332275390625, 0.00518798828125, 0.008810043334960938, 0.012432098388671875, 0.016054153442382812, 0.01967620849609375, 0.023298263549804688, 0.026920318603515625, 0.030542373657226562, 0.0341644287109375, 0.03778648376464844, 0.041408538818359375, 0.04503059387207031, 0.04865264892578125, 0.05227470397949219, 0.055896759033203125, 0.05951881408691406, 0.063140869140625, 0.06676292419433594, 0.07038497924804688, 0.07400703430175781, 0.07762908935546875, 0.08125114440917969, 0.08487319946289062, 0.08849525451660156, 0.0921173095703125, 0.09573936462402344, 0.09936141967773438, 0.10298347473144531, 0.10660552978515625, 0.11022758483886719, 0.11384963989257812, 0.11747169494628906, 0.12109375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 1.0, 0.0, 4.0, 4.0, 4.0, 4.0, 3.0, 7.0, 14.0, 13.0, 24.0, 24.0, 36.0, 48.0, 62.0, 72.0, 83.0, 98.0, 100.0, 85.0, 77.0, 66.0, 44.0, 34.0, 18.0, 18.0, 12.0, 7.0, 13.0, 3.0, 6.0, 5.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.331899642944336e-05, -3.248453140258789e-05, -3.165006637573242e-05, -3.081560134887695e-05, -2.9981136322021484e-05, -2.9146671295166016e-05, -2.8312206268310547e-05, -2.7477741241455078e-05, -2.664327621459961e-05, -2.580881118774414e-05, -2.4974346160888672e-05, -2.4139881134033203e-05, -2.3305416107177734e-05, -2.2470951080322266e-05, -2.1636486053466797e-05, -2.0802021026611328e-05, -1.996755599975586e-05, -1.913309097290039e-05, -1.8298625946044922e-05, -1.7464160919189453e-05, -1.6629695892333984e-05, -1.5795230865478516e-05, -1.4960765838623047e-05, -1.4126300811767578e-05, -1.329183578491211e-05, -1.245737075805664e-05, -1.1622905731201172e-05, -1.0788440704345703e-05, -9.953975677490234e-06, -9.119510650634766e-06, -8.285045623779297e-06, -7.450580596923828e-06, -6.616115570068359e-06, -5.781650543212891e-06, -4.947185516357422e-06, -4.112720489501953e-06, -3.2782554626464844e-06, -2.4437904357910156e-06, -1.6093254089355469e-06, -7.748603820800781e-07, 5.960464477539063e-08, 8.940696716308594e-07, 1.7285346984863281e-06, 2.562999725341797e-06, 3.3974647521972656e-06, 4.231929779052734e-06, 5.066394805908203e-06, 5.900859832763672e-06, 6.735324859619141e-06, 7.569789886474609e-06, 8.404254913330078e-06, 9.238719940185547e-06, 1.0073184967041016e-05, 1.0907649993896484e-05, 1.1742115020751953e-05, 1.2576580047607422e-05, 1.341104507446289e-05, 1.424551010131836e-05, 1.5079975128173828e-05, 1.5914440155029297e-05, 1.6748905181884766e-05, 1.7583370208740234e-05, 1.8417835235595703e-05, 1.9252300262451172e-05, 2.008676528930664e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 6.0, 10.0, 20.0, 33.0, 43.0, 84.0, 175.0, 437.0, 1224.0, 4923.0, 41140.0, 817080.0, 168954.0, 11153.0, 2070.0, 627.0, 277.0, 117.0, 54.0, 67.0, 23.0, 14.0, 11.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09228515625, -0.08783149719238281, -0.08337783813476562, -0.07892417907714844, -0.07447052001953125, -0.07001686096191406, -0.06556320190429688, -0.06110954284667969, -0.0566558837890625, -0.05220222473144531, -0.047748565673828125, -0.04329490661621094, -0.03884124755859375, -0.03438758850097656, -0.029933929443359375, -0.025480270385742188, -0.021026611328125, -0.016572952270507812, -0.012119293212890625, -0.0076656341552734375, -0.00321197509765625, 0.0012416839599609375, 0.005695343017578125, 0.010149002075195312, 0.0146026611328125, 0.019056320190429688, 0.023509979248046875, 0.027963638305664062, 0.03241729736328125, 0.03687095642089844, 0.041324615478515625, 0.04577827453613281, 0.05023193359375, 0.05468559265136719, 0.059139251708984375, 0.06359291076660156, 0.06804656982421875, 0.07250022888183594, 0.07695388793945312, 0.08140754699707031, 0.0858612060546875, 0.09031486511230469, 0.09476852416992188, 0.09922218322753906, 0.10367584228515625, 0.10812950134277344, 0.11258316040039062, 0.11703681945800781, 0.121490478515625, 0.1259441375732422, 0.13039779663085938, 0.13485145568847656, 0.13930511474609375, 0.14375877380371094, 0.14821243286132812, 0.1526660919189453, 0.1571197509765625, 0.1615734100341797, 0.16602706909179688, 0.17048072814941406, 0.17493438720703125, 0.17938804626464844, 0.18384170532226562, 0.1882953643798828, 0.1927490234375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 1.0, 3.0, 8.0, 0.0, 3.0, 4.0, 7.0, 13.0, 9.0, 14.0, 11.0, 24.0, 16.0, 22.0, 32.0, 46.0, 34.0, 63.0, 62.0, 81.0, 71.0, 70.0, 59.0, 60.0, 38.0, 44.0, 37.0, 34.0, 24.0, 22.0, 15.0, 10.0, 12.0, 7.0, 14.0, 4.0, 9.0, 1.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.07110595703125, -0.06917905807495117, -0.06725215911865234, -0.06532526016235352, -0.06339836120605469, -0.06147146224975586, -0.05954456329345703, -0.0576176643371582, -0.055690765380859375, -0.05376386642456055, -0.05183696746826172, -0.04991006851196289, -0.04798316955566406, -0.046056270599365234, -0.044129371643066406, -0.04220247268676758, -0.04027557373046875, -0.03834867477416992, -0.036421775817871094, -0.034494876861572266, -0.03256797790527344, -0.03064107894897461, -0.02871417999267578, -0.026787281036376953, -0.024860382080078125, -0.022933483123779297, -0.02100658416748047, -0.01907968521118164, -0.017152786254882812, -0.015225887298583984, -0.013298988342285156, -0.011372089385986328, -0.0094451904296875, -0.007518291473388672, -0.005591392517089844, -0.0036644935607910156, -0.0017375946044921875, 0.00018930435180664062, 0.0021162033081054688, 0.004043102264404297, 0.005970001220703125, 0.007896900177001953, 0.009823799133300781, 0.01175069808959961, 0.013677597045898438, 0.015604496002197266, 0.017531394958496094, 0.019458293914794922, 0.02138519287109375, 0.023312091827392578, 0.025238990783691406, 0.027165889739990234, 0.029092788696289062, 0.03101968765258789, 0.03294658660888672, 0.03487348556518555, 0.036800384521484375, 0.0387272834777832, 0.04065418243408203, 0.04258108139038086, 0.04450798034667969, 0.046434879302978516, 0.048361778259277344, 0.05028867721557617, 0.052215576171875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 13.0, 30.0, 76.0, 144.0, 259.0, 234.0, 119.0, 57.0, 30.0, 13.0, 7.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.2298762798309326, -2.172567367553711, -2.1152584552764893, -2.0579495429992676, -2.000640630722046, -1.9433315992355347, -1.886022686958313, -1.8287137746810913, -1.7714048624038696, -1.714095950126648, -1.6567870378494263, -1.599478006362915, -1.5421690940856934, -1.4848601818084717, -1.42755126953125, -1.3702423572540283, -1.3129334449768066, -1.255624532699585, -1.1983156204223633, -1.1410067081451416, -1.0836976766586304, -1.0263887643814087, -0.969079852104187, -0.9117709398269653, -0.8544619083404541, -0.7971529960632324, -0.739844024181366, -0.6825351119041443, -0.6252261996269226, -0.5679172277450562, -0.5106083154678345, -0.4532994031906128, -0.3959904909133911, -0.33868154883384705, -0.28137263655662537, -0.2240636944770813, -0.16675476729869843, -0.10944584012031555, -0.052136898040771484, 0.005172014236450195, 0.06248095631599426, 0.11978988349437714, 0.17709881067276, 0.23440775275230408, 0.29171669483184814, 0.3490256071090698, 0.4063345491886139, 0.46364346146583557, 0.5209524035453796, 0.5782613158226013, 0.6355702877044678, 0.6928791999816895, 0.7501881122589111, 0.8074970245361328, 0.8648059964179993, 0.922114908695221, 0.9794238805770874, 1.036732792854309, 1.0940417051315308, 1.151350736618042, 1.2086596488952637, 1.2659685611724854, 1.323277473449707, 1.3805863857269287, 1.4378952980041504]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 0.0, 7.0, 9.0, 8.0, 5.0, 12.0, 12.0, 12.0, 12.0, 17.0, 20.0, 21.0, 17.0, 35.0, 25.0, 41.0, 36.0, 44.0, 46.0, 49.0, 62.0, 51.0, 45.0, 48.0, 44.0, 46.0, 35.0, 32.0, 29.0, 34.0, 27.0, 24.0, 20.0, 15.0, 11.0, 4.0, 11.0, 11.0, 4.0, 9.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7336015105247498, -0.7075657248497009, -0.6815299391746521, -0.6554941534996033, -0.6294583082199097, -0.6034225225448608, -0.577386736869812, -0.5513509511947632, -0.5253151655197144, -0.4992793798446655, -0.4732435941696167, -0.4472077786922455, -0.42117199301719666, -0.3951362073421478, -0.3691003918647766, -0.3430646061897278, -0.31702882051467896, -0.2909930348396301, -0.2649572491645813, -0.23892143368721008, -0.21288564801216125, -0.18684986233711243, -0.1608140617609024, -0.13477826118469238, -0.10874247550964355, -0.08270668238401413, -0.056670889258384705, -0.03063509613275528, -0.0045993030071258545, 0.021436482667922974, 0.047472283244132996, 0.07350808382034302, 0.09954386949539185, 0.12557965517044067, 0.1516154557466507, 0.17765125632286072, 0.20368704199790955, 0.22972282767295837, 0.2557586431503296, 0.2817944288253784, 0.30783021450042725, 0.3338660001754761, 0.3599017858505249, 0.3859376013278961, 0.41197338700294495, 0.4380091726779938, 0.464044988155365, 0.4900807738304138, 0.5161165595054626, 0.5421523451805115, 0.5681881308555603, 0.5942239165306091, 0.6202597618103027, 0.6462955474853516, 0.6723313331604004, 0.6983671188354492, 0.724402904510498, 0.7504386901855469, 0.7764744758605957, 0.8025102615356445, 0.8285460472106934, 0.8545818328857422, 0.8806176781654358, 0.9066534638404846, 0.9326892495155334]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 10.0, 6.0, 17.0, 11.0, 19.0, 41.0, 57.0, 89.0, 154.0, 249.0, 379.0, 633.0, 1154.0, 2127.0, 4255.0, 9212.0, 23001.0, 69972.0, 314080.0, 1936222.0, 1502900.0, 236949.0, 56726.0, 19656.0, 8150.0, 3741.0, 1896.0, 1055.0, 570.0, 373.0, 219.0, 135.0, 70.0, 66.0, 30.0, 25.0, 15.0, 10.0, 2.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.073974609375, -0.07158184051513672, -0.06918907165527344, -0.06679630279541016, -0.06440353393554688, -0.062010765075683594, -0.05961799621582031, -0.05722522735595703, -0.05483245849609375, -0.05243968963623047, -0.05004692077636719, -0.047654151916503906, -0.045261383056640625, -0.042868614196777344, -0.04047584533691406, -0.03808307647705078, -0.0356903076171875, -0.03329753875732422, -0.030904769897460938, -0.028512001037597656, -0.026119232177734375, -0.023726463317871094, -0.021333694458007812, -0.01894092559814453, -0.01654815673828125, -0.014155387878417969, -0.011762619018554688, -0.009369850158691406, -0.006977081298828125, -0.004584312438964844, -0.0021915435791015625, 0.00020122528076171875, 0.002593994140625, 0.004986763000488281, 0.0073795318603515625, 0.009772300720214844, 0.012165069580078125, 0.014557838439941406, 0.016950607299804688, 0.01934337615966797, 0.02173614501953125, 0.02412891387939453, 0.026521682739257812, 0.028914451599121094, 0.031307220458984375, 0.033699989318847656, 0.03609275817871094, 0.03848552703857422, 0.0408782958984375, 0.04327106475830078, 0.04566383361816406, 0.048056602478027344, 0.050449371337890625, 0.052842140197753906, 0.05523490905761719, 0.05762767791748047, 0.06002044677734375, 0.06241321563720703, 0.06480598449707031, 0.0671987533569336, 0.06959152221679688, 0.07198429107666016, 0.07437705993652344, 0.07676982879638672, 0.07916259765625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 9.0, 8.0, 6.0, 13.0, 20.0, 24.0, 25.0, 45.0, 40.0, 65.0, 66.0, 64.0, 56.0, 66.0, 73.0, 54.0, 63.0, 49.0, 49.0, 41.0, 39.0, 35.0, 21.0, 20.0, 13.0, 14.0, 12.0, 4.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.058013916015625, -0.056078433990478516, -0.05414295196533203, -0.05220746994018555, -0.05027198791503906, -0.04833650588989258, -0.046401023864746094, -0.04446554183959961, -0.042530059814453125, -0.04059457778930664, -0.038659095764160156, -0.03672361373901367, -0.03478813171386719, -0.0328526496887207, -0.03091716766357422, -0.028981685638427734, -0.02704620361328125, -0.025110721588134766, -0.02317523956298828, -0.021239757537841797, -0.019304275512695312, -0.017368793487548828, -0.015433311462402344, -0.01349782943725586, -0.011562347412109375, -0.00962686538696289, -0.007691383361816406, -0.005755901336669922, -0.0038204193115234375, -0.0018849372863769531, 5.054473876953125e-05, 0.0019860267639160156, 0.0039215087890625, 0.005856990814208984, 0.007792472839355469, 0.009727954864501953, 0.011663436889648438, 0.013598918914794922, 0.015534400939941406, 0.01746988296508789, 0.019405364990234375, 0.02134084701538086, 0.023276329040527344, 0.025211811065673828, 0.027147293090820312, 0.029082775115966797, 0.03101825714111328, 0.032953739166259766, 0.03488922119140625, 0.036824703216552734, 0.03876018524169922, 0.0406956672668457, 0.04263114929199219, 0.04456663131713867, 0.046502113342285156, 0.04843759536743164, 0.050373077392578125, 0.05230855941772461, 0.054244041442871094, 0.05617952346801758, 0.05811500549316406, 0.06005048751831055, 0.06198596954345703, 0.06392145156860352, 0.06585693359375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 12.0, 7.0, 15.0, 33.0, 59.0, 92.0, 174.0, 357.0, 837.0, 2199.0, 7944.0, 45736.0, 735840.0, 3252189.0, 125738.0, 16393.0, 3954.0, 1387.0, 601.0, 313.0, 165.0, 82.0, 56.0, 26.0, 27.0, 23.0, 8.0, 6.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.259033203125, -0.2524280548095703, -0.24582290649414062, -0.23921775817871094, -0.23261260986328125, -0.22600746154785156, -0.21940231323242188, -0.2127971649169922, -0.2061920166015625, -0.1995868682861328, -0.19298171997070312, -0.18637657165527344, -0.17977142333984375, -0.17316627502441406, -0.16656112670898438, -0.1599559783935547, -0.153350830078125, -0.1467456817626953, -0.14014053344726562, -0.13353538513183594, -0.12693023681640625, -0.12032508850097656, -0.11371994018554688, -0.10711479187011719, -0.1005096435546875, -0.09390449523925781, -0.08729934692382812, -0.08069419860839844, -0.07408905029296875, -0.06748390197753906, -0.060878753662109375, -0.05427360534667969, -0.04766845703125, -0.04106330871582031, -0.034458160400390625, -0.027853012084960938, -0.02124786376953125, -0.014642715454101562, -0.008037567138671875, -0.0014324188232421875, 0.0051727294921875, 0.011777877807617188, 0.018383026123046875, 0.024988174438476562, 0.03159332275390625, 0.03819847106933594, 0.044803619384765625, 0.05140876770019531, 0.058013916015625, 0.06461906433105469, 0.07122421264648438, 0.07782936096191406, 0.08443450927734375, 0.09103965759277344, 0.09764480590820312, 0.10424995422363281, 0.1108551025390625, 0.11746025085449219, 0.12406539916992188, 0.13067054748535156, 0.13727569580078125, 0.14388084411621094, 0.15048599243164062, 0.1570911407470703, 0.1636962890625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 5.0, 4.0, 4.0, 9.0, 17.0, 25.0, 29.0, 49.0, 57.0, 78.0, 138.0, 257.0, 451.0, 757.0, 777.0, 536.0, 329.0, 185.0, 120.0, 68.0, 53.0, 35.0, 27.0, 21.0, 10.0, 4.0, 6.0, 5.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1484375, -0.14253616333007812, -0.13663482666015625, -0.13073348999023438, -0.1248321533203125, -0.11893081665039062, -0.11302947998046875, -0.10712814331054688, -0.101226806640625, -0.09532546997070312, -0.08942413330078125, -0.08352279663085938, -0.0776214599609375, -0.07172012329101562, -0.06581878662109375, -0.059917449951171875, -0.05401611328125, -0.048114776611328125, -0.04221343994140625, -0.036312103271484375, -0.0304107666015625, -0.024509429931640625, -0.01860809326171875, -0.012706756591796875, -0.006805419921875, -0.000904083251953125, 0.00499725341796875, 0.010898590087890625, 0.0167999267578125, 0.022701263427734375, 0.02860260009765625, 0.034503936767578125, 0.0404052734375, 0.046306610107421875, 0.05220794677734375, 0.058109283447265625, 0.0640106201171875, 0.06991195678710938, 0.07581329345703125, 0.08171463012695312, 0.087615966796875, 0.09351730346679688, 0.09941864013671875, 0.10531997680664062, 0.1112213134765625, 0.11712265014648438, 0.12302398681640625, 0.12892532348632812, 0.13482666015625, 0.14072799682617188, 0.14662933349609375, 0.15253067016601562, 0.1584320068359375, 0.16433334350585938, 0.17023468017578125, 0.17613601684570312, 0.182037353515625, 0.18793869018554688, 0.19384002685546875, 0.19974136352539062, 0.2056427001953125, 0.21154403686523438, 0.21744537353515625, 0.22334671020507812, 0.229248046875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 18.0, 73.0, 233.0, 371.0, 221.0, 46.0, 12.0, 5.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5941085815429688, -2.4825284481048584, -2.370948314666748, -2.2593679428100586, -2.1477878093719482, -2.036207675933838, -1.924627423286438, -1.813047170639038, -1.7014670372009277, -1.5898869037628174, -1.4783066511154175, -1.3667263984680176, -1.2551462650299072, -1.1435661315917969, -1.031985878944397, -0.9204056859016418, -0.8088254928588867, -0.6972452998161316, -0.5856651067733765, -0.47408491373062134, -0.3625047206878662, -0.2509245276451111, -0.13934433460235596, -0.02776414155960083, 0.0838160514831543, 0.19539624452590942, 0.30697643756866455, 0.4185566306114197, 0.5301368236541748, 0.6417170166969299, 0.7532972097396851, 0.8648774027824402, 0.9764575958251953, 1.0880377292633057, 1.1996179819107056, 1.3111982345581055, 1.4227783679962158, 1.5343585014343262, 1.645938754081726, 1.757519006729126, 1.8690991401672363, 1.9806792736053467, 2.092259407043457, 2.2038397789001465, 2.315419912338257, 2.427000045776367, 2.5385804176330566, 2.650160551071167, 2.7617406845092773, 2.8733208179473877, 2.984900951385498, 3.0964813232421875, 3.208061456680298, 3.319641590118408, 3.4312219619750977, 3.542802095413208, 3.6543822288513184, 3.7659623622894287, 3.877542495727539, 3.9891228675842285, 4.100703239440918, 4.212283134460449, 4.323863506317139, 4.43544340133667, 4.547023773193359]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 5.0, 7.0, 5.0, 6.0, 10.0, 12.0, 17.0, 14.0, 27.0, 21.0, 36.0, 24.0, 38.0, 35.0, 41.0, 39.0, 36.0, 42.0, 42.0, 38.0, 39.0, 41.0, 40.0, 61.0, 35.0, 38.0, 31.0, 35.0, 27.0, 27.0, 19.0, 20.0, 16.0, 8.0, 13.0, 10.0, 10.0, 3.0, 11.0, 6.0, 2.0, 1.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8110286593437195, -0.786143958568573, -0.7612591981887817, -0.7363744974136353, -0.711489737033844, -0.6866050362586975, -0.6617202758789062, -0.6368355751037598, -0.6119508743286133, -0.5870661735534668, -0.5621814131736755, -0.537296712398529, -0.5124119520187378, -0.4875272512435913, -0.46264252066612244, -0.43775779008865356, -0.4128730297088623, -0.38798829913139343, -0.36310356855392456, -0.3382188677787781, -0.3133341073989868, -0.28844940662384033, -0.26356467604637146, -0.2386799454689026, -0.21379521489143372, -0.18891048431396484, -0.16402575373649597, -0.1391410380601883, -0.11425630748271942, -0.08937157690525055, -0.06448686122894287, -0.039602130651474, -0.014717400074005127, 0.010167326778173447, 0.03505205363035202, 0.059936776757240295, 0.08482150733470917, 0.10970623791217804, 0.13459095358848572, 0.1594756841659546, 0.18436041474342346, 0.20924514532089233, 0.2341298758983612, 0.2590146064758301, 0.28389930725097656, 0.3087840676307678, 0.3336687684059143, 0.3585534989833832, 0.38343822956085205, 0.4083229601383209, 0.4332076907157898, 0.4580923914909363, 0.48297715187072754, 0.507861852645874, 0.5327465534210205, 0.5576313138008118, 0.582516074180603, 0.6074007749557495, 0.6322855353355408, 0.6571702361106873, 0.6820549964904785, 0.706939697265625, 0.7318243980407715, 0.7567091584205627, 0.7815938591957092]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 5.0, 4.0, 5.0, 4.0, 7.0, 6.0, 10.0, 30.0, 55.0, 49.0, 111.0, 170.0, 270.0, 450.0, 918.0, 1820.0, 4002.0, 9630.0, 25722.0, 74489.0, 237077.0, 432107.0, 172495.0, 55605.0, 19577.0, 7449.0, 3137.0, 1512.0, 789.0, 453.0, 216.0, 144.0, 99.0, 41.0, 34.0, 23.0, 18.0, 12.0, 6.0, 2.0, 1.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.092529296875, -0.08873176574707031, -0.08493423461914062, -0.08113670349121094, -0.07733917236328125, -0.07354164123535156, -0.06974411010742188, -0.06594657897949219, -0.0621490478515625, -0.05835151672363281, -0.054553985595703125, -0.05075645446777344, -0.04695892333984375, -0.04316139221191406, -0.039363861083984375, -0.03556632995605469, -0.031768798828125, -0.027971267700195312, -0.024173736572265625, -0.020376205444335938, -0.01657867431640625, -0.012781143188476562, -0.008983612060546875, -0.0051860809326171875, -0.0013885498046875, 0.0024089813232421875, 0.006206512451171875, 0.010004043579101562, 0.01380157470703125, 0.017599105834960938, 0.021396636962890625, 0.025194168090820312, 0.02899169921875, 0.03278923034667969, 0.036586761474609375, 0.04038429260253906, 0.04418182373046875, 0.04797935485839844, 0.051776885986328125, 0.05557441711425781, 0.0593719482421875, 0.06316947937011719, 0.06696701049804688, 0.07076454162597656, 0.07456207275390625, 0.07835960388183594, 0.08215713500976562, 0.08595466613769531, 0.089752197265625, 0.09354972839355469, 0.09734725952148438, 0.10114479064941406, 0.10494232177734375, 0.10873985290527344, 0.11253738403320312, 0.11633491516113281, 0.1201324462890625, 0.12392997741699219, 0.12772750854492188, 0.13152503967285156, 0.13532257080078125, 0.13912010192871094, 0.14291763305664062, 0.1467151641845703, 0.1505126953125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 6.0, 5.0, 6.0, 8.0, 14.0, 5.0, 20.0, 17.0, 21.0, 26.0, 24.0, 23.0, 32.0, 36.0, 38.0, 36.0, 47.0, 37.0, 49.0, 47.0, 48.0, 47.0, 45.0, 37.0, 43.0, 45.0, 35.0, 33.0, 28.0, 19.0, 28.0, 9.0, 19.0, 13.0, 12.0, 9.0, 8.0, 5.0, 6.0, 7.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041168212890625, -0.03974723815917969, -0.038326263427734375, -0.03690528869628906, -0.03548431396484375, -0.03406333923339844, -0.032642364501953125, -0.031221389770507812, -0.0298004150390625, -0.028379440307617188, -0.026958465576171875, -0.025537490844726562, -0.02411651611328125, -0.022695541381835938, -0.021274566650390625, -0.019853591918945312, -0.0184326171875, -0.017011642456054688, -0.015590667724609375, -0.014169692993164062, -0.01274871826171875, -0.011327743530273438, -0.009906768798828125, -0.008485794067382812, -0.0070648193359375, -0.0056438446044921875, -0.004222869873046875, -0.0028018951416015625, -0.00138092041015625, 4.00543212890625e-05, 0.001461029052734375, 0.0028820037841796875, 0.004302978515625, 0.0057239532470703125, 0.007144927978515625, 0.008565902709960938, 0.00998687744140625, 0.011407852172851562, 0.012828826904296875, 0.014249801635742188, 0.0156707763671875, 0.017091751098632812, 0.018512725830078125, 0.019933700561523438, 0.02135467529296875, 0.022775650024414062, 0.024196624755859375, 0.025617599487304688, 0.02703857421875, 0.028459548950195312, 0.029880523681640625, 0.03130149841308594, 0.03272247314453125, 0.03414344787597656, 0.035564422607421875, 0.03698539733886719, 0.0384063720703125, 0.03982734680175781, 0.041248321533203125, 0.04266929626464844, 0.04409027099609375, 0.04551124572753906, 0.046932220458984375, 0.04835319519042969, 0.049774169921875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 5.0, 3.0, 11.0, 10.0, 11.0, 16.0, 20.0, 18.0, 36.0, 46.0, 99.0, 143.0, 228.0, 398.0, 696.0, 1409.0, 2944.0, 8268.0, 38915.0, 585055.0, 364620.0, 32447.0, 7445.0, 2719.0, 1333.0, 673.0, 353.0, 213.0, 147.0, 90.0, 54.0, 36.0, 29.0, 30.0, 11.0, 8.0, 6.0, 3.0, 2.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.26611328125, -0.2580375671386719, -0.24996185302734375, -0.24188613891601562, -0.2338104248046875, -0.22573471069335938, -0.21765899658203125, -0.20958328247070312, -0.201507568359375, -0.19343185424804688, -0.18535614013671875, -0.17728042602539062, -0.1692047119140625, -0.16112899780273438, -0.15305328369140625, -0.14497756958007812, -0.13690185546875, -0.12882614135742188, -0.12075042724609375, -0.11267471313476562, -0.1045989990234375, -0.09652328491210938, -0.08844757080078125, -0.08037185668945312, -0.072296142578125, -0.06422042846679688, -0.05614471435546875, -0.048069000244140625, -0.0399932861328125, -0.031917572021484375, -0.02384185791015625, -0.015766143798828125, -0.0076904296875, 0.000385284423828125, 0.00846099853515625, 0.016536712646484375, 0.0246124267578125, 0.032688140869140625, 0.04076385498046875, 0.048839569091796875, 0.056915283203125, 0.06499099731445312, 0.07306671142578125, 0.08114242553710938, 0.0892181396484375, 0.09729385375976562, 0.10536956787109375, 0.11344528198242188, 0.12152099609375, 0.12959671020507812, 0.13767242431640625, 0.14574813842773438, 0.1538238525390625, 0.16189956665039062, 0.16997528076171875, 0.17805099487304688, 0.186126708984375, 0.19420242309570312, 0.20227813720703125, 0.21035385131835938, 0.2184295654296875, 0.22650527954101562, 0.23458099365234375, 0.24265670776367188, 0.250732421875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 0.0, 5.0, 3.0, 4.0, 6.0, 3.0, 6.0, 14.0, 7.0, 9.0, 13.0, 26.0, 29.0, 18.0, 25.0, 25.0, 38.0, 44.0, 41.0, 50.0, 49.0, 49.0, 46.0, 41.0, 33.0, 39.0, 53.0, 35.0, 45.0, 39.0, 21.0, 25.0, 31.0, 24.0, 17.0, 16.0, 16.0, 12.0, 11.0, 8.0, 6.0, 3.0, 4.0, 4.0, 1.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.2408447265625, -0.23380661010742188, -0.22676849365234375, -0.21973037719726562, -0.2126922607421875, -0.20565414428710938, -0.19861602783203125, -0.19157791137695312, -0.184539794921875, -0.17750167846679688, -0.17046356201171875, -0.16342544555664062, -0.1563873291015625, -0.14934921264648438, -0.14231109619140625, -0.13527297973632812, -0.12823486328125, -0.12119674682617188, -0.11415863037109375, -0.10712051391601562, -0.1000823974609375, -0.09304428100585938, -0.08600616455078125, -0.07896804809570312, -0.071929931640625, -0.06489181518554688, -0.05785369873046875, -0.050815582275390625, -0.0437774658203125, -0.036739349365234375, -0.02970123291015625, -0.022663116455078125, -0.015625, -0.008586883544921875, -0.00154876708984375, 0.005489349365234375, 0.0125274658203125, 0.019565582275390625, 0.02660369873046875, 0.033641815185546875, 0.040679931640625, 0.047718048095703125, 0.05475616455078125, 0.061794281005859375, 0.0688323974609375, 0.07587051391601562, 0.08290863037109375, 0.08994674682617188, 0.09698486328125, 0.10402297973632812, 0.11106109619140625, 0.11809921264648438, 0.1251373291015625, 0.13217544555664062, 0.13921356201171875, 0.14625167846679688, 0.153289794921875, 0.16032791137695312, 0.16736602783203125, 0.17440414428710938, 0.1814422607421875, 0.18848037719726562, 0.19551849365234375, 0.20255661010742188, 0.2095947265625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 7.0, 8.0, 11.0, 17.0, 14.0, 24.0, 32.0, 43.0, 75.0, 113.0, 177.0, 279.0, 509.0, 901.0, 1921.0, 4802.0, 14279.0, 54922.0, 266332.0, 577379.0, 92350.0, 22243.0, 6843.0, 2650.0, 1161.0, 556.0, 332.0, 209.0, 94.0, 78.0, 58.0, 37.0, 28.0, 23.0, 12.0, 9.0, 8.0, 11.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.06561279296875, -0.0635080337524414, -0.06140327453613281, -0.05929851531982422, -0.057193756103515625, -0.05508899688720703, -0.05298423767089844, -0.050879478454589844, -0.04877471923828125, -0.046669960021972656, -0.04456520080566406, -0.04246044158935547, -0.040355682373046875, -0.03825092315673828, -0.03614616394042969, -0.034041404724121094, -0.0319366455078125, -0.029831886291503906, -0.027727127075195312, -0.02562236785888672, -0.023517608642578125, -0.02141284942626953, -0.019308090209960938, -0.017203330993652344, -0.01509857177734375, -0.012993812561035156, -0.010889053344726562, -0.008784294128417969, -0.006679534912109375, -0.004574775695800781, -0.0024700164794921875, -0.00036525726318359375, 0.001739501953125, 0.0038442611694335938, 0.0059490203857421875, 0.008053779602050781, 0.010158538818359375, 0.012263298034667969, 0.014368057250976562, 0.016472816467285156, 0.01857757568359375, 0.020682334899902344, 0.022787094116210938, 0.02489185333251953, 0.026996612548828125, 0.02910137176513672, 0.031206130981445312, 0.033310890197753906, 0.0354156494140625, 0.037520408630371094, 0.03962516784667969, 0.04172992706298828, 0.043834686279296875, 0.04593944549560547, 0.04804420471191406, 0.050148963928222656, 0.05225372314453125, 0.054358482360839844, 0.05646324157714844, 0.05856800079345703, 0.060672760009765625, 0.06277751922607422, 0.06488227844238281, 0.0669870376586914, 0.069091796875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 3.0, 5.0, 4.0, 8.0, 2.0, 12.0, 11.0, 16.0, 16.0, 20.0, 14.0, 19.0, 18.0, 25.0, 37.0, 32.0, 41.0, 69.0, 65.0, 63.0, 60.0, 68.0, 64.0, 52.0, 37.0, 32.0, 30.0, 27.0, 16.0, 14.0, 16.0, 20.0, 11.0, 11.0, 13.0, 9.0, 8.0, 8.0, 6.0, 6.0, 1.0, 4.0, 5.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-2.2530555725097656e-05, -2.1889805793762207e-05, -2.1249055862426758e-05, -2.060830593109131e-05, -1.996755599975586e-05, -1.932680606842041e-05, -1.868605613708496e-05, -1.8045306205749512e-05, -1.7404556274414062e-05, -1.6763806343078613e-05, -1.6123056411743164e-05, -1.5482306480407715e-05, -1.4841556549072266e-05, -1.4200806617736816e-05, -1.3560056686401367e-05, -1.2919306755065918e-05, -1.2278556823730469e-05, -1.163780689239502e-05, -1.099705696105957e-05, -1.0356307029724121e-05, -9.715557098388672e-06, -9.074807167053223e-06, -8.434057235717773e-06, -7.793307304382324e-06, -7.152557373046875e-06, -6.511807441711426e-06, -5.8710575103759766e-06, -5.230307579040527e-06, -4.589557647705078e-06, -3.948807716369629e-06, -3.3080577850341797e-06, -2.6673078536987305e-06, -2.0265579223632812e-06, -1.385807991027832e-06, -7.450580596923828e-07, -1.043081283569336e-07, 5.364418029785156e-07, 1.1771917343139648e-06, 1.817941665649414e-06, 2.4586915969848633e-06, 3.0994415283203125e-06, 3.7401914596557617e-06, 4.380941390991211e-06, 5.02169132232666e-06, 5.662441253662109e-06, 6.303191184997559e-06, 6.943941116333008e-06, 7.584691047668457e-06, 8.225440979003906e-06, 8.866190910339355e-06, 9.506940841674805e-06, 1.0147690773010254e-05, 1.0788440704345703e-05, 1.1429190635681152e-05, 1.2069940567016602e-05, 1.271069049835205e-05, 1.33514404296875e-05, 1.399219036102295e-05, 1.4632940292358398e-05, 1.5273690223693848e-05, 1.5914440155029297e-05, 1.6555190086364746e-05, 1.7195940017700195e-05, 1.7836689949035645e-05, 1.8477439880371094e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 6.0, 5.0, 11.0, 15.0, 29.0, 38.0, 34.0, 67.0, 109.0, 207.0, 380.0, 705.0, 1419.0, 3426.0, 10798.0, 55975.0, 595272.0, 327032.0, 39186.0, 8195.0, 2898.0, 1265.0, 646.0, 332.0, 184.0, 100.0, 82.0, 48.0, 21.0, 16.0, 12.0, 9.0, 8.0, 3.0, 5.0, 7.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.09576416015625, -0.09323787689208984, -0.09071159362792969, -0.08818531036376953, -0.08565902709960938, -0.08313274383544922, -0.08060646057128906, -0.0780801773071289, -0.07555389404296875, -0.0730276107788086, -0.07050132751464844, -0.06797504425048828, -0.06544876098632812, -0.06292247772216797, -0.06039619445800781, -0.057869911193847656, -0.0553436279296875, -0.052817344665527344, -0.05029106140136719, -0.04776477813720703, -0.045238494873046875, -0.04271221160888672, -0.04018592834472656, -0.037659645080566406, -0.03513336181640625, -0.032607078552246094, -0.030080795288085938, -0.02755451202392578, -0.025028228759765625, -0.02250194549560547, -0.019975662231445312, -0.017449378967285156, -0.014923095703125, -0.012396812438964844, -0.009870529174804688, -0.007344245910644531, -0.004817962646484375, -0.0022916793823242188, 0.0002346038818359375, 0.0027608871459960938, 0.00528717041015625, 0.007813453674316406, 0.010339736938476562, 0.012866020202636719, 0.015392303466796875, 0.01791858673095703, 0.020444869995117188, 0.022971153259277344, 0.0254974365234375, 0.028023719787597656, 0.030550003051757812, 0.03307628631591797, 0.035602569580078125, 0.03812885284423828, 0.04065513610839844, 0.043181419372558594, 0.04570770263671875, 0.048233985900878906, 0.05076026916503906, 0.05328655242919922, 0.055812835693359375, 0.05833911895751953, 0.06086540222167969, 0.06339168548583984, 0.06591796875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 8.0, 7.0, 11.0, 9.0, 15.0, 9.0, 18.0, 12.0, 16.0, 19.0, 29.0, 17.0, 40.0, 36.0, 39.0, 43.0, 54.0, 55.0, 58.0, 52.0, 45.0, 54.0, 46.0, 43.0, 32.0, 38.0, 22.0, 31.0, 17.0, 21.0, 17.0, 20.0, 14.0, 7.0, 12.0, 3.0, 5.0, 5.0, 7.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.0560302734375, -0.05443000793457031, -0.052829742431640625, -0.05122947692871094, -0.04962921142578125, -0.04802894592285156, -0.046428680419921875, -0.04482841491699219, -0.0432281494140625, -0.04162788391113281, -0.040027618408203125, -0.03842735290527344, -0.03682708740234375, -0.03522682189941406, -0.033626556396484375, -0.03202629089355469, -0.030426025390625, -0.028825759887695312, -0.027225494384765625, -0.025625228881835938, -0.02402496337890625, -0.022424697875976562, -0.020824432373046875, -0.019224166870117188, -0.0176239013671875, -0.016023635864257812, -0.014423370361328125, -0.012823104858398438, -0.01122283935546875, -0.009622573852539062, -0.008022308349609375, -0.0064220428466796875, -0.00482177734375, -0.0032215118408203125, -0.001621246337890625, -2.09808349609375e-05, 0.00157928466796875, 0.0031795501708984375, 0.004779815673828125, 0.0063800811767578125, 0.0079803466796875, 0.009580612182617188, 0.011180877685546875, 0.012781143188476562, 0.01438140869140625, 0.015981674194335938, 0.017581939697265625, 0.019182205200195312, 0.020782470703125, 0.022382736206054688, 0.023983001708984375, 0.025583267211914062, 0.02718353271484375, 0.028783798217773438, 0.030384063720703125, 0.03198432922363281, 0.0335845947265625, 0.03518486022949219, 0.036785125732421875, 0.03838539123535156, 0.03998565673828125, 0.04158592224121094, 0.043186187744140625, 0.04478645324707031, 0.04638671875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 13.0, 21.0, 23.0, 34.0, 68.0, 100.0, 162.0, 202.0, 139.0, 92.0, 57.0, 32.0, 12.0, 16.0, 10.0, 6.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.1225615739822388, -1.0796549320220947, -1.0367484092712402, -0.9938417673110962, -0.9509351253509521, -0.9080285429954529, -0.8651219606399536, -0.8222153186798096, -0.7793087363243103, -0.736402153968811, -0.693495512008667, -0.6505889296531677, -0.6076823472976685, -0.5647757053375244, -0.5218691229820251, -0.4789625108242035, -0.43605589866638184, -0.3931492865085602, -0.3502426743507385, -0.30733609199523926, -0.2644294798374176, -0.22152286767959595, -0.17861628532409668, -0.13570967316627502, -0.09280306100845337, -0.04989645630121231, -0.0069898515939712524, 0.03591674566268921, 0.07882335782051086, 0.12172996997833252, 0.1646365523338318, 0.20754316449165344, 0.25044965744018555, 0.2933562695980072, 0.33626288175582886, 0.3791694641113281, 0.4220760762691498, 0.46498268842697144, 0.5078892707824707, 0.5507959127426147, 0.593702495098114, 0.6366090774536133, 0.6795157194137573, 0.7224223017692566, 0.7653288841247559, 0.8082355260848999, 0.8511421084403992, 0.8940486907958984, 0.9369553327560425, 0.9798619151115417, 1.022768497467041, 1.065675139427185, 1.108581781387329, 1.1514883041381836, 1.1943949460983276, 1.2373015880584717, 1.2802081108093262, 1.3231147527694702, 1.3660212755203247, 1.4089279174804688, 1.4518345594406128, 1.4947412014007568, 1.5376477241516113, 1.5805543661117554, 1.6234610080718994]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 4.0, 0.0, 5.0, 1.0, 5.0, 5.0, 6.0, 8.0, 9.0, 6.0, 17.0, 13.0, 23.0, 18.0, 28.0, 27.0, 34.0, 42.0, 33.0, 42.0, 34.0, 65.0, 81.0, 57.0, 53.0, 55.0, 68.0, 36.0, 31.0, 32.0, 26.0, 15.0, 24.0, 12.0, 9.0, 14.0, 18.0, 14.0, 10.0, 3.0, 8.0, 7.0, 2.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-1.043489694595337, -1.0154638290405273, -0.9874380230903625, -0.9594122171401978, -0.931386411190033, -0.9033605456352234, -0.8753347396850586, -0.847308874130249, -0.8192830681800842, -0.7912572622299194, -0.7632313966751099, -0.7352055907249451, -0.7071797847747803, -0.6791539192199707, -0.6511281132698059, -0.6231023073196411, -0.5950764417648315, -0.5670506358146667, -0.5390247702598572, -0.5109989643096924, -0.4829731285572052, -0.454947292804718, -0.4269214868545532, -0.39889565110206604, -0.37086987495422363, -0.34284403920173645, -0.31481823325157166, -0.2867923974990845, -0.2587665617465973, -0.2307407408952713, -0.2027149200439453, -0.17468908429145813, -0.14666324853897095, -0.11863742023706436, -0.09061159193515778, -0.06258577108383179, -0.0345599427819252, -0.006534114480018616, 0.021491706371307373, 0.049517542123794556, 0.07754336297512054, 0.10556919127702713, 0.13359501957893372, 0.1616208404302597, 0.1896466612815857, 0.21767249703407288, 0.24569831788539886, 0.27372413873672485, 0.30174997448921204, 0.3297758102416992, 0.357801616191864, 0.3858274519443512, 0.4138532876968384, 0.4418790936470032, 0.46990492939949036, 0.49793076515197754, 0.5259565711021423, 0.5539823770523071, 0.5820082426071167, 0.6100340485572815, 0.6380598545074463, 0.6660857200622559, 0.6941115260124207, 0.7221373319625854, 0.750163197517395]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 8.0, 9.0, 21.0, 21.0, 44.0, 66.0, 116.0, 201.0, 413.0, 682.0, 1434.0, 2974.0, 6862.0, 16718.0, 49970.0, 197669.0, 1165404.0, 2159560.0, 452591.0, 93452.0, 27585.0, 9997.0, 4314.0, 1965.0, 1010.0, 513.0, 260.0, 163.0, 104.0, 66.0, 33.0, 13.0, 13.0, 9.0, 7.0, 9.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06207275390625, -0.05994987487792969, -0.057826995849609375, -0.05570411682128906, -0.05358123779296875, -0.05145835876464844, -0.049335479736328125, -0.04721260070800781, -0.0450897216796875, -0.04296684265136719, -0.040843963623046875, -0.03872108459472656, -0.03659820556640625, -0.03447532653808594, -0.032352447509765625, -0.030229568481445312, -0.028106689453125, -0.025983810424804688, -0.023860931396484375, -0.021738052368164062, -0.01961517333984375, -0.017492294311523438, -0.015369415283203125, -0.013246536254882812, -0.0111236572265625, -0.009000778198242188, -0.006877899169921875, -0.0047550201416015625, -0.00263214111328125, -0.0005092620849609375, 0.001613616943359375, 0.0037364959716796875, 0.005859375, 0.007982254028320312, 0.010105133056640625, 0.012228012084960938, 0.01435089111328125, 0.016473770141601562, 0.018596649169921875, 0.020719528198242188, 0.0228424072265625, 0.024965286254882812, 0.027088165283203125, 0.029211044311523438, 0.03133392333984375, 0.03345680236816406, 0.035579681396484375, 0.03770256042480469, 0.039825439453125, 0.04194831848144531, 0.044071197509765625, 0.04619407653808594, 0.04831695556640625, 0.05043983459472656, 0.052562713623046875, 0.05468559265136719, 0.0568084716796875, 0.05893135070800781, 0.061054229736328125, 0.06317710876464844, 0.06529998779296875, 0.06742286682128906, 0.06954574584960938, 0.07166862487792969, 0.07379150390625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 4.0, 9.0, 8.0, 14.0, 13.0, 16.0, 15.0, 17.0, 30.0, 27.0, 27.0, 30.0, 40.0, 52.0, 49.0, 37.0, 38.0, 62.0, 51.0, 49.0, 49.0, 40.0, 49.0, 43.0, 37.0, 45.0, 24.0, 26.0, 27.0, 18.0, 10.0, 13.0, 3.0, 8.0, 4.0, 4.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.047515869140625, -0.04597282409667969, -0.044429779052734375, -0.04288673400878906, -0.04134368896484375, -0.03980064392089844, -0.038257598876953125, -0.03671455383300781, -0.0351715087890625, -0.03362846374511719, -0.032085418701171875, -0.030542373657226562, -0.02899932861328125, -0.027456283569335938, -0.025913238525390625, -0.024370193481445312, -0.0228271484375, -0.021284103393554688, -0.019741058349609375, -0.018198013305664062, -0.01665496826171875, -0.015111923217773438, -0.013568878173828125, -0.012025833129882812, -0.0104827880859375, -0.008939743041992188, -0.007396697998046875, -0.0058536529541015625, -0.00431060791015625, -0.0027675628662109375, -0.001224517822265625, 0.0003185272216796875, 0.001861572265625, 0.0034046173095703125, 0.004947662353515625, 0.0064907073974609375, 0.00803375244140625, 0.009576797485351562, 0.011119842529296875, 0.012662887573242188, 0.0142059326171875, 0.015748977661132812, 0.017292022705078125, 0.018835067749023438, 0.02037811279296875, 0.021921157836914062, 0.023464202880859375, 0.025007247924804688, 0.02655029296875, 0.028093338012695312, 0.029636383056640625, 0.031179428100585938, 0.03272247314453125, 0.03426551818847656, 0.035808563232421875, 0.03735160827636719, 0.0388946533203125, 0.04043769836425781, 0.041980743408203125, 0.04352378845214844, 0.04506683349609375, 0.04660987854003906, 0.048152923583984375, 0.04969596862792969, 0.051239013671875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 6.0, 4.0, 4.0, 7.0, 7.0, 16.0, 18.0, 12.0, 56.0, 65.0, 79.0, 167.0, 266.0, 446.0, 929.0, 2264.0, 6368.0, 19486.0, 84292.0, 737673.0, 2976954.0, 295493.0, 48915.0, 13119.0, 4420.0, 1628.0, 662.0, 357.0, 204.0, 113.0, 87.0, 55.0, 30.0, 22.0, 16.0, 8.0, 9.0, 8.0, 5.0, 1.0, 7.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1156005859375, -0.11165809631347656, -0.10771560668945312, -0.10377311706542969, -0.09983062744140625, -0.09588813781738281, -0.09194564819335938, -0.08800315856933594, -0.0840606689453125, -0.08011817932128906, -0.07617568969726562, -0.07223320007324219, -0.06829071044921875, -0.06434822082519531, -0.060405731201171875, -0.05646324157714844, -0.052520751953125, -0.04857826232910156, -0.044635772705078125, -0.04069328308105469, -0.03675079345703125, -0.03280830383300781, -0.028865814208984375, -0.024923324584960938, -0.0209808349609375, -0.017038345336914062, -0.013095855712890625, -0.009153366088867188, -0.00521087646484375, -0.0012683868408203125, 0.002674102783203125, 0.0066165924072265625, 0.01055908203125, 0.014501571655273438, 0.018444061279296875, 0.022386550903320312, 0.02632904052734375, 0.030271530151367188, 0.034214019775390625, 0.03815650939941406, 0.0420989990234375, 0.04604148864746094, 0.049983978271484375, 0.05392646789550781, 0.05786895751953125, 0.06181144714355469, 0.06575393676757812, 0.06969642639160156, 0.073638916015625, 0.07758140563964844, 0.08152389526367188, 0.08546638488769531, 0.08940887451171875, 0.09335136413574219, 0.09729385375976562, 0.10123634338378906, 0.1051788330078125, 0.10912132263183594, 0.11306381225585938, 0.11700630187988281, 0.12094879150390625, 0.12489128112792969, 0.12883377075195312, 0.13277626037597656, 0.13671875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 3.0, 1.0, 3.0, 5.0, 8.0, 5.0, 10.0, 9.0, 8.0, 15.0, 17.0, 18.0, 38.0, 46.0, 45.0, 55.0, 69.0, 118.0, 158.0, 203.0, 276.0, 430.0, 522.0, 493.0, 372.0, 287.0, 229.0, 143.0, 123.0, 76.0, 69.0, 47.0, 28.0, 30.0, 25.0, 16.0, 11.0, 9.0, 5.0, 1.0, 14.0, 6.0, 8.0, 8.0, 4.0, 0.0, 3.0, 2.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.092529296875, -0.08933639526367188, -0.08614349365234375, -0.08295059204101562, -0.0797576904296875, -0.07656478881835938, -0.07337188720703125, -0.07017898559570312, -0.066986083984375, -0.06379318237304688, -0.06060028076171875, -0.057407379150390625, -0.0542144775390625, -0.051021575927734375, -0.04782867431640625, -0.044635772705078125, -0.04144287109375, -0.038249969482421875, -0.03505706787109375, -0.031864166259765625, -0.0286712646484375, -0.025478363037109375, -0.02228546142578125, -0.019092559814453125, -0.015899658203125, -0.012706756591796875, -0.00951385498046875, -0.006320953369140625, -0.0031280517578125, 6.4849853515625e-05, 0.00325775146484375, 0.006450653076171875, 0.0096435546875, 0.012836456298828125, 0.01602935791015625, 0.019222259521484375, 0.0224151611328125, 0.025608062744140625, 0.02880096435546875, 0.031993865966796875, 0.035186767578125, 0.038379669189453125, 0.04157257080078125, 0.044765472412109375, 0.0479583740234375, 0.051151275634765625, 0.05434417724609375, 0.057537078857421875, 0.06072998046875, 0.06392288208007812, 0.06711578369140625, 0.07030868530273438, 0.0735015869140625, 0.07669448852539062, 0.07988739013671875, 0.08308029174804688, 0.086273193359375, 0.08946609497070312, 0.09265899658203125, 0.09585189819335938, 0.0990447998046875, 0.10223770141601562, 0.10543060302734375, 0.10862350463867188, 0.11181640625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 6.0, 12.0, 25.0, 80.0, 164.0, 280.0, 219.0, 116.0, 51.0, 20.0, 9.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4146473407745361, -1.3522950410842896, -1.289942741394043, -1.2275904417037964, -1.1652381420135498, -1.1028858423233032, -1.0405335426330566, -0.9781813025474548, -0.9158290028572083, -0.8534767031669617, -0.7911244034767151, -0.7287721633911133, -0.6664198637008667, -0.6040675640106201, -0.5417152643203735, -0.47936296463012695, -0.41701066493988037, -0.3546583652496338, -0.2923060655593872, -0.229953795671463, -0.16760149598121643, -0.10524919629096985, -0.042896926403045654, 0.019455373287200928, 0.08180767297744751, 0.1441599726676941, 0.20651225745677948, 0.26886454224586487, 0.33121684193611145, 0.39356914162635803, 0.4559214115142822, 0.5182737112045288, 0.5806260108947754, 0.642978310585022, 0.7053306102752686, 0.7676829099655151, 0.8300352096557617, 0.8923875093460083, 0.9547397494316101, 1.017091989517212, 1.079444408416748, 1.1417967081069946, 1.2041490077972412, 1.2665013074874878, 1.3288536071777344, 1.391205906867981, 1.4535582065582275, 1.5159103870391846, 1.5782626867294312, 1.6406149864196777, 1.7029672861099243, 1.765319585800171, 1.8276718854904175, 1.890024185180664, 1.952376365661621, 2.0147287845611572, 2.0770809650421143, 2.1394331455230713, 2.2017855644226074, 2.2641377449035645, 2.3264901638031006, 2.3888423442840576, 2.4511947631835938, 2.513546943664551, 2.575899362564087]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 2.0, 8.0, 9.0, 12.0, 9.0, 10.0, 15.0, 19.0, 26.0, 20.0, 29.0, 25.0, 39.0, 35.0, 46.0, 47.0, 50.0, 50.0, 39.0, 57.0, 63.0, 48.0, 50.0, 37.0, 28.0, 30.0, 31.0, 33.0, 26.0, 22.0, 16.0, 14.0, 12.0, 9.0, 5.0, 9.0, 9.0, 6.0, 3.0, 1.0, 1.0, 2.0, 5.0, 1.0], "bins": [-0.7618774771690369, -0.7423037886619568, -0.7227301597595215, -0.7031564712524414, -0.6835827827453613, -0.6640090942382812, -0.6444354057312012, -0.6248617768287659, -0.6052880883216858, -0.5857143998146057, -0.5661407709121704, -0.5465670824050903, -0.5269933938980103, -0.5074197053909302, -0.4878460466861725, -0.4682723879814148, -0.4486986994743347, -0.42912501096725464, -0.40955135226249695, -0.38997769355773926, -0.3704040050506592, -0.3508303165435791, -0.3312566578388214, -0.3116829991340637, -0.29210931062698364, -0.27253562211990356, -0.2529619634151459, -0.233388289809227, -0.2138146162033081, -0.19424094259738922, -0.17466726899147034, -0.15509359538555145, -0.13551992177963257, -0.11594624817371368, -0.0963725745677948, -0.07679890096187592, -0.05722522735595703, -0.03765155375003815, -0.018077880144119263, 0.0014957934617996216, 0.021069467067718506, 0.04064314067363739, 0.060216814279556274, 0.07979048788547516, 0.09936416149139404, 0.11893783509731293, 0.1385115087032318, 0.1580851823091507, 0.17765885591506958, 0.19723252952098846, 0.21680620312690735, 0.23637987673282623, 0.2559535503387451, 0.2755272388458252, 0.2951008975505829, 0.3146745562553406, 0.33424824476242065, 0.35382193326950073, 0.3733955919742584, 0.3929692506790161, 0.4125429391860962, 0.43211662769317627, 0.45169028639793396, 0.47126394510269165, 0.49083763360977173]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 6.0, 7.0, 22.0, 15.0, 46.0, 50.0, 104.0, 193.0, 331.0, 685.0, 1342.0, 2837.0, 6480.0, 18029.0, 60192.0, 262146.0, 509846.0, 131878.0, 34696.0, 11213.0, 4406.0, 1966.0, 952.0, 502.0, 255.0, 135.0, 87.0, 52.0, 32.0, 27.0, 10.0, 5.0, 6.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1378173828125, -0.13341140747070312, -0.12900543212890625, -0.12459945678710938, -0.1201934814453125, -0.11578750610351562, -0.11138153076171875, -0.10697555541992188, -0.102569580078125, -0.09816360473632812, -0.09375762939453125, -0.08935165405273438, -0.0849456787109375, -0.08053970336914062, -0.07613372802734375, -0.07172775268554688, -0.06732177734375, -0.06291580200195312, -0.05850982666015625, -0.054103851318359375, -0.0496978759765625, -0.045291900634765625, -0.04088592529296875, -0.036479949951171875, -0.032073974609375, -0.027667999267578125, -0.02326202392578125, -0.018856048583984375, -0.0144500732421875, -0.010044097900390625, -0.00563812255859375, -0.001232147216796875, 0.003173828125, 0.007579803466796875, 0.01198577880859375, 0.016391754150390625, 0.0207977294921875, 0.025203704833984375, 0.02960968017578125, 0.034015655517578125, 0.038421630859375, 0.042827606201171875, 0.04723358154296875, 0.051639556884765625, 0.0560455322265625, 0.060451507568359375, 0.06485748291015625, 0.06926345825195312, 0.07366943359375, 0.07807540893554688, 0.08248138427734375, 0.08688735961914062, 0.0912933349609375, 0.09569931030273438, 0.10010528564453125, 0.10451126098632812, 0.108917236328125, 0.11332321166992188, 0.11772918701171875, 0.12213516235351562, 0.1265411376953125, 0.13094711303710938, 0.13535308837890625, 0.13975906372070312, 0.1441650390625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 7.0, 4.0, 7.0, 11.0, 5.0, 5.0, 11.0, 14.0, 22.0, 14.0, 22.0, 21.0, 46.0, 53.0, 38.0, 32.0, 46.0, 45.0, 55.0, 52.0, 55.0, 55.0, 38.0, 44.0, 47.0, 27.0, 43.0, 38.0, 36.0, 27.0, 17.0, 16.0, 13.0, 8.0, 10.0, 9.0, 1.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.05877685546875, -0.05713605880737305, -0.055495262145996094, -0.05385446548461914, -0.05221366882324219, -0.050572872161865234, -0.04893207550048828, -0.04729127883911133, -0.045650482177734375, -0.04400968551635742, -0.04236888885498047, -0.040728092193603516, -0.03908729553222656, -0.03744649887084961, -0.035805702209472656, -0.0341649055480957, -0.03252410888671875, -0.030883312225341797, -0.029242515563964844, -0.02760171890258789, -0.025960922241210938, -0.024320125579833984, -0.02267932891845703, -0.021038532257080078, -0.019397735595703125, -0.017756938934326172, -0.01611614227294922, -0.014475345611572266, -0.012834548950195312, -0.01119375228881836, -0.009552955627441406, -0.007912158966064453, -0.0062713623046875, -0.004630565643310547, -0.0029897689819335938, -0.0013489723205566406, 0.0002918243408203125, 0.0019326210021972656, 0.0035734176635742188, 0.005214214324951172, 0.006855010986328125, 0.008495807647705078, 0.010136604309082031, 0.011777400970458984, 0.013418197631835938, 0.01505899429321289, 0.016699790954589844, 0.018340587615966797, 0.01998138427734375, 0.021622180938720703, 0.023262977600097656, 0.02490377426147461, 0.026544570922851562, 0.028185367584228516, 0.02982616424560547, 0.03146696090698242, 0.033107757568359375, 0.03474855422973633, 0.03638935089111328, 0.038030147552490234, 0.03967094421386719, 0.04131174087524414, 0.042952537536621094, 0.04459333419799805, 0.046234130859375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 4.0, 9.0, 8.0, 12.0, 32.0, 43.0, 69.0, 118.0, 199.0, 414.0, 899.0, 2139.0, 7842.0, 60659.0, 844909.0, 114862.0, 11475.0, 2777.0, 1020.0, 455.0, 272.0, 124.0, 69.0, 45.0, 43.0, 16.0, 16.0, 11.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.249755859375, -0.24071121215820312, -0.23166656494140625, -0.22262191772460938, -0.2135772705078125, -0.20453262329101562, -0.19548797607421875, -0.18644332885742188, -0.177398681640625, -0.16835403442382812, -0.15930938720703125, -0.15026473999023438, -0.1412200927734375, -0.13217544555664062, -0.12313079833984375, -0.11408615112304688, -0.10504150390625, -0.09599685668945312, -0.08695220947265625, -0.07790756225585938, -0.0688629150390625, -0.059818267822265625, -0.05077362060546875, -0.041728973388671875, -0.032684326171875, -0.023639678955078125, -0.01459503173828125, -0.005550384521484375, 0.0034942626953125, 0.012538909912109375, 0.02158355712890625, 0.030628204345703125, 0.0396728515625, 0.048717498779296875, 0.05776214599609375, 0.06680679321289062, 0.0758514404296875, 0.08489608764648438, 0.09394073486328125, 0.10298538208007812, 0.112030029296875, 0.12107467651367188, 0.13011932373046875, 0.13916397094726562, 0.1482086181640625, 0.15725326538085938, 0.16629791259765625, 0.17534255981445312, 0.18438720703125, 0.19343185424804688, 0.20247650146484375, 0.21152114868164062, 0.2205657958984375, 0.22961044311523438, 0.23865509033203125, 0.24769973754882812, 0.256744384765625, 0.2657890319824219, 0.27483367919921875, 0.2838783264160156, 0.2929229736328125, 0.3019676208496094, 0.31101226806640625, 0.3200569152832031, 0.3291015625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 6.0, 5.0, 6.0, 7.0, 4.0, 9.0, 6.0, 10.0, 12.0, 14.0, 14.0, 18.0, 15.0, 20.0, 28.0, 27.0, 30.0, 35.0, 53.0, 28.0, 33.0, 38.0, 41.0, 35.0, 47.0, 47.0, 42.0, 42.0, 45.0, 39.0, 36.0, 26.0, 29.0, 18.0, 18.0, 14.0, 19.0, 12.0, 19.0, 9.0, 6.0, 9.0, 7.0, 3.0, 4.0, 4.0, 4.0, 3.0, 2.0, 5.0, 6.0, 2.0, 1.0, 1.0], "bins": [-0.1964111328125, -0.1906261444091797, -0.18484115600585938, -0.17905616760253906, -0.17327117919921875, -0.16748619079589844, -0.16170120239257812, -0.1559162139892578, -0.1501312255859375, -0.1443462371826172, -0.13856124877929688, -0.13277626037597656, -0.12699127197265625, -0.12120628356933594, -0.11542129516601562, -0.10963630676269531, -0.103851318359375, -0.09806632995605469, -0.09228134155273438, -0.08649635314941406, -0.08071136474609375, -0.07492637634277344, -0.06914138793945312, -0.06335639953613281, -0.0575714111328125, -0.05178642272949219, -0.046001434326171875, -0.04021644592285156, -0.03443145751953125, -0.028646469116210938, -0.022861480712890625, -0.017076492309570312, -0.01129150390625, -0.0055065155029296875, 0.000278472900390625, 0.0060634613037109375, 0.01184844970703125, 0.017633438110351562, 0.023418426513671875, 0.029203414916992188, 0.0349884033203125, 0.04077339172363281, 0.046558380126953125, 0.05234336853027344, 0.05812835693359375, 0.06391334533691406, 0.06969833374023438, 0.07548332214355469, 0.081268310546875, 0.08705329895019531, 0.09283828735351562, 0.09862327575683594, 0.10440826416015625, 0.11019325256347656, 0.11597824096679688, 0.12176322937011719, 0.1275482177734375, 0.1333332061767578, 0.13911819458007812, 0.14490318298339844, 0.15068817138671875, 0.15647315979003906, 0.16225814819335938, 0.1680431365966797, 0.173828125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 2.0, 2.0, 11.0, 8.0, 7.0, 7.0, 17.0, 29.0, 28.0, 53.0, 74.0, 89.0, 124.0, 216.0, 343.0, 560.0, 995.0, 1900.0, 4238.0, 10173.0, 30744.0, 111268.0, 556172.0, 240850.0, 59850.0, 17958.0, 6593.0, 2858.0, 1387.0, 776.0, 409.0, 267.0, 168.0, 105.0, 70.0, 63.0, 37.0, 22.0, 22.0, 12.0, 12.0, 14.0, 6.0, 5.0, 6.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.052337646484375, -0.05057954788208008, -0.048821449279785156, -0.047063350677490234, -0.04530525207519531, -0.04354715347290039, -0.04178905487060547, -0.04003095626831055, -0.038272857666015625, -0.0365147590637207, -0.03475666046142578, -0.03299856185913086, -0.031240463256835938, -0.029482364654541016, -0.027724266052246094, -0.025966167449951172, -0.02420806884765625, -0.022449970245361328, -0.020691871643066406, -0.018933773040771484, -0.017175674438476562, -0.01541757583618164, -0.013659477233886719, -0.011901378631591797, -0.010143280029296875, -0.008385181427001953, -0.006627082824707031, -0.004868984222412109, -0.0031108856201171875, -0.0013527870178222656, 0.00040531158447265625, 0.002163410186767578, 0.0039215087890625, 0.005679607391357422, 0.007437705993652344, 0.009195804595947266, 0.010953903198242188, 0.01271200180053711, 0.014470100402832031, 0.016228199005126953, 0.017986297607421875, 0.019744396209716797, 0.02150249481201172, 0.02326059341430664, 0.025018692016601562, 0.026776790618896484, 0.028534889221191406, 0.030292987823486328, 0.03205108642578125, 0.03380918502807617, 0.035567283630371094, 0.037325382232666016, 0.03908348083496094, 0.04084157943725586, 0.04259967803955078, 0.0443577766418457, 0.046115875244140625, 0.04787397384643555, 0.04963207244873047, 0.05139017105102539, 0.05314826965332031, 0.054906368255615234, 0.056664466857910156, 0.05842256546020508, 0.0601806640625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 5.0, 2.0, 2.0, 4.0, 5.0, 2.0, 8.0, 8.0, 12.0, 14.0, 21.0, 18.0, 30.0, 34.0, 32.0, 42.0, 65.0, 63.0, 52.0, 69.0, 76.0, 64.0, 71.0, 54.0, 31.0, 24.0, 31.0, 31.0, 26.0, 19.0, 15.0, 13.0, 16.0, 15.0, 5.0, 6.0, 3.0, 3.0, 3.0, 2.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.390146255493164e-05, -2.3271888494491577e-05, -2.2642314434051514e-05, -2.201274037361145e-05, -2.1383166313171387e-05, -2.0753592252731323e-05, -2.012401819229126e-05, -1.9494444131851196e-05, -1.8864870071411133e-05, -1.823529601097107e-05, -1.7605721950531006e-05, -1.6976147890090942e-05, -1.634657382965088e-05, -1.5716999769210815e-05, -1.5087425708770752e-05, -1.4457851648330688e-05, -1.3828277587890625e-05, -1.3198703527450562e-05, -1.2569129467010498e-05, -1.1939555406570435e-05, -1.1309981346130371e-05, -1.0680407285690308e-05, -1.0050833225250244e-05, -9.42125916481018e-06, -8.791685104370117e-06, -8.162111043930054e-06, -7.53253698348999e-06, -6.902962923049927e-06, -6.273388862609863e-06, -5.6438148021698e-06, -5.014240741729736e-06, -4.384666681289673e-06, -3.7550926208496094e-06, -3.125518560409546e-06, -2.4959444999694824e-06, -1.866370439529419e-06, -1.2367963790893555e-06, -6.07222318649292e-07, 2.2351741790771484e-08, 6.51925802230835e-07, 1.2814998626708984e-06, 1.911073923110962e-06, 2.5406479835510254e-06, 3.170222043991089e-06, 3.7997961044311523e-06, 4.429370164871216e-06, 5.058944225311279e-06, 5.688518285751343e-06, 6.318092346191406e-06, 6.94766640663147e-06, 7.577240467071533e-06, 8.206814527511597e-06, 8.83638858795166e-06, 9.465962648391724e-06, 1.0095536708831787e-05, 1.072511076927185e-05, 1.1354684829711914e-05, 1.1984258890151978e-05, 1.2613832950592041e-05, 1.3243407011032104e-05, 1.3872981071472168e-05, 1.4502555131912231e-05, 1.5132129192352295e-05, 1.576170325279236e-05, 1.6391277313232422e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 1.0, 2.0, 5.0, 10.0, 13.0, 11.0, 21.0, 25.0, 46.0, 56.0, 95.0, 147.0, 239.0, 435.0, 847.0, 1772.0, 4271.0, 13221.0, 59628.0, 501646.0, 388269.0, 57321.0, 12682.0, 4180.0, 1713.0, 769.0, 427.0, 279.0, 144.0, 99.0, 60.0, 34.0, 27.0, 16.0, 16.0, 10.0, 5.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0740966796875, -0.07191658020019531, -0.06973648071289062, -0.06755638122558594, -0.06537628173828125, -0.06319618225097656, -0.061016082763671875, -0.05883598327636719, -0.0566558837890625, -0.05447578430175781, -0.052295684814453125, -0.05011558532714844, -0.04793548583984375, -0.04575538635253906, -0.043575286865234375, -0.04139518737792969, -0.039215087890625, -0.03703498840332031, -0.034854888916015625, -0.03267478942871094, -0.03049468994140625, -0.028314590454101562, -0.026134490966796875, -0.023954391479492188, -0.0217742919921875, -0.019594192504882812, -0.017414093017578125, -0.015233993530273438, -0.01305389404296875, -0.010873794555664062, -0.008693695068359375, -0.0065135955810546875, -0.00433349609375, -0.0021533966064453125, 2.6702880859375e-05, 0.0022068023681640625, 0.00438690185546875, 0.0065670013427734375, 0.008747100830078125, 0.010927200317382812, 0.0131072998046875, 0.015287399291992188, 0.017467498779296875, 0.019647598266601562, 0.02182769775390625, 0.024007797241210938, 0.026187896728515625, 0.028367996215820312, 0.030548095703125, 0.03272819519042969, 0.034908294677734375, 0.03708839416503906, 0.03926849365234375, 0.04144859313964844, 0.043628692626953125, 0.04580879211425781, 0.0479888916015625, 0.05016899108886719, 0.052349090576171875, 0.05452919006347656, 0.05670928955078125, 0.05888938903808594, 0.061069488525390625, 0.06324958801269531, 0.0654296875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 5.0, 3.0, 7.0, 13.0, 7.0, 13.0, 15.0, 13.0, 15.0, 14.0, 28.0, 35.0, 37.0, 41.0, 57.0, 57.0, 82.0, 56.0, 57.0, 65.0, 57.0, 64.0, 42.0, 31.0, 33.0, 33.0, 20.0, 13.0, 22.0, 15.0, 8.0, 6.0, 10.0, 10.0, 3.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048736572265625, -0.04724407196044922, -0.04575157165527344, -0.044259071350097656, -0.042766571044921875, -0.041274070739746094, -0.03978157043457031, -0.03828907012939453, -0.03679656982421875, -0.03530406951904297, -0.03381156921386719, -0.032319068908691406, -0.030826568603515625, -0.029334068298339844, -0.027841567993164062, -0.02634906768798828, -0.0248565673828125, -0.02336406707763672, -0.021871566772460938, -0.020379066467285156, -0.018886566162109375, -0.017394065856933594, -0.015901565551757812, -0.014409065246582031, -0.01291656494140625, -0.011424064636230469, -0.009931564331054688, -0.008439064025878906, -0.006946563720703125, -0.005454063415527344, -0.0039615631103515625, -0.0024690628051757812, -0.0009765625, 0.0005159378051757812, 0.0020084381103515625, 0.0035009384155273438, 0.004993438720703125, 0.006485939025878906, 0.007978439331054688, 0.009470939636230469, 0.01096343994140625, 0.012455940246582031, 0.013948440551757812, 0.015440940856933594, 0.016933441162109375, 0.018425941467285156, 0.019918441772460938, 0.02141094207763672, 0.0229034423828125, 0.02439594268798828, 0.025888442993164062, 0.027380943298339844, 0.028873443603515625, 0.030365943908691406, 0.03185844421386719, 0.03335094451904297, 0.03484344482421875, 0.03633594512939453, 0.03782844543457031, 0.039320945739746094, 0.040813446044921875, 0.042305946350097656, 0.04379844665527344, 0.04529094696044922, 0.046783447265625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 8.0, 8.0, 20.0, 64.0, 127.0, 322.0, 252.0, 112.0, 50.0, 17.0, 9.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4606847763061523, -1.3905689716339111, -1.3204530477523804, -1.2503372430801392, -1.1802213191986084, -1.1101055145263672, -1.039989709854126, -0.96987384557724, -0.899757981300354, -0.829642117023468, -0.759526252746582, -0.6894104480743408, -0.6192945837974548, -0.5491787195205688, -0.47906288504600525, -0.40894705057144165, -0.33883118629455566, -0.2687153220176697, -0.19859948754310608, -0.1284836381673813, -0.058367788791656494, 0.011748075485229492, 0.08186390995979309, 0.1519797444343567, 0.22209560871124268, 0.29221147298812866, 0.36232730746269226, 0.43244314193725586, 0.5025590062141418, 0.5726748704910278, 0.642790675163269, 0.712906539440155, 0.7830226421356201, 0.8531385064125061, 0.9232543706893921, 0.9933701753616333, 1.063486099243164, 1.1336019039154053, 1.2037177085876465, 1.2738335132598877, 1.3439494371414185, 1.4140652418136597, 1.4841811656951904, 1.5542969703674316, 1.6244127750396729, 1.6945286989212036, 1.7646445035934448, 1.8347604274749756, 1.9048762321472168, 1.974992036819458, 2.045107841491699, 2.1152238845825195, 2.1853396892547607, 2.255455493927002, 2.325571298599243, 2.3956871032714844, 2.4658031463623047, 2.535918951034546, 2.606034755706787, 2.6761507987976074, 2.7462666034698486, 2.81638240814209, 2.886498212814331, 2.9566140174865723, 3.0267298221588135]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 6.0, 4.0, 5.0, 11.0, 5.0, 11.0, 6.0, 13.0, 16.0, 15.0, 21.0, 25.0, 29.0, 30.0, 31.0, 30.0, 43.0, 36.0, 48.0, 68.0, 61.0, 65.0, 60.0, 43.0, 53.0, 35.0, 31.0, 22.0, 23.0, 20.0, 19.0, 17.0, 16.0, 13.0, 11.0, 14.0, 7.0, 7.0, 7.0, 6.0, 1.0, 4.0, 6.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.8308830857276917, -0.8063111305236816, -0.7817391753196716, -0.7571672201156616, -0.7325952649116516, -0.7080233097076416, -0.6834513545036316, -0.6588793992996216, -0.6343074440956116, -0.6097354888916016, -0.5851635336875916, -0.5605915784835815, -0.5360196232795715, -0.5114476680755615, -0.4868757128715515, -0.4623037576675415, -0.4377318322658539, -0.41315987706184387, -0.38858792185783386, -0.36401596665382385, -0.33944401144981384, -0.31487205624580383, -0.2903001308441162, -0.2657281756401062, -0.241156205534935, -0.216584250330925, -0.19201229512691498, -0.16744035482406616, -0.14286839962005615, -0.11829643696546555, -0.09372448921203613, -0.06915253400802612, -0.04458057880401611, -0.020008625462651253, 0.004563327878713608, 0.02913527935743332, 0.05370723456144333, 0.07827918976545334, 0.10285113751888275, 0.12742309272289276, 0.15199504792690277, 0.17656700313091278, 0.2011389583349228, 0.2257108986377716, 0.2502828538417816, 0.2748548090457916, 0.29942676424980164, 0.32399871945381165, 0.34857067465782166, 0.37314262986183167, 0.3977145850658417, 0.4222865402698517, 0.4468584954738617, 0.4714304506778717, 0.4960023760795593, 0.5205743312835693, 0.5451462864875793, 0.5697182416915894, 0.5942901968955994, 0.6188621520996094, 0.6434341073036194, 0.6680060625076294, 0.6925780177116394, 0.7171499729156494, 0.7417219281196594]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 3.0, 4.0, 12.0, 12.0, 17.0, 21.0, 52.0, 78.0, 114.0, 215.0, 319.0, 633.0, 1216.0, 2441.0, 5559.0, 15243.0, 52736.0, 312309.0, 2355352.0, 1250542.0, 147460.0, 31583.0, 10148.0, 4193.0, 1863.0, 924.0, 486.0, 297.0, 148.0, 126.0, 65.0, 38.0, 28.0, 16.0, 11.0, 9.0, 8.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.09442138671875, -0.09204959869384766, -0.08967781066894531, -0.08730602264404297, -0.08493423461914062, -0.08256244659423828, -0.08019065856933594, -0.0778188705444336, -0.07544708251953125, -0.0730752944946289, -0.07070350646972656, -0.06833171844482422, -0.06595993041992188, -0.06358814239501953, -0.06121635437011719, -0.058844566345214844, -0.0564727783203125, -0.054100990295410156, -0.05172920227050781, -0.04935741424560547, -0.046985626220703125, -0.04461383819580078, -0.04224205017089844, -0.039870262145996094, -0.03749847412109375, -0.035126686096191406, -0.03275489807128906, -0.03038311004638672, -0.028011322021484375, -0.02563953399658203, -0.023267745971679688, -0.020895957946777344, -0.018524169921875, -0.016152381896972656, -0.013780593872070312, -0.011408805847167969, -0.009037017822265625, -0.006665229797363281, -0.0042934417724609375, -0.0019216537475585938, 0.00045013427734375, 0.0028219223022460938, 0.0051937103271484375, 0.007565498352050781, 0.009937286376953125, 0.012309074401855469, 0.014680862426757812, 0.017052650451660156, 0.0194244384765625, 0.021796226501464844, 0.024168014526367188, 0.02653980255126953, 0.028911590576171875, 0.03128337860107422, 0.03365516662597656, 0.036026954650878906, 0.03839874267578125, 0.040770530700683594, 0.04314231872558594, 0.04551410675048828, 0.047885894775390625, 0.05025768280029297, 0.05262947082519531, 0.055001258850097656, 0.057373046875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 2.0, 5.0, 4.0, 3.0, 8.0, 6.0, 7.0, 12.0, 12.0, 14.0, 27.0, 32.0, 26.0, 24.0, 33.0, 35.0, 34.0, 32.0, 34.0, 33.0, 51.0, 47.0, 49.0, 37.0, 44.0, 32.0, 39.0, 43.0, 34.0, 42.0, 24.0, 24.0, 27.0, 24.0, 22.0, 20.0, 14.0, 10.0, 8.0, 6.0, 7.0, 7.0, 4.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.042877197265625, -0.04151439666748047, -0.04015159606933594, -0.038788795471191406, -0.037425994873046875, -0.036063194274902344, -0.03470039367675781, -0.03333759307861328, -0.03197479248046875, -0.03061199188232422, -0.029249191284179688, -0.027886390686035156, -0.026523590087890625, -0.025160789489746094, -0.023797988891601562, -0.02243518829345703, -0.0210723876953125, -0.01970958709716797, -0.018346786499023438, -0.016983985900878906, -0.015621185302734375, -0.014258384704589844, -0.012895584106445312, -0.011532783508300781, -0.01016998291015625, -0.008807182312011719, -0.0074443817138671875, -0.006081581115722656, -0.004718780517578125, -0.0033559799194335938, -0.0019931793212890625, -0.0006303787231445312, 0.000732421875, 0.0020952224731445312, 0.0034580230712890625, 0.004820823669433594, 0.006183624267578125, 0.007546424865722656, 0.008909225463867188, 0.010272026062011719, 0.01163482666015625, 0.012997627258300781, 0.014360427856445312, 0.015723228454589844, 0.017086029052734375, 0.018448829650878906, 0.019811630249023438, 0.02117443084716797, 0.0225372314453125, 0.02390003204345703, 0.025262832641601562, 0.026625633239746094, 0.027988433837890625, 0.029351234436035156, 0.030714035034179688, 0.03207683563232422, 0.03343963623046875, 0.03480243682861328, 0.03616523742675781, 0.037528038024902344, 0.038890838623046875, 0.040253639221191406, 0.04161643981933594, 0.04297924041748047, 0.044342041015625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 7.0, 9.0, 33.0, 56.0, 58.0, 119.0, 221.0, 459.0, 1071.0, 3519.0, 15478.0, 148591.0, 3665702.0, 327376.0, 24454.0, 4782.0, 1329.0, 467.0, 239.0, 114.0, 63.0, 38.0, 33.0, 17.0, 12.0, 7.0, 10.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1949462890625, -0.18896865844726562, -0.18299102783203125, -0.17701339721679688, -0.1710357666015625, -0.16505813598632812, -0.15908050537109375, -0.15310287475585938, -0.147125244140625, -0.14114761352539062, -0.13516998291015625, -0.12919235229492188, -0.1232147216796875, -0.11723709106445312, -0.11125946044921875, -0.10528182983398438, -0.09930419921875, -0.09332656860351562, -0.08734893798828125, -0.08137130737304688, -0.0753936767578125, -0.06941604614257812, -0.06343841552734375, -0.057460784912109375, -0.051483154296875, -0.045505523681640625, -0.03952789306640625, -0.033550262451171875, -0.0275726318359375, -0.021595001220703125, -0.01561737060546875, -0.009639739990234375, -0.003662109375, 0.002315521240234375, 0.00829315185546875, 0.014270782470703125, 0.0202484130859375, 0.026226043701171875, 0.03220367431640625, 0.038181304931640625, 0.044158935546875, 0.050136566162109375, 0.05611419677734375, 0.062091827392578125, 0.0680694580078125, 0.07404708862304688, 0.08002471923828125, 0.08600234985351562, 0.09197998046875, 0.09795761108398438, 0.10393524169921875, 0.10991287231445312, 0.1158905029296875, 0.12186813354492188, 0.12784576416015625, 0.13382339477539062, 0.139801025390625, 0.14577865600585938, 0.15175628662109375, 0.15773391723632812, 0.1637115478515625, 0.16968917846679688, 0.17566680908203125, 0.18164443969726562, 0.1876220703125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 1.0, 2.0, 3.0, 4.0, 4.0, 10.0, 9.0, 15.0, 12.0, 19.0, 23.0, 35.0, 57.0, 96.0, 113.0, 194.0, 294.0, 423.0, 613.0, 699.0, 465.0, 322.0, 185.0, 137.0, 104.0, 51.0, 41.0, 30.0, 32.0, 15.0, 13.0, 9.0, 11.0, 10.0, 4.0, 2.0, 4.0, 4.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.119140625, -0.11554431915283203, -0.11194801330566406, -0.1083517074584961, -0.10475540161132812, -0.10115909576416016, -0.09756278991699219, -0.09396648406982422, -0.09037017822265625, -0.08677387237548828, -0.08317756652832031, -0.07958126068115234, -0.07598495483398438, -0.0723886489868164, -0.06879234313964844, -0.06519603729248047, -0.0615997314453125, -0.05800342559814453, -0.05440711975097656, -0.050810813903808594, -0.047214508056640625, -0.043618202209472656, -0.04002189636230469, -0.03642559051513672, -0.03282928466796875, -0.02923297882080078, -0.025636672973632812, -0.022040367126464844, -0.018444061279296875, -0.014847755432128906, -0.011251449584960938, -0.007655143737792969, -0.004058837890625, -0.00046253204345703125, 0.0031337738037109375, 0.006730079650878906, 0.010326385498046875, 0.013922691345214844, 0.017518997192382812, 0.02111530303955078, 0.02471160888671875, 0.02830791473388672, 0.03190422058105469, 0.035500526428222656, 0.039096832275390625, 0.042693138122558594, 0.04628944396972656, 0.04988574981689453, 0.0534820556640625, 0.05707836151123047, 0.06067466735839844, 0.0642709732055664, 0.06786727905273438, 0.07146358489990234, 0.07505989074707031, 0.07865619659423828, 0.08225250244140625, 0.08584880828857422, 0.08944511413574219, 0.09304141998291016, 0.09663772583007812, 0.1002340316772461, 0.10383033752441406, 0.10742664337158203, 0.11102294921875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 6.0, 7.0, 9.0, 31.0, 58.0, 177.0, 243.0, 213.0, 143.0, 63.0, 25.0, 13.0, 6.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.8412970304489136, -1.7834926843643188, -1.7256882190704346, -1.6678838729858398, -1.6100794076919556, -1.5522750616073608, -1.4944705963134766, -1.4366662502288818, -1.378861904144287, -1.3210575580596924, -1.263253092765808, -1.2054487466812134, -1.147644281387329, -1.0898399353027344, -1.0320355892181396, -0.9742311239242554, -0.9164266586303711, -0.8586222529411316, -0.8008178472518921, -0.7430135011672974, -0.6852090358734131, -0.6274046897888184, -0.5696002840995789, -0.5117958784103394, -0.45399147272109985, -0.39618706703186035, -0.33838266134262085, -0.28057828545570374, -0.22277387976646423, -0.16496947407722473, -0.10716509819030762, -0.049360692501068115, 0.008443832397460938, 0.06624823063611984, 0.12405262887477875, 0.18185701966285706, 0.23966142535209656, 0.29746583104133606, 0.3552702069282532, 0.4130746126174927, 0.4708790183067322, 0.5286834239959717, 0.5864878296852112, 0.6442922353744507, 0.7020965814590454, 0.7599010467529297, 0.8177053928375244, 0.8755097985267639, 0.9333142042160034, 0.9911186099052429, 1.0489230155944824, 1.1067273616790771, 1.1645318269729614, 1.2223361730575562, 1.2801406383514404, 1.3379449844360352, 1.3957493305206299, 1.4535536766052246, 1.5113581418991089, 1.5691624879837036, 1.626966953277588, 1.6847712993621826, 1.7425756454467773, 1.8003801107406616, 1.858184576034546]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 5.0, 9.0, 14.0, 15.0, 20.0, 25.0, 30.0, 29.0, 52.0, 54.0, 58.0, 79.0, 65.0, 68.0, 65.0, 72.0, 64.0, 45.0, 50.0, 41.0, 29.0, 21.0, 14.0, 21.0, 15.0, 10.0, 4.0, 9.0, 7.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7511221766471863, -0.7279333472251892, -0.7047445178031921, -0.6815556883811951, -0.6583667993545532, -0.6351779699325562, -0.6119891405105591, -0.588800311088562, -0.5656114816665649, -0.5424226522445679, -0.5192338228225708, -0.49604496359825134, -0.4728561341762543, -0.4496673047542572, -0.42647844552993774, -0.4032896161079407, -0.3801007866859436, -0.35691195726394653, -0.33372312784194946, -0.31053426861763, -0.28734543919563293, -0.26415660977363586, -0.2409677654504776, -0.21777892112731934, -0.19459009170532227, -0.1714012622833252, -0.14821241796016693, -0.12502357363700867, -0.1018347442150116, -0.07864590734243393, -0.05545707046985626, -0.032268226146698, -0.009079396724700928, 0.01410944014787674, 0.03729827702045441, 0.060487113893032074, 0.08367595076560974, 0.10686478763818741, 0.13005362451076508, 0.15324246883392334, 0.1764312982559204, 0.19962012767791748, 0.22280897200107574, 0.245997816324234, 0.2691866457462311, 0.29237547516822815, 0.3155643343925476, 0.3387531638145447, 0.36194199323654175, 0.3851308226585388, 0.4083196520805359, 0.43150851130485535, 0.4546973407268524, 0.4778861701488495, 0.501075029373169, 0.524263858795166, 0.5474526882171631, 0.5706415176391602, 0.5938303470611572, 0.6170191764831543, 0.6402080059051514, 0.6633968949317932, 0.6865857243537903, 0.7097745537757874, 0.7329633831977844]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 8.0, 24.0, 29.0, 33.0, 56.0, 86.0, 138.0, 230.0, 387.0, 616.0, 1052.0, 1854.0, 3494.0, 7425.0, 16826.0, 43524.0, 125211.0, 319162.0, 322948.0, 128447.0, 44311.0, 17085.0, 7415.0, 3525.0, 1920.0, 1101.0, 654.0, 374.0, 218.0, 136.0, 99.0, 56.0, 33.0, 29.0, 19.0, 6.0, 13.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06781005859375, -0.06547260284423828, -0.06313514709472656, -0.060797691345214844, -0.058460235595703125, -0.056122779846191406, -0.05378532409667969, -0.05144786834716797, -0.04911041259765625, -0.04677295684814453, -0.04443550109863281, -0.042098045349121094, -0.039760589599609375, -0.037423133850097656, -0.03508567810058594, -0.03274822235107422, -0.0304107666015625, -0.02807331085205078, -0.025735855102539062, -0.023398399353027344, -0.021060943603515625, -0.018723487854003906, -0.016386032104492188, -0.014048576354980469, -0.01171112060546875, -0.009373664855957031, -0.0070362091064453125, -0.004698753356933594, -0.002361297607421875, -2.384185791015625e-05, 0.0023136138916015625, 0.004651069641113281, 0.006988525390625, 0.009325981140136719, 0.011663436889648438, 0.014000892639160156, 0.016338348388671875, 0.018675804138183594, 0.021013259887695312, 0.02335071563720703, 0.02568817138671875, 0.02802562713623047, 0.030363082885742188, 0.032700538635253906, 0.035037994384765625, 0.037375450134277344, 0.03971290588378906, 0.04205036163330078, 0.0443878173828125, 0.04672527313232422, 0.04906272888183594, 0.051400184631347656, 0.053737640380859375, 0.056075096130371094, 0.05841255187988281, 0.06075000762939453, 0.06308746337890625, 0.06542491912841797, 0.06776237487792969, 0.0700998306274414, 0.07243728637695312, 0.07477474212646484, 0.07711219787597656, 0.07944965362548828, 0.081787109375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 8.0, 5.0, 5.0, 10.0, 7.0, 13.0, 17.0, 18.0, 18.0, 18.0, 24.0, 29.0, 39.0, 35.0, 28.0, 40.0, 47.0, 34.0, 42.0, 46.0, 44.0, 37.0, 42.0, 39.0, 35.0, 25.0, 33.0, 22.0, 37.0, 27.0, 32.0, 16.0, 22.0, 18.0, 14.0, 20.0, 7.0, 10.0, 10.0, 2.0, 3.0, 4.0, 5.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04022216796875, -0.03884601593017578, -0.03746986389160156, -0.036093711853027344, -0.034717559814453125, -0.033341407775878906, -0.03196525573730469, -0.03058910369873047, -0.02921295166015625, -0.02783679962158203, -0.026460647583007812, -0.025084495544433594, -0.023708343505859375, -0.022332191467285156, -0.020956039428710938, -0.01957988739013672, -0.0182037353515625, -0.01682758331298828, -0.015451431274414062, -0.014075279235839844, -0.012699127197265625, -0.011322975158691406, -0.009946823120117188, -0.008570671081542969, -0.00719451904296875, -0.005818367004394531, -0.0044422149658203125, -0.0030660629272460938, -0.001689910888671875, -0.00031375885009765625, 0.0010623931884765625, 0.0024385452270507812, 0.003814697265625, 0.005190849304199219, 0.0065670013427734375, 0.007943153381347656, 0.009319305419921875, 0.010695457458496094, 0.012071609497070312, 0.013447761535644531, 0.01482391357421875, 0.01620006561279297, 0.017576217651367188, 0.018952369689941406, 0.020328521728515625, 0.021704673767089844, 0.023080825805664062, 0.02445697784423828, 0.0258331298828125, 0.02720928192138672, 0.028585433959960938, 0.029961585998535156, 0.031337738037109375, 0.032713890075683594, 0.03409004211425781, 0.03546619415283203, 0.03684234619140625, 0.03821849822998047, 0.03959465026855469, 0.040970802307128906, 0.042346954345703125, 0.043723106384277344, 0.04509925842285156, 0.04647541046142578, 0.0478515625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 7.0, 6.0, 5.0, 12.0, 11.0, 12.0, 17.0, 30.0, 35.0, 53.0, 100.0, 201.0, 341.0, 704.0, 1706.0, 5120.0, 22546.0, 163258.0, 718263.0, 112431.0, 16744.0, 4139.0, 1453.0, 590.0, 314.0, 149.0, 100.0, 77.0, 40.0, 31.0, 18.0, 9.0, 9.0, 9.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.160888671875, -0.15634536743164062, -0.15180206298828125, -0.14725875854492188, -0.1427154541015625, -0.13817214965820312, -0.13362884521484375, -0.12908554077148438, -0.124542236328125, -0.11999893188476562, -0.11545562744140625, -0.11091232299804688, -0.1063690185546875, -0.10182571411132812, -0.09728240966796875, -0.09273910522460938, -0.08819580078125, -0.08365249633789062, -0.07910919189453125, -0.07456588745117188, -0.0700225830078125, -0.06547927856445312, -0.06093597412109375, -0.056392669677734375, -0.051849365234375, -0.047306060791015625, -0.04276275634765625, -0.038219451904296875, -0.0336761474609375, -0.029132843017578125, -0.02458953857421875, -0.020046234130859375, -0.0155029296875, -0.010959625244140625, -0.00641632080078125, -0.001873016357421875, 0.0026702880859375, 0.007213592529296875, 0.01175689697265625, 0.016300201416015625, 0.020843505859375, 0.025386810302734375, 0.02993011474609375, 0.034473419189453125, 0.0390167236328125, 0.043560028076171875, 0.04810333251953125, 0.052646636962890625, 0.05718994140625, 0.061733245849609375, 0.06627655029296875, 0.07081985473632812, 0.0753631591796875, 0.07990646362304688, 0.08444976806640625, 0.08899307250976562, 0.093536376953125, 0.09807968139648438, 0.10262298583984375, 0.10716629028320312, 0.1117095947265625, 0.11625289916992188, 0.12079620361328125, 0.12533950805664062, 0.1298828125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 4.0, 9.0, 9.0, 13.0, 14.0, 30.0, 19.0, 29.0, 32.0, 35.0, 33.0, 41.0, 34.0, 60.0, 48.0, 34.0, 42.0, 47.0, 55.0, 51.0, 37.0, 52.0, 40.0, 24.0, 40.0, 32.0, 22.0, 22.0, 13.0, 19.0, 7.0, 6.0, 11.0, 10.0, 5.0, 7.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.185546875, -0.17974853515625, -0.1739501953125, -0.16815185546875, -0.162353515625, -0.15655517578125, -0.1507568359375, -0.14495849609375, -0.13916015625, -0.13336181640625, -0.1275634765625, -0.12176513671875, -0.115966796875, -0.11016845703125, -0.1043701171875, -0.09857177734375, -0.0927734375, -0.08697509765625, -0.0811767578125, -0.07537841796875, -0.069580078125, -0.06378173828125, -0.0579833984375, -0.05218505859375, -0.04638671875, -0.04058837890625, -0.0347900390625, -0.02899169921875, -0.023193359375, -0.01739501953125, -0.0115966796875, -0.00579833984375, 0.0, 0.00579833984375, 0.0115966796875, 0.01739501953125, 0.023193359375, 0.02899169921875, 0.0347900390625, 0.04058837890625, 0.04638671875, 0.05218505859375, 0.0579833984375, 0.06378173828125, 0.069580078125, 0.07537841796875, 0.0811767578125, 0.08697509765625, 0.0927734375, 0.09857177734375, 0.1043701171875, 0.11016845703125, 0.115966796875, 0.12176513671875, 0.1275634765625, 0.13336181640625, 0.13916015625, 0.14495849609375, 0.1507568359375, 0.15655517578125, 0.162353515625, 0.16815185546875, 0.1739501953125, 0.17974853515625, 0.185546875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 2.0, 14.0, 20.0, 25.0, 38.0, 45.0, 68.0, 108.0, 189.0, 334.0, 722.0, 1618.0, 4775.0, 17801.0, 103342.0, 726763.0, 158586.0, 24195.0, 6098.0, 2046.0, 852.0, 381.0, 213.0, 111.0, 68.0, 54.0, 27.0, 21.0, 12.0, 6.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06341552734375, -0.06119823455810547, -0.05898094177246094, -0.056763648986816406, -0.054546356201171875, -0.052329063415527344, -0.05011177062988281, -0.04789447784423828, -0.04567718505859375, -0.04345989227294922, -0.04124259948730469, -0.039025306701660156, -0.036808013916015625, -0.034590721130371094, -0.03237342834472656, -0.03015613555908203, -0.0279388427734375, -0.02572154998779297, -0.023504257202148438, -0.021286964416503906, -0.019069671630859375, -0.016852378845214844, -0.014635086059570312, -0.012417793273925781, -0.01020050048828125, -0.007983207702636719, -0.0057659149169921875, -0.0035486221313476562, -0.001331329345703125, 0.0008859634399414062, 0.0031032562255859375, 0.005320549011230469, 0.007537841796875, 0.009755134582519531, 0.011972427368164062, 0.014189720153808594, 0.016407012939453125, 0.018624305725097656, 0.020841598510742188, 0.02305889129638672, 0.02527618408203125, 0.02749347686767578, 0.029710769653320312, 0.031928062438964844, 0.034145355224609375, 0.036362648010253906, 0.03857994079589844, 0.04079723358154297, 0.0430145263671875, 0.04523181915283203, 0.04744911193847656, 0.049666404724121094, 0.051883697509765625, 0.054100990295410156, 0.05631828308105469, 0.05853557586669922, 0.06075286865234375, 0.06297016143798828, 0.06518745422363281, 0.06740474700927734, 0.06962203979492188, 0.0718393325805664, 0.07405662536621094, 0.07627391815185547, 0.0784912109375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 3.0, 7.0, 13.0, 16.0, 16.0, 35.0, 40.0, 46.0, 64.0, 67.0, 96.0, 86.0, 107.0, 74.0, 87.0, 50.0, 43.0, 38.0, 35.0, 14.0, 16.0, 11.0, 7.0, 13.0, 4.0, 2.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3589859008789062e-05, -1.290440559387207e-05, -1.2218952178955078e-05, -1.1533498764038086e-05, -1.0848045349121094e-05, -1.0162591934204102e-05, -9.47713851928711e-06, -8.791685104370117e-06, -8.106231689453125e-06, -7.420778274536133e-06, -6.735324859619141e-06, -6.0498714447021484e-06, -5.364418029785156e-06, -4.678964614868164e-06, -3.993511199951172e-06, -3.3080577850341797e-06, -2.6226043701171875e-06, -1.9371509552001953e-06, -1.2516975402832031e-06, -5.662441253662109e-07, 1.1920928955078125e-07, 8.046627044677734e-07, 1.4901161193847656e-06, 2.175569534301758e-06, 2.86102294921875e-06, 3.546476364135742e-06, 4.231929779052734e-06, 4.9173831939697266e-06, 5.602836608886719e-06, 6.288290023803711e-06, 6.973743438720703e-06, 7.659196853637695e-06, 8.344650268554688e-06, 9.03010368347168e-06, 9.715557098388672e-06, 1.0401010513305664e-05, 1.1086463928222656e-05, 1.1771917343139648e-05, 1.245737075805664e-05, 1.3142824172973633e-05, 1.3828277587890625e-05, 1.4513731002807617e-05, 1.519918441772461e-05, 1.58846378326416e-05, 1.6570091247558594e-05, 1.7255544662475586e-05, 1.7940998077392578e-05, 1.862645149230957e-05, 1.9311904907226562e-05, 1.9997358322143555e-05, 2.0682811737060547e-05, 2.136826515197754e-05, 2.205371856689453e-05, 2.2739171981811523e-05, 2.3424625396728516e-05, 2.4110078811645508e-05, 2.47955322265625e-05, 2.5480985641479492e-05, 2.6166439056396484e-05, 2.6851892471313477e-05, 2.753734588623047e-05, 2.822279930114746e-05, 2.8908252716064453e-05, 2.9593706130981445e-05, 3.0279159545898438e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 9.0, 8.0, 6.0, 14.0, 14.0, 31.0, 47.0, 83.0, 181.0, 391.0, 946.0, 2824.0, 11516.0, 78043.0, 772579.0, 157426.0, 18114.0, 4105.0, 1251.0, 489.0, 219.0, 114.0, 53.0, 31.0, 19.0, 13.0, 7.0, 7.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06292724609375, -0.060265541076660156, -0.05760383605957031, -0.05494213104248047, -0.052280426025390625, -0.04961872100830078, -0.04695701599121094, -0.044295310974121094, -0.04163360595703125, -0.038971900939941406, -0.03631019592285156, -0.03364849090576172, -0.030986785888671875, -0.02832508087158203, -0.025663375854492188, -0.023001670837402344, -0.0203399658203125, -0.017678260803222656, -0.015016555786132812, -0.012354850769042969, -0.009693145751953125, -0.007031440734863281, -0.0043697357177734375, -0.0017080307006835938, 0.00095367431640625, 0.0036153793334960938, 0.0062770843505859375, 0.008938789367675781, 0.011600494384765625, 0.014262199401855469, 0.016923904418945312, 0.019585609436035156, 0.022247314453125, 0.024909019470214844, 0.027570724487304688, 0.03023242950439453, 0.032894134521484375, 0.03555583953857422, 0.03821754455566406, 0.040879249572753906, 0.04354095458984375, 0.046202659606933594, 0.04886436462402344, 0.05152606964111328, 0.054187774658203125, 0.05684947967529297, 0.05951118469238281, 0.062172889709472656, 0.0648345947265625, 0.06749629974365234, 0.07015800476074219, 0.07281970977783203, 0.07548141479492188, 0.07814311981201172, 0.08080482482910156, 0.0834665298461914, 0.08612823486328125, 0.0887899398803711, 0.09145164489746094, 0.09411334991455078, 0.09677505493164062, 0.09943675994873047, 0.10209846496582031, 0.10476016998291016, 0.107421875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 6.0, 2.0, 2.0, 10.0, 9.0, 21.0, 27.0, 31.0, 42.0, 56.0, 65.0, 69.0, 88.0, 104.0, 91.0, 75.0, 76.0, 55.0, 53.0, 32.0, 24.0, 19.0, 8.0, 10.0, 8.0, 6.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.07061767578125, -0.0686197280883789, -0.06662178039550781, -0.06462383270263672, -0.06262588500976562, -0.06062793731689453, -0.05862998962402344, -0.056632041931152344, -0.05463409423828125, -0.052636146545410156, -0.05063819885253906, -0.04864025115966797, -0.046642303466796875, -0.04464435577392578, -0.04264640808105469, -0.040648460388183594, -0.0386505126953125, -0.036652565002441406, -0.03465461730957031, -0.03265666961669922, -0.030658721923828125, -0.02866077423095703, -0.026662826538085938, -0.024664878845214844, -0.02266693115234375, -0.020668983459472656, -0.018671035766601562, -0.01667308807373047, -0.014675140380859375, -0.012677192687988281, -0.010679244995117188, -0.008681297302246094, -0.006683349609375, -0.004685401916503906, -0.0026874542236328125, -0.0006895065307617188, 0.001308441162109375, 0.0033063888549804688, 0.0053043365478515625, 0.007302284240722656, 0.00930023193359375, 0.011298179626464844, 0.013296127319335938, 0.015294075012207031, 0.017292022705078125, 0.01928997039794922, 0.021287918090820312, 0.023285865783691406, 0.0252838134765625, 0.027281761169433594, 0.029279708862304688, 0.03127765655517578, 0.033275604248046875, 0.03527355194091797, 0.03727149963378906, 0.039269447326660156, 0.04126739501953125, 0.043265342712402344, 0.04526329040527344, 0.04726123809814453, 0.049259185791015625, 0.05125713348388672, 0.05325508117675781, 0.055253028869628906, 0.0572509765625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 8.0, 17.0, 32.0, 121.0, 363.0, 297.0, 108.0, 36.0, 12.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.206325054168701, -2.137188673019409, -2.0680525302886963, -1.9989162683486938, -1.9297800064086914, -1.8606436252593994, -1.791507363319397, -1.7223711013793945, -1.653234839439392, -1.5840985774993896, -1.5149623155593872, -1.4458260536193848, -1.3766896724700928, -1.3075535297393799, -1.238417148590088, -1.1692808866500854, -1.100144624710083, -1.0310083627700806, -0.9618721008300781, -0.8927357792854309, -0.8235995173454285, -0.754463255405426, -0.6853269338607788, -0.6161906719207764, -0.5470544099807739, -0.4779181480407715, -0.40878185629844666, -0.3396455645561218, -0.2705093026161194, -0.20137304067611694, -0.13223674893379211, -0.06310045719146729, 0.006036043167114258, 0.0751723200082779, 0.14430859684944153, 0.21344487369060516, 0.2825811505317688, 0.35171741247177124, 0.42085370421409607, 0.4899899959564209, 0.5591262578964233, 0.6282625198364258, 0.6973987817764282, 0.7665351033210754, 0.8356713652610779, 0.9048076272010803, 0.9739439487457275, 1.04308021068573, 1.1122164726257324, 1.1813527345657349, 1.2504889965057373, 1.3196252584457397, 1.3887615203857422, 1.4578979015350342, 1.5270341634750366, 1.596170425415039, 1.6653066873550415, 1.734442949295044, 1.8035792112350464, 1.8727154731750488, 1.9418518543243408, 2.0109879970550537, 2.0801243782043457, 2.1492605209350586, 2.2183969020843506]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 0.0, 3.0, 4.0, 3.0, 6.0, 4.0, 9.0, 7.0, 5.0, 10.0, 11.0, 8.0, 13.0, 15.0, 14.0, 21.0, 22.0, 24.0, 28.0, 32.0, 37.0, 43.0, 48.0, 76.0, 61.0, 65.0, 57.0, 59.0, 43.0, 35.0, 21.0, 36.0, 31.0, 26.0, 24.0, 10.0, 19.0, 20.0, 9.0, 11.0, 9.0, 5.0, 6.0, 6.0, 9.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6456982493400574, -0.623222827911377, -0.6007474660873413, -0.5782720446586609, -0.5557966232299805, -0.5333212018013, -0.5108457803726196, -0.488370418548584, -0.46589499711990356, -0.44341957569122314, -0.4209441840648651, -0.3984687924385071, -0.37599337100982666, -0.35351794958114624, -0.3310425579547882, -0.3085671663284302, -0.28609174489974976, -0.26361632347106934, -0.2411409318447113, -0.21866552531719208, -0.19619011878967285, -0.17371471226215363, -0.1512393057346344, -0.12876389920711517, -0.10628849267959595, -0.08381308615207672, -0.061337679624557495, -0.03886227309703827, -0.016386866569519043, 0.006088539958000183, 0.02856394648551941, 0.051039353013038635, 0.07351481914520264, 0.09599022567272186, 0.11846563220024109, 0.14094103872776031, 0.16341644525527954, 0.18589185178279877, 0.208367258310318, 0.23084266483783722, 0.25331807136535645, 0.27579349279403687, 0.2982688844203949, 0.32074427604675293, 0.34321969747543335, 0.36569511890411377, 0.3881705105304718, 0.41064590215682983, 0.43312132358551025, 0.4555967450141907, 0.4780721366405487, 0.5005475282669067, 0.5230229496955872, 0.5454983711242676, 0.5679737329483032, 0.5904491543769836, 0.6129245758056641, 0.6353999972343445, 0.6578754186630249, 0.6803507804870605, 0.702826201915741, 0.7253016233444214, 0.747776985168457, 0.7702524065971375, 0.7927278280258179]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 2.0, 3.0, 8.0, 7.0, 16.0, 17.0, 22.0, 39.0, 37.0, 81.0, 127.0, 177.0, 285.0, 460.0, 737.0, 1248.0, 2275.0, 4059.0, 7655.0, 16602.0, 45034.0, 173660.0, 982675.0, 2231021.0, 559787.0, 109053.0, 32024.0, 12876.0, 6157.0, 3267.0, 1924.0, 1107.0, 647.0, 411.0, 263.0, 173.0, 115.0, 75.0, 45.0, 40.0, 31.0, 22.0, 9.0, 9.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.051666259765625, -0.049776554107666016, -0.04788684844970703, -0.04599714279174805, -0.04410743713378906, -0.04221773147583008, -0.040328025817871094, -0.03843832015991211, -0.036548614501953125, -0.03465890884399414, -0.032769203186035156, -0.030879497528076172, -0.028989791870117188, -0.027100086212158203, -0.02521038055419922, -0.023320674896240234, -0.02143096923828125, -0.019541263580322266, -0.01765155792236328, -0.015761852264404297, -0.013872146606445312, -0.011982440948486328, -0.010092735290527344, -0.00820302963256836, -0.006313323974609375, -0.004423618316650391, -0.0025339126586914062, -0.0006442070007324219, 0.0012454986572265625, 0.003135204315185547, 0.005024909973144531, 0.006914615631103516, 0.0088043212890625, 0.010694026947021484, 0.012583732604980469, 0.014473438262939453, 0.016363143920898438, 0.018252849578857422, 0.020142555236816406, 0.02203226089477539, 0.023921966552734375, 0.02581167221069336, 0.027701377868652344, 0.029591083526611328, 0.03148078918457031, 0.0333704948425293, 0.03526020050048828, 0.037149906158447266, 0.03903961181640625, 0.040929317474365234, 0.04281902313232422, 0.0447087287902832, 0.04659843444824219, 0.04848814010620117, 0.050377845764160156, 0.05226755142211914, 0.054157257080078125, 0.05604696273803711, 0.057936668395996094, 0.05982637405395508, 0.06171607971191406, 0.06360578536987305, 0.06549549102783203, 0.06738519668579102, 0.06927490234375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 7.0, 7.0, 4.0, 6.0, 6.0, 8.0, 9.0, 12.0, 23.0, 18.0, 22.0, 20.0, 36.0, 51.0, 37.0, 44.0, 42.0, 37.0, 56.0, 58.0, 54.0, 45.0, 54.0, 34.0, 45.0, 50.0, 34.0, 33.0, 36.0, 17.0, 21.0, 17.0, 23.0, 12.0, 4.0, 7.0, 9.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.055450439453125, -0.053768157958984375, -0.05208587646484375, -0.050403594970703125, -0.0487213134765625, -0.047039031982421875, -0.04535675048828125, -0.043674468994140625, -0.0419921875, -0.040309906005859375, -0.03862762451171875, -0.036945343017578125, -0.0352630615234375, -0.033580780029296875, -0.03189849853515625, -0.030216217041015625, -0.028533935546875, -0.026851654052734375, -0.02516937255859375, -0.023487091064453125, -0.0218048095703125, -0.020122528076171875, -0.01844024658203125, -0.016757965087890625, -0.01507568359375, -0.013393402099609375, -0.01171112060546875, -0.010028839111328125, -0.0083465576171875, -0.006664276123046875, -0.00498199462890625, -0.003299713134765625, -0.001617431640625, 6.4849853515625e-05, 0.00174713134765625, 0.003429412841796875, 0.0051116943359375, 0.006793975830078125, 0.00847625732421875, 0.010158538818359375, 0.0118408203125, 0.013523101806640625, 0.01520538330078125, 0.016887664794921875, 0.0185699462890625, 0.020252227783203125, 0.02193450927734375, 0.023616790771484375, 0.025299072265625, 0.026981353759765625, 0.02866363525390625, 0.030345916748046875, 0.0320281982421875, 0.033710479736328125, 0.03539276123046875, 0.037075042724609375, 0.03875732421875, 0.040439605712890625, 0.04212188720703125, 0.043804168701171875, 0.0454864501953125, 0.047168731689453125, 0.04885101318359375, 0.050533294677734375, 0.052215576171875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 3.0, 9.0, 9.0, 16.0, 30.0, 36.0, 72.0, 94.0, 181.0, 536.0, 1914.0, 9065.0, 88956.0, 3719728.0, 350134.0, 18727.0, 3254.0, 843.0, 312.0, 128.0, 64.0, 47.0, 24.0, 25.0, 17.0, 13.0, 9.0, 8.0, 5.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1859130859375, -0.1791973114013672, -0.17248153686523438, -0.16576576232910156, -0.15904998779296875, -0.15233421325683594, -0.14561843872070312, -0.1389026641845703, -0.1321868896484375, -0.1254711151123047, -0.11875534057617188, -0.11203956604003906, -0.10532379150390625, -0.09860801696777344, -0.09189224243164062, -0.08517646789550781, -0.078460693359375, -0.07174491882324219, -0.06502914428710938, -0.05831336975097656, -0.05159759521484375, -0.04488182067871094, -0.038166046142578125, -0.03145027160644531, -0.0247344970703125, -0.018018722534179688, -0.011302947998046875, -0.0045871734619140625, 0.00212860107421875, 0.008844375610351562, 0.015560150146484375, 0.022275924682617188, 0.02899169921875, 0.03570747375488281, 0.042423248291015625, 0.04913902282714844, 0.05585479736328125, 0.06257057189941406, 0.06928634643554688, 0.07600212097167969, 0.0827178955078125, 0.08943367004394531, 0.09614944458007812, 0.10286521911621094, 0.10958099365234375, 0.11629676818847656, 0.12301254272460938, 0.1297283172607422, 0.136444091796875, 0.1431598663330078, 0.14987564086914062, 0.15659141540527344, 0.16330718994140625, 0.17002296447753906, 0.17673873901367188, 0.1834545135498047, 0.1901702880859375, 0.1968860626220703, 0.20360183715820312, 0.21031761169433594, 0.21703338623046875, 0.22374916076660156, 0.23046493530273438, 0.2371807098388672, 0.243896484375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 7.0, 5.0, 7.0, 5.0, 11.0, 15.0, 15.0, 22.0, 37.0, 47.0, 53.0, 98.0, 148.0, 266.0, 376.0, 618.0, 664.0, 621.0, 369.0, 230.0, 125.0, 105.0, 59.0, 48.0, 27.0, 23.0, 14.0, 10.0, 16.0, 5.0, 6.0, 4.0, 3.0, 6.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10040283203125, -0.09674739837646484, -0.09309196472167969, -0.08943653106689453, -0.08578109741210938, -0.08212566375732422, -0.07847023010253906, -0.0748147964477539, -0.07115936279296875, -0.0675039291381836, -0.06384849548339844, -0.06019306182861328, -0.056537628173828125, -0.05288219451904297, -0.04922676086425781, -0.045571327209472656, -0.0419158935546875, -0.038260459899902344, -0.03460502624511719, -0.03094959259033203, -0.027294158935546875, -0.02363872528076172, -0.019983291625976562, -0.016327857971191406, -0.01267242431640625, -0.009016990661621094, -0.0053615570068359375, -0.0017061233520507812, 0.001949310302734375, 0.005604743957519531, 0.009260177612304688, 0.012915611267089844, 0.016571044921875, 0.020226478576660156, 0.023881912231445312, 0.02753734588623047, 0.031192779541015625, 0.03484821319580078, 0.03850364685058594, 0.042159080505371094, 0.04581451416015625, 0.049469947814941406, 0.05312538146972656, 0.05678081512451172, 0.060436248779296875, 0.06409168243408203, 0.06774711608886719, 0.07140254974365234, 0.0750579833984375, 0.07871341705322266, 0.08236885070800781, 0.08602428436279297, 0.08967971801757812, 0.09333515167236328, 0.09699058532714844, 0.1006460189819336, 0.10430145263671875, 0.1079568862915039, 0.11161231994628906, 0.11526775360107422, 0.11892318725585938, 0.12257862091064453, 0.1262340545654297, 0.12988948822021484, 0.133544921875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 9.0, 10.0, 30.0, 56.0, 112.0, 174.0, 234.0, 171.0, 92.0, 68.0, 18.0, 11.0, 7.0, 5.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0755388736724854, -1.0312937498092651, -0.9870485663414001, -0.9428034424781799, -0.8985582590103149, -0.8543131351470947, -0.8100680112838745, -0.7658228278160095, -0.7215776443481445, -0.6773325204849243, -0.6330873370170593, -0.5888422131538391, -0.5445970296859741, -0.5003519058227539, -0.4561067521572113, -0.4118615984916687, -0.3676164746284485, -0.3233713209629059, -0.2791261672973633, -0.23488102853298187, -0.19063587486743927, -0.14639072120189667, -0.10214558243751526, -0.057900428771972656, -0.013655275106430054, 0.03058987483382225, 0.07483502477407455, 0.11908017098903656, 0.16332532465457916, 0.20757047832012177, 0.2518156170845032, 0.2960607707500458, 0.3403059244155884, 0.384551078081131, 0.4287962317466736, 0.4730413556098938, 0.5172865390777588, 0.561531662940979, 0.6057767868041992, 0.6500219702720642, 0.6942671537399292, 0.7385122776031494, 0.7827574610710144, 0.8270025849342346, 0.8712477684020996, 0.9154928922653198, 0.95973801612854, 1.0039832592010498, 1.0482282638549805, 1.0924733877182007, 1.136718511581421, 1.1809637546539307, 1.2252088785171509, 1.269454002380371, 1.3136991262435913, 1.3579442501068115, 1.4021894931793213, 1.4464346170425415, 1.4906797409057617, 1.5349249839782715, 1.5791701078414917, 1.623415231704712, 1.6676603555679321, 1.7119054794311523, 1.756150722503662]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 7.0, 8.0, 9.0, 10.0, 10.0, 14.0, 13.0, 21.0, 15.0, 18.0, 29.0, 29.0, 33.0, 41.0, 52.0, 50.0, 51.0, 45.0, 47.0, 52.0, 55.0, 61.0, 38.0, 39.0, 35.0, 40.0, 28.0, 17.0, 25.0, 15.0, 11.0, 15.0, 15.0, 17.0, 17.0, 2.0, 3.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.5719928741455078, -0.5546301603317261, -0.5372673869132996, -0.519904613494873, -0.5025418996810913, -0.4851791560649872, -0.46781641244888306, -0.45045366883277893, -0.4330909252166748, -0.4157281816005707, -0.39836543798446655, -0.3810026943683624, -0.3636399507522583, -0.3462772071361542, -0.32891446352005005, -0.3115517199039459, -0.2941889762878418, -0.27682623267173767, -0.25946348905563354, -0.24210074543952942, -0.2247380018234253, -0.20737525820732117, -0.19001251459121704, -0.17264977097511292, -0.1552870273590088, -0.13792428374290466, -0.12056154012680054, -0.10319879651069641, -0.08583605289459229, -0.06847330927848816, -0.05111056566238403, -0.03374782204627991, -0.016385138034820557, 0.0009776055812835693, 0.018340349197387695, 0.03570309281349182, 0.05306583642959595, 0.07042858004570007, 0.0877913236618042, 0.10515406727790833, 0.12251681089401245, 0.13987955451011658, 0.1572422981262207, 0.17460504174232483, 0.19196778535842896, 0.20933052897453308, 0.2266932725906372, 0.24405601620674133, 0.26141875982284546, 0.2787815034389496, 0.2961442470550537, 0.31350699067115784, 0.33086973428726196, 0.3482324779033661, 0.3655952215194702, 0.38295796513557434, 0.40032070875167847, 0.4176834523677826, 0.4350461959838867, 0.45240893959999084, 0.46977168321609497, 0.4871344268321991, 0.5044971704483032, 0.521859884262085, 0.5392226576805115]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 15.0, 8.0, 17.0, 32.0, 37.0, 43.0, 66.0, 123.0, 160.0, 259.0, 441.0, 812.0, 1279.0, 2497.0, 5165.0, 11566.0, 32259.0, 108556.0, 370343.0, 358759.0, 103291.0, 31142.0, 11239.0, 4784.0, 2403.0, 1287.0, 754.0, 395.0, 272.0, 171.0, 120.0, 75.0, 54.0, 34.0, 31.0, 23.0, 12.0, 8.0, 7.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08160400390625, -0.07888221740722656, -0.07616043090820312, -0.07343864440917969, -0.07071685791015625, -0.06799507141113281, -0.06527328491210938, -0.06255149841308594, -0.0598297119140625, -0.05710792541503906, -0.054386138916015625, -0.05166435241699219, -0.04894256591796875, -0.04622077941894531, -0.043498992919921875, -0.04077720642089844, -0.038055419921875, -0.03533363342285156, -0.032611846923828125, -0.029890060424804688, -0.02716827392578125, -0.024446487426757812, -0.021724700927734375, -0.019002914428710938, -0.0162811279296875, -0.013559341430664062, -0.010837554931640625, -0.008115768432617188, -0.00539398193359375, -0.0026721954345703125, 4.9591064453125e-05, 0.0027713775634765625, 0.0054931640625, 0.008214950561523438, 0.010936737060546875, 0.013658523559570312, 0.01638031005859375, 0.019102096557617188, 0.021823883056640625, 0.024545669555664062, 0.0272674560546875, 0.029989242553710938, 0.032711029052734375, 0.03543281555175781, 0.03815460205078125, 0.04087638854980469, 0.043598175048828125, 0.04631996154785156, 0.049041748046875, 0.05176353454589844, 0.054485321044921875, 0.05720710754394531, 0.05992889404296875, 0.06265068054199219, 0.06537246704101562, 0.06809425354003906, 0.0708160400390625, 0.07353782653808594, 0.07625961303710938, 0.07898139953613281, 0.08170318603515625, 0.08442497253417969, 0.08714675903320312, 0.08986854553222656, 0.09259033203125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 3.0, 6.0, 10.0, 12.0, 11.0, 14.0, 29.0, 24.0, 36.0, 30.0, 36.0, 38.0, 50.0, 51.0, 45.0, 54.0, 51.0, 50.0, 57.0, 49.0, 61.0, 42.0, 42.0, 30.0, 30.0, 16.0, 27.0, 24.0, 19.0, 13.0, 7.0, 10.0, 6.0, 2.0, 4.0, 3.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055694580078125, -0.053822994232177734, -0.05195140838623047, -0.0500798225402832, -0.04820823669433594, -0.04633665084838867, -0.044465065002441406, -0.04259347915649414, -0.040721893310546875, -0.03885030746459961, -0.036978721618652344, -0.03510713577270508, -0.03323554992675781, -0.03136396408081055, -0.02949237823486328, -0.027620792388916016, -0.02574920654296875, -0.023877620697021484, -0.02200603485107422, -0.020134449005126953, -0.018262863159179688, -0.016391277313232422, -0.014519691467285156, -0.01264810562133789, -0.010776519775390625, -0.00890493392944336, -0.007033348083496094, -0.005161762237548828, -0.0032901763916015625, -0.0014185905456542969, 0.00045299530029296875, 0.0023245811462402344, 0.0041961669921875, 0.006067752838134766, 0.007939338684082031, 0.009810924530029297, 0.011682510375976562, 0.013554096221923828, 0.015425682067871094, 0.01729726791381836, 0.019168853759765625, 0.02104043960571289, 0.022912025451660156, 0.024783611297607422, 0.026655197143554688, 0.028526782989501953, 0.03039836883544922, 0.032269954681396484, 0.03414154052734375, 0.036013126373291016, 0.03788471221923828, 0.03975629806518555, 0.04162788391113281, 0.04349946975708008, 0.045371055603027344, 0.04724264144897461, 0.049114227294921875, 0.05098581314086914, 0.052857398986816406, 0.05472898483276367, 0.05660057067871094, 0.0584721565246582, 0.06034374237060547, 0.062215328216552734, 0.0640869140625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 4.0, 10.0, 6.0, 16.0, 11.0, 14.0, 36.0, 39.0, 74.0, 100.0, 191.0, 292.0, 624.0, 1277.0, 3379.0, 11080.0, 53497.0, 593125.0, 326432.0, 43424.0, 9398.0, 2981.0, 1236.0, 548.0, 263.0, 182.0, 103.0, 61.0, 52.0, 34.0, 23.0, 16.0, 8.0, 3.0, 4.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.1512451171875, -0.14715099334716797, -0.14305686950683594, -0.1389627456665039, -0.13486862182617188, -0.13077449798583984, -0.1266803741455078, -0.12258625030517578, -0.11849212646484375, -0.11439800262451172, -0.11030387878417969, -0.10620975494384766, -0.10211563110351562, -0.0980215072631836, -0.09392738342285156, -0.08983325958251953, -0.0857391357421875, -0.08164501190185547, -0.07755088806152344, -0.0734567642211914, -0.06936264038085938, -0.06526851654052734, -0.06117439270019531, -0.05708026885986328, -0.05298614501953125, -0.04889202117919922, -0.04479789733886719, -0.040703773498535156, -0.036609649658203125, -0.032515525817871094, -0.028421401977539062, -0.02432727813720703, -0.020233154296875, -0.01613903045654297, -0.012044906616210938, -0.007950782775878906, -0.003856658935546875, 0.00023746490478515625, 0.0043315887451171875, 0.008425712585449219, 0.01251983642578125, 0.01661396026611328, 0.020708084106445312, 0.024802207946777344, 0.028896331787109375, 0.032990455627441406, 0.03708457946777344, 0.04117870330810547, 0.0452728271484375, 0.04936695098876953, 0.05346107482910156, 0.057555198669433594, 0.061649322509765625, 0.06574344635009766, 0.06983757019042969, 0.07393169403076172, 0.07802581787109375, 0.08211994171142578, 0.08621406555175781, 0.09030818939208984, 0.09440231323242188, 0.0984964370727539, 0.10259056091308594, 0.10668468475341797, 0.11077880859375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 2.0, 5.0, 3.0, 7.0, 8.0, 4.0, 9.0, 5.0, 13.0, 26.0, 20.0, 31.0, 40.0, 32.0, 35.0, 40.0, 50.0, 51.0, 64.0, 49.0, 55.0, 54.0, 51.0, 45.0, 51.0, 42.0, 28.0, 34.0, 36.0, 28.0, 23.0, 8.0, 7.0, 10.0, 8.0, 8.0, 4.0, 6.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.238037109375, -0.231414794921875, -0.22479248046875, -0.218170166015625, -0.2115478515625, -0.204925537109375, -0.19830322265625, -0.191680908203125, -0.18505859375, -0.178436279296875, -0.17181396484375, -0.165191650390625, -0.1585693359375, -0.151947021484375, -0.14532470703125, -0.138702392578125, -0.132080078125, -0.125457763671875, -0.11883544921875, -0.112213134765625, -0.1055908203125, -0.098968505859375, -0.09234619140625, -0.085723876953125, -0.0791015625, -0.072479248046875, -0.06585693359375, -0.059234619140625, -0.0526123046875, -0.045989990234375, -0.03936767578125, -0.032745361328125, -0.026123046875, -0.019500732421875, -0.01287841796875, -0.006256103515625, 0.0003662109375, 0.006988525390625, 0.01361083984375, 0.020233154296875, 0.02685546875, 0.033477783203125, 0.04010009765625, 0.046722412109375, 0.0533447265625, 0.059967041015625, 0.06658935546875, 0.073211669921875, 0.079833984375, 0.086456298828125, 0.09307861328125, 0.099700927734375, 0.1063232421875, 0.112945556640625, 0.11956787109375, 0.126190185546875, 0.1328125, 0.139434814453125, 0.14605712890625, 0.152679443359375, 0.1593017578125, 0.165924072265625, 0.17254638671875, 0.179168701171875, 0.185791015625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 8.0, 6.0, 20.0, 15.0, 31.0, 43.0, 33.0, 87.0, 148.0, 244.0, 431.0, 825.0, 1621.0, 3315.0, 7342.0, 18753.0, 54751.0, 202517.0, 596082.0, 107312.0, 32827.0, 12195.0, 4970.0, 2318.0, 1110.0, 667.0, 342.0, 197.0, 139.0, 81.0, 39.0, 37.0, 14.0, 16.0, 11.0, 7.0, 0.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.025390625, -0.02429962158203125, -0.0232086181640625, -0.02211761474609375, -0.021026611328125, -0.01993560791015625, -0.0188446044921875, -0.01775360107421875, -0.01666259765625, -0.01557159423828125, -0.0144805908203125, -0.01338958740234375, -0.012298583984375, -0.01120758056640625, -0.0101165771484375, -0.00902557373046875, -0.0079345703125, -0.00684356689453125, -0.0057525634765625, -0.00466156005859375, -0.003570556640625, -0.00247955322265625, -0.0013885498046875, -0.00029754638671875, 0.00079345703125, 0.00188446044921875, 0.0029754638671875, 0.00406646728515625, 0.005157470703125, 0.00624847412109375, 0.0073394775390625, 0.00843048095703125, 0.009521484375, 0.01061248779296875, 0.0117034912109375, 0.01279449462890625, 0.013885498046875, 0.01497650146484375, 0.0160675048828125, 0.01715850830078125, 0.01824951171875, 0.01934051513671875, 0.0204315185546875, 0.02152252197265625, 0.022613525390625, 0.02370452880859375, 0.0247955322265625, 0.02588653564453125, 0.0269775390625, 0.02806854248046875, 0.0291595458984375, 0.03025054931640625, 0.031341552734375, 0.03243255615234375, 0.0335235595703125, 0.03461456298828125, 0.03570556640625, 0.03679656982421875, 0.0378875732421875, 0.03897857666015625, 0.040069580078125, 0.04116058349609375, 0.0422515869140625, 0.04334259033203125, 0.04443359375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 7.0, 11.0, 12.0, 13.0, 18.0, 28.0, 35.0, 52.0, 49.0, 68.0, 72.0, 115.0, 102.0, 80.0, 71.0, 70.0, 53.0, 37.0, 29.0, 19.0, 9.0, 12.0, 8.0, 7.0, 9.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1219253540039062e-05, -2.0633451640605927e-05, -2.004764974117279e-05, -1.9461847841739655e-05, -1.887604594230652e-05, -1.8290244042873383e-05, -1.7704442143440247e-05, -1.711864024400711e-05, -1.6532838344573975e-05, -1.594703644514084e-05, -1.5361234545707703e-05, -1.4775432646274567e-05, -1.418963074684143e-05, -1.3603828847408295e-05, -1.3018026947975159e-05, -1.2432225048542023e-05, -1.1846423149108887e-05, -1.126062124967575e-05, -1.0674819350242615e-05, -1.0089017450809479e-05, -9.503215551376343e-06, -8.917413651943207e-06, -8.33161175251007e-06, -7.745809853076935e-06, -7.160007953643799e-06, -6.574206054210663e-06, -5.988404154777527e-06, -5.402602255344391e-06, -4.816800355911255e-06, -4.230998456478119e-06, -3.645196557044983e-06, -3.059394657611847e-06, -2.473592758178711e-06, -1.887790858745575e-06, -1.301988959312439e-06, -7.16187059879303e-07, -1.30385160446167e-07, 4.55416738986969e-07, 1.041218638420105e-06, 1.627020537853241e-06, 2.212822437286377e-06, 2.798624336719513e-06, 3.384426236152649e-06, 3.970228135585785e-06, 4.556030035018921e-06, 5.141831934452057e-06, 5.727633833885193e-06, 6.313435733318329e-06, 6.899237632751465e-06, 7.485039532184601e-06, 8.070841431617737e-06, 8.656643331050873e-06, 9.242445230484009e-06, 9.828247129917145e-06, 1.041404902935028e-05, 1.0999850928783417e-05, 1.1585652828216553e-05, 1.2171454727649689e-05, 1.2757256627082825e-05, 1.334305852651596e-05, 1.3928860425949097e-05, 1.4514662325382233e-05, 1.5100464224815369e-05, 1.5686266124248505e-05, 1.627206802368164e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 1.0, 3.0, 4.0, 7.0, 9.0, 19.0, 14.0, 37.0, 58.0, 118.0, 195.0, 395.0, 920.0, 2418.0, 7681.0, 33530.0, 226068.0, 687888.0, 69336.0, 13540.0, 3807.0, 1302.0, 595.0, 251.0, 138.0, 87.0, 47.0, 28.0, 28.0, 14.0, 5.0, 3.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048431396484375, -0.046651363372802734, -0.04487133026123047, -0.0430912971496582, -0.04131126403808594, -0.03953123092651367, -0.037751197814941406, -0.03597116470336914, -0.034191131591796875, -0.03241109848022461, -0.030631065368652344, -0.028851032257080078, -0.027070999145507812, -0.025290966033935547, -0.02351093292236328, -0.021730899810791016, -0.01995086669921875, -0.018170833587646484, -0.01639080047607422, -0.014610767364501953, -0.012830734252929688, -0.011050701141357422, -0.009270668029785156, -0.007490634918212891, -0.005710601806640625, -0.003930568695068359, -0.0021505355834960938, -0.0003705024719238281, 0.0014095306396484375, 0.003189563751220703, 0.004969596862792969, 0.006749629974365234, 0.0085296630859375, 0.010309696197509766, 0.012089729309082031, 0.013869762420654297, 0.015649795532226562, 0.017429828643798828, 0.019209861755371094, 0.02098989486694336, 0.022769927978515625, 0.02454996109008789, 0.026329994201660156, 0.028110027313232422, 0.029890060424804688, 0.03167009353637695, 0.03345012664794922, 0.035230159759521484, 0.03701019287109375, 0.038790225982666016, 0.04057025909423828, 0.04235029220581055, 0.04413032531738281, 0.04591035842895508, 0.047690391540527344, 0.04947042465209961, 0.051250457763671875, 0.05303049087524414, 0.054810523986816406, 0.05659055709838867, 0.05837059020996094, 0.0601506233215332, 0.06193065643310547, 0.06371068954467773, 0.06549072265625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 6.0, 6.0, 17.0, 13.0, 16.0, 30.0, 28.0, 30.0, 38.0, 60.0, 73.0, 111.0, 108.0, 101.0, 84.0, 59.0, 48.0, 27.0, 32.0, 26.0, 17.0, 15.0, 14.0, 6.0, 5.0, 6.0, 4.0, 5.0, 6.0, 2.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05499267578125, -0.0534820556640625, -0.051971435546875, -0.0504608154296875, -0.0489501953125, -0.0474395751953125, -0.045928955078125, -0.0444183349609375, -0.04290771484375, -0.0413970947265625, -0.039886474609375, -0.0383758544921875, -0.036865234375, -0.0353546142578125, -0.033843994140625, -0.0323333740234375, -0.03082275390625, -0.0293121337890625, -0.027801513671875, -0.0262908935546875, -0.0247802734375, -0.0232696533203125, -0.021759033203125, -0.0202484130859375, -0.01873779296875, -0.0172271728515625, -0.015716552734375, -0.0142059326171875, -0.0126953125, -0.0111846923828125, -0.009674072265625, -0.0081634521484375, -0.00665283203125, -0.0051422119140625, -0.003631591796875, -0.0021209716796875, -0.0006103515625, 0.0009002685546875, 0.002410888671875, 0.0039215087890625, 0.00543212890625, 0.0069427490234375, 0.008453369140625, 0.0099639892578125, 0.011474609375, 0.0129852294921875, 0.014495849609375, 0.0160064697265625, 0.01751708984375, 0.0190277099609375, 0.020538330078125, 0.0220489501953125, 0.0235595703125, 0.0250701904296875, 0.026580810546875, 0.0280914306640625, 0.02960205078125, 0.0311126708984375, 0.032623291015625, 0.0341339111328125, 0.03564453125, 0.0371551513671875, 0.038665771484375, 0.0401763916015625, 0.04168701171875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 6.0, 3.0, 3.0, 8.0, 8.0, 23.0, 39.0, 90.0, 148.0, 319.0, 190.0, 82.0, 52.0, 18.0, 7.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1870087385177612, -1.1456937789916992, -1.1043787002563477, -1.0630637407302856, -1.0217487812042236, -0.9804337024688721, -0.9391187429428101, -0.8978037238121033, -0.8564887046813965, -0.8151736855506897, -0.7738586664199829, -0.7325437068939209, -0.6912286877632141, -0.6499136686325073, -0.6085987091064453, -0.5672836899757385, -0.5259686708450317, -0.48465365171432495, -0.44333866238594055, -0.40202367305755615, -0.36070865392684937, -0.3193936347961426, -0.2780786454677582, -0.23676365613937378, -0.195448637008667, -0.1541336327791214, -0.1128186285495758, -0.07150362432003021, -0.03018862009048462, 0.011126384139060974, 0.05244138836860657, 0.09375637769699097, 0.1350712776184082, 0.1763862818479538, 0.2177012860774994, 0.2590162754058838, 0.3003312945365906, 0.34164631366729736, 0.38296130299568176, 0.42427629232406616, 0.46559131145477295, 0.5069063305854797, 0.5482213497161865, 0.5895363092422485, 0.6308513283729553, 0.6721663475036621, 0.7134813070297241, 0.7547963261604309, 0.7961113452911377, 0.8374263644218445, 0.8787413835525513, 0.9200563430786133, 0.9613713622093201, 1.0026863813400269, 1.0440013408660889, 1.0853164196014404, 1.1266313791275024, 1.1679463386535645, 1.209261417388916, 1.250576376914978, 1.29189133644104, 1.3332064151763916, 1.3745213747024536, 1.4158363342285156, 1.4571514129638672]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 4.0, 11.0, 8.0, 7.0, 9.0, 9.0, 10.0, 20.0, 7.0, 22.0, 24.0, 21.0, 24.0, 32.0, 23.0, 31.0, 50.0, 46.0, 59.0, 71.0, 76.0, 72.0, 61.0, 45.0, 28.0, 32.0, 37.0, 27.0, 16.0, 21.0, 12.0, 13.0, 15.0, 10.0, 9.0, 12.0, 8.0, 6.0, 2.0, 3.0, 2.0, 0.0, 7.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.706863284111023, -0.6832928657531738, -0.6597223877906799, -0.6361519694328308, -0.6125814914703369, -0.5890110731124878, -0.5654406547546387, -0.5418702363967896, -0.5182997584342957, -0.49472931027412415, -0.47115886211395264, -0.4475884437561035, -0.424017995595932, -0.4004475474357605, -0.3768771290779114, -0.35330668091773987, -0.32973623275756836, -0.30616578459739685, -0.28259533643722534, -0.2590249180793762, -0.2354544699192047, -0.2118840217590332, -0.1883135885000229, -0.16474315524101257, -0.14117270708084106, -0.11760226637125015, -0.09403182566165924, -0.07046138495206833, -0.04689094424247742, -0.023320503532886505, 0.00024993717670440674, 0.02382037043571472, 0.04739081859588623, 0.07096125930547714, 0.09453170001506805, 0.11810214072465897, 0.14167258143424988, 0.1652430295944214, 0.1888134628534317, 0.21238389611244202, 0.23595434427261353, 0.25952479243278503, 0.28309524059295654, 0.30666565895080566, 0.3302361071109772, 0.3538065552711487, 0.3773769736289978, 0.4009474217891693, 0.4245178699493408, 0.44808831810951233, 0.47165876626968384, 0.49522918462753296, 0.5187996625900269, 0.542370080947876, 0.5659404993057251, 0.5895109176635742, 0.6130813956260681, 0.6366518139839172, 0.6602222919464111, 0.6837927103042603, 0.7073631286621094, 0.7309336066246033, 0.7545040249824524, 0.7780745029449463, 0.8016449213027954]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 2.0, 2.0, 6.0, 6.0, 8.0, 16.0, 23.0, 34.0, 45.0, 63.0, 133.0, 186.0, 326.0, 539.0, 944.0, 1787.0, 3716.0, 8684.0, 24871.0, 104970.0, 705011.0, 2558197.0, 650420.0, 95682.0, 22690.0, 8050.0, 3556.0, 1819.0, 946.0, 591.0, 378.0, 195.0, 121.0, 85.0, 64.0, 29.0, 34.0, 20.0, 19.0, 12.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06561279296875, -0.06322479248046875, -0.0608367919921875, -0.05844879150390625, -0.056060791015625, -0.05367279052734375, -0.0512847900390625, -0.04889678955078125, -0.0465087890625, -0.04412078857421875, -0.0417327880859375, -0.03934478759765625, -0.036956787109375, -0.03456878662109375, -0.0321807861328125, -0.02979278564453125, -0.02740478515625, -0.02501678466796875, -0.0226287841796875, -0.02024078369140625, -0.017852783203125, -0.01546478271484375, -0.0130767822265625, -0.01068878173828125, -0.00830078125, -0.00591278076171875, -0.0035247802734375, -0.00113677978515625, 0.001251220703125, 0.00363922119140625, 0.0060272216796875, 0.00841522216796875, 0.01080322265625, 0.01319122314453125, 0.0155792236328125, 0.01796722412109375, 0.020355224609375, 0.02274322509765625, 0.0251312255859375, 0.02751922607421875, 0.0299072265625, 0.03229522705078125, 0.0346832275390625, 0.03707122802734375, 0.039459228515625, 0.04184722900390625, 0.0442352294921875, 0.04662322998046875, 0.04901123046875, 0.05139923095703125, 0.0537872314453125, 0.05617523193359375, 0.058563232421875, 0.06095123291015625, 0.0633392333984375, 0.06572723388671875, 0.068115234375, 0.07050323486328125, 0.0728912353515625, 0.07527923583984375, 0.077667236328125, 0.08005523681640625, 0.0824432373046875, 0.08483123779296875, 0.08721923828125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 3.0, 2.0, 7.0, 6.0, 11.0, 11.0, 8.0, 13.0, 17.0, 21.0, 18.0, 22.0, 25.0, 30.0, 40.0, 48.0, 52.0, 44.0, 46.0, 34.0, 37.0, 49.0, 37.0, 31.0, 45.0, 45.0, 33.0, 39.0, 35.0, 25.0, 23.0, 13.0, 25.0, 20.0, 11.0, 10.0, 15.0, 10.0, 8.0, 8.0, 3.0, 3.0, 4.0, 7.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04779052734375, -0.04626941680908203, -0.04474830627441406, -0.043227195739746094, -0.041706085205078125, -0.040184974670410156, -0.03866386413574219, -0.03714275360107422, -0.03562164306640625, -0.03410053253173828, -0.03257942199707031, -0.031058311462402344, -0.029537200927734375, -0.028016090393066406, -0.026494979858398438, -0.02497386932373047, -0.0234527587890625, -0.02193164825439453, -0.020410537719726562, -0.018889427185058594, -0.017368316650390625, -0.015847206115722656, -0.014326095581054688, -0.012804985046386719, -0.01128387451171875, -0.009762763977050781, -0.008241653442382812, -0.006720542907714844, -0.005199432373046875, -0.0036783218383789062, -0.0021572113037109375, -0.0006361007690429688, 0.000885009765625, 0.0024061203002929688, 0.0039272308349609375, 0.005448341369628906, 0.006969451904296875, 0.008490562438964844, 0.010011672973632812, 0.011532783508300781, 0.01305389404296875, 0.014575004577636719, 0.016096115112304688, 0.017617225646972656, 0.019138336181640625, 0.020659446716308594, 0.022180557250976562, 0.02370166778564453, 0.0252227783203125, 0.02674388885498047, 0.028264999389648438, 0.029786109924316406, 0.031307220458984375, 0.032828330993652344, 0.03434944152832031, 0.03587055206298828, 0.03739166259765625, 0.03891277313232422, 0.04043388366699219, 0.041954994201660156, 0.043476104736328125, 0.044997215270996094, 0.04651832580566406, 0.04803943634033203, 0.049560546875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 9.0, 8.0, 16.0, 22.0, 42.0, 76.0, 134.0, 296.0, 890.0, 5281.0, 107682.0, 3944523.0, 127618.0, 6108.0, 970.0, 279.0, 138.0, 78.0, 47.0, 32.0, 12.0, 11.0, 4.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32763671875, -0.3197460174560547, -0.3118553161621094, -0.30396461486816406, -0.29607391357421875, -0.28818321228027344, -0.2802925109863281, -0.2724018096923828, -0.2645111083984375, -0.2566204071044922, -0.24872970581054688, -0.24083900451660156, -0.23294830322265625, -0.22505760192871094, -0.21716690063476562, -0.2092761993408203, -0.201385498046875, -0.1934947967529297, -0.18560409545898438, -0.17771339416503906, -0.16982269287109375, -0.16193199157714844, -0.15404129028320312, -0.1461505889892578, -0.1382598876953125, -0.1303691864013672, -0.12247848510742188, -0.11458778381347656, -0.10669708251953125, -0.09880638122558594, -0.09091567993164062, -0.08302497863769531, -0.07513427734375, -0.06724357604980469, -0.059352874755859375, -0.05146217346191406, -0.04357147216796875, -0.03568077087402344, -0.027790069580078125, -0.019899368286132812, -0.0120086669921875, -0.0041179656982421875, 0.003772735595703125, 0.011663436889648438, 0.01955413818359375, 0.027444839477539062, 0.035335540771484375, 0.04322624206542969, 0.051116943359375, 0.05900764465332031, 0.06689834594726562, 0.07478904724121094, 0.08267974853515625, 0.09057044982910156, 0.09846115112304688, 0.10635185241699219, 0.1142425537109375, 0.12213325500488281, 0.13002395629882812, 0.13791465759277344, 0.14580535888671875, 0.15369606018066406, 0.16158676147460938, 0.1694774627685547, 0.1773681640625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 6.0, 11.0, 10.0, 8.0, 18.0, 23.0, 29.0, 28.0, 45.0, 49.0, 92.0, 123.0, 151.0, 228.0, 352.0, 453.0, 594.0, 536.0, 402.0, 271.0, 189.0, 120.0, 74.0, 56.0, 49.0, 30.0, 24.0, 18.0, 22.0, 13.0, 9.0, 6.0, 7.0, 2.0, 5.0, 3.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08837890625, -0.0852975845336914, -0.08221626281738281, -0.07913494110107422, -0.07605361938476562, -0.07297229766845703, -0.06989097595214844, -0.06680965423583984, -0.06372833251953125, -0.060647010803222656, -0.05756568908691406, -0.05448436737060547, -0.051403045654296875, -0.04832172393798828, -0.04524040222167969, -0.042159080505371094, -0.0390777587890625, -0.035996437072753906, -0.03291511535644531, -0.02983379364013672, -0.026752471923828125, -0.02367115020751953, -0.020589828491210938, -0.017508506774902344, -0.01442718505859375, -0.011345863342285156, -0.008264541625976562, -0.005183219909667969, -0.002101898193359375, 0.0009794235229492188, 0.0040607452392578125, 0.007142066955566406, 0.010223388671875, 0.013304710388183594, 0.016386032104492188, 0.01946735382080078, 0.022548675537109375, 0.02562999725341797, 0.028711318969726562, 0.031792640686035156, 0.03487396240234375, 0.037955284118652344, 0.04103660583496094, 0.04411792755126953, 0.047199249267578125, 0.05028057098388672, 0.05336189270019531, 0.056443214416503906, 0.0595245361328125, 0.0626058578491211, 0.06568717956542969, 0.06876850128173828, 0.07184982299804688, 0.07493114471435547, 0.07801246643066406, 0.08109378814697266, 0.08417510986328125, 0.08725643157958984, 0.09033775329589844, 0.09341907501220703, 0.09650039672851562, 0.09958171844482422, 0.10266304016113281, 0.1057443618774414, 0.10882568359375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 4.0, 5.0, 12.0, 17.0, 34.0, 61.0, 100.0, 141.0, 157.0, 165.0, 119.0, 74.0, 45.0, 23.0, 13.0, 12.0, 7.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3923041820526123, -1.3603432178497314, -1.3283822536468506, -1.2964212894439697, -1.2644603252410889, -1.2324994802474976, -1.2005385160446167, -1.1685775518417358, -1.136616587638855, -1.1046556234359741, -1.0726946592330933, -1.0407336950302124, -1.008772850036621, -0.9768118262290955, -0.9448509216308594, -0.9128899574279785, -0.8809289932250977, -0.8489680290222168, -0.8170070648193359, -0.7850461602210999, -0.753085196018219, -0.7211242318153381, -0.689163327217102, -0.6572023630142212, -0.6252413988113403, -0.5932804346084595, -0.5613194704055786, -0.5293585658073425, -0.49739760160446167, -0.4654366374015808, -0.43347570300102234, -0.40151476860046387, -0.3695538640022278, -0.3375928997993469, -0.30563196539878845, -0.27367103099823, -0.24171006679534912, -0.20974911749362946, -0.1777881681919098, -0.14582721889019012, -0.11386626958847046, -0.0819053202867508, -0.04994437098503113, -0.017983421683311462, 0.013977527618408203, 0.04593847692012787, 0.07789942622184753, 0.1098603755235672, 0.14182132482528687, 0.17378227412700653, 0.2057432234287262, 0.23770417273044586, 0.2696651220321655, 0.3016260862350464, 0.33358702063560486, 0.36554795503616333, 0.3975089192390442, 0.42946988344192505, 0.4614308178424835, 0.493391752243042, 0.5253527164459229, 0.5573136806488037, 0.5892746448516846, 0.6212355494499207, 0.6531965136528015]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 7.0, 6.0, 1.0, 5.0, 3.0, 7.0, 14.0, 7.0, 15.0, 10.0, 18.0, 14.0, 22.0, 21.0, 29.0, 26.0, 23.0, 29.0, 37.0, 41.0, 39.0, 55.0, 42.0, 37.0, 44.0, 39.0, 44.0, 29.0, 34.0, 36.0, 29.0, 29.0, 26.0, 34.0, 22.0, 16.0, 21.0, 13.0, 16.0, 11.0, 14.0, 7.0, 9.0, 4.0, 5.0, 9.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.4441753029823303, -0.4309903681278229, -0.41780543327331543, -0.404620498418808, -0.39143556356430054, -0.3782505989074707, -0.36506566405296326, -0.3518807291984558, -0.33869579434394836, -0.3255108594894409, -0.31232592463493347, -0.299140989780426, -0.2859560251235962, -0.27277112007141113, -0.2595861554145813, -0.24640122056007385, -0.2332162857055664, -0.22003135085105896, -0.2068464159965515, -0.19366146624088287, -0.18047653138637543, -0.16729159653186798, -0.15410664677619934, -0.1409217119216919, -0.12773677706718445, -0.114551842212677, -0.10136689990758896, -0.08818195760250092, -0.07499702274799347, -0.06181208789348602, -0.04862714558839798, -0.035442203283309937, -0.02225726842880249, -0.009072329849004745, 0.004112608730792999, 0.017297547310590744, 0.03048248589038849, 0.043667420744895935, 0.05685236304998398, 0.07003730535507202, 0.08322224020957947, 0.09640717506408691, 0.10959211736917496, 0.122777059674263, 0.13596199452877045, 0.1491469293832779, 0.16233187913894653, 0.17551681399345398, 0.18870174884796143, 0.20188668370246887, 0.21507161855697632, 0.22825656831264496, 0.2414415031671524, 0.25462645292282104, 0.2678113877773285, 0.28099632263183594, 0.2941812574863434, 0.30736619234085083, 0.3205511271953583, 0.3337360620498657, 0.34692102670669556, 0.3601059317588806, 0.37329089641571045, 0.3864758312702179, 0.39966076612472534]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 9.0, 4.0, 8.0, 8.0, 18.0, 30.0, 36.0, 55.0, 81.0, 150.0, 208.0, 379.0, 642.0, 1222.0, 2377.0, 5110.0, 12100.0, 29815.0, 86796.0, 294932.0, 407995.0, 133728.0, 43036.0, 16380.0, 6750.0, 3156.0, 1563.0, 805.0, 456.0, 255.0, 163.0, 99.0, 69.0, 43.0, 30.0, 22.0, 16.0, 11.0, 4.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.09588623046875, -0.09323596954345703, -0.09058570861816406, -0.0879354476928711, -0.08528518676757812, -0.08263492584228516, -0.07998466491699219, -0.07733440399169922, -0.07468414306640625, -0.07203388214111328, -0.06938362121582031, -0.06673336029052734, -0.06408309936523438, -0.061432838439941406, -0.05878257751464844, -0.05613231658935547, -0.0534820556640625, -0.05083179473876953, -0.04818153381347656, -0.045531272888183594, -0.042881011962890625, -0.040230751037597656, -0.03758049011230469, -0.03493022918701172, -0.03227996826171875, -0.02962970733642578, -0.026979446411132812, -0.024329185485839844, -0.021678924560546875, -0.019028663635253906, -0.016378402709960938, -0.013728141784667969, -0.011077880859375, -0.008427619934082031, -0.0057773590087890625, -0.0031270980834960938, -0.000476837158203125, 0.0021734237670898438, 0.0048236846923828125, 0.007473945617675781, 0.01012420654296875, 0.012774467468261719, 0.015424728393554688, 0.018074989318847656, 0.020725250244140625, 0.023375511169433594, 0.026025772094726562, 0.02867603302001953, 0.0313262939453125, 0.03397655487060547, 0.03662681579589844, 0.039277076721191406, 0.041927337646484375, 0.044577598571777344, 0.04722785949707031, 0.04987812042236328, 0.05252838134765625, 0.05517864227294922, 0.05782890319824219, 0.060479164123535156, 0.06312942504882812, 0.0657796859741211, 0.06842994689941406, 0.07108020782470703, 0.07373046875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 4.0, 6.0, 9.0, 6.0, 7.0, 7.0, 8.0, 13.0, 12.0, 20.0, 12.0, 17.0, 24.0, 28.0, 22.0, 30.0, 34.0, 37.0, 39.0, 44.0, 41.0, 35.0, 51.0, 39.0, 37.0, 35.0, 42.0, 53.0, 39.0, 23.0, 32.0, 32.0, 19.0, 26.0, 15.0, 24.0, 10.0, 7.0, 11.0, 9.0, 11.0, 5.0, 7.0, 8.0, 3.0, 3.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04931640625, -0.04781532287597656, -0.046314239501953125, -0.04481315612792969, -0.04331207275390625, -0.04181098937988281, -0.040309906005859375, -0.03880882263183594, -0.0373077392578125, -0.03580665588378906, -0.034305572509765625, -0.03280448913574219, -0.03130340576171875, -0.029802322387695312, -0.028301239013671875, -0.026800155639648438, -0.025299072265625, -0.023797988891601562, -0.022296905517578125, -0.020795822143554688, -0.01929473876953125, -0.017793655395507812, -0.016292572021484375, -0.014791488647460938, -0.0132904052734375, -0.011789321899414062, -0.010288238525390625, -0.008787155151367188, -0.00728607177734375, -0.0057849884033203125, -0.004283905029296875, -0.0027828216552734375, -0.00128173828125, 0.0002193450927734375, 0.001720428466796875, 0.0032215118408203125, 0.00472259521484375, 0.0062236785888671875, 0.007724761962890625, 0.009225845336914062, 0.0107269287109375, 0.012228012084960938, 0.013729095458984375, 0.015230178833007812, 0.01673126220703125, 0.018232345581054688, 0.019733428955078125, 0.021234512329101562, 0.022735595703125, 0.024236679077148438, 0.025737762451171875, 0.027238845825195312, 0.02873992919921875, 0.030241012573242188, 0.031742095947265625, 0.03324317932128906, 0.0347442626953125, 0.03624534606933594, 0.037746429443359375, 0.03924751281738281, 0.04074859619140625, 0.04224967956542969, 0.043750762939453125, 0.04525184631347656, 0.0467529296875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 7.0, 6.0, 1.0, 12.0, 20.0, 21.0, 23.0, 32.0, 55.0, 95.0, 131.0, 214.0, 344.0, 651.0, 1283.0, 3048.0, 8928.0, 34519.0, 219314.0, 690311.0, 67077.0, 14234.0, 4379.0, 1830.0, 828.0, 448.0, 241.0, 185.0, 119.0, 57.0, 44.0, 33.0, 26.0, 13.0, 6.0, 8.0, 4.0, 3.0, 4.0, 6.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1431884765625, -0.13923263549804688, -0.13527679443359375, -0.13132095336914062, -0.1273651123046875, -0.12340927124023438, -0.11945343017578125, -0.11549758911132812, -0.111541748046875, -0.10758590698242188, -0.10363006591796875, -0.09967422485351562, -0.0957183837890625, -0.09176254272460938, -0.08780670166015625, -0.08385086059570312, -0.07989501953125, -0.07593917846679688, -0.07198333740234375, -0.06802749633789062, -0.0640716552734375, -0.060115814208984375, -0.05615997314453125, -0.052204132080078125, -0.048248291015625, -0.044292449951171875, -0.04033660888671875, -0.036380767822265625, -0.0324249267578125, -0.028469085693359375, -0.02451324462890625, -0.020557403564453125, -0.0166015625, -0.012645721435546875, -0.00868988037109375, -0.004734039306640625, -0.0007781982421875, 0.003177642822265625, 0.00713348388671875, 0.011089324951171875, 0.015045166015625, 0.019001007080078125, 0.02295684814453125, 0.026912689208984375, 0.0308685302734375, 0.034824371337890625, 0.03878021240234375, 0.042736053466796875, 0.04669189453125, 0.050647735595703125, 0.05460357666015625, 0.058559417724609375, 0.0625152587890625, 0.06647109985351562, 0.07042694091796875, 0.07438278198242188, 0.078338623046875, 0.08229446411132812, 0.08625030517578125, 0.09020614624023438, 0.0941619873046875, 0.09811782836914062, 0.10207366943359375, 0.10602951049804688, 0.1099853515625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 10.0, 5.0, 8.0, 10.0, 13.0, 14.0, 23.0, 26.0, 27.0, 38.0, 49.0, 55.0, 60.0, 62.0, 59.0, 73.0, 65.0, 52.0, 50.0, 62.0, 31.0, 45.0, 36.0, 29.0, 29.0, 25.0, 6.0, 9.0, 9.0, 3.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.314208984375, -0.3063220977783203, -0.2984352111816406, -0.29054832458496094, -0.28266143798828125, -0.27477455139160156, -0.2668876647949219, -0.2590007781982422, -0.2511138916015625, -0.2432270050048828, -0.23534011840820312, -0.22745323181152344, -0.21956634521484375, -0.21167945861816406, -0.20379257202148438, -0.1959056854248047, -0.188018798828125, -0.1801319122314453, -0.17224502563476562, -0.16435813903808594, -0.15647125244140625, -0.14858436584472656, -0.14069747924804688, -0.1328105926513672, -0.1249237060546875, -0.11703681945800781, -0.10914993286132812, -0.10126304626464844, -0.09337615966796875, -0.08548927307128906, -0.07760238647460938, -0.06971549987792969, -0.06182861328125, -0.05394172668457031, -0.046054840087890625, -0.03816795349121094, -0.03028106689453125, -0.022394180297851562, -0.014507293701171875, -0.0066204071044921875, 0.0012664794921875, 0.009153366088867188, 0.017040252685546875, 0.024927139282226562, 0.03281402587890625, 0.04070091247558594, 0.048587799072265625, 0.05647468566894531, 0.064361572265625, 0.07224845886230469, 0.08013534545898438, 0.08802223205566406, 0.09590911865234375, 0.10379600524902344, 0.11168289184570312, 0.11956977844238281, 0.1274566650390625, 0.1353435516357422, 0.14323043823242188, 0.15111732482910156, 0.15900421142578125, 0.16689109802246094, 0.17477798461914062, 0.1826648712158203, 0.1905517578125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 6.0, 9.0, 14.0, 13.0, 28.0, 38.0, 54.0, 86.0, 128.0, 245.0, 538.0, 1256.0, 3009.0, 8354.0, 27160.0, 117923.0, 702873.0, 140075.0, 31250.0, 9512.0, 3307.0, 1379.0, 582.0, 290.0, 156.0, 90.0, 60.0, 37.0, 26.0, 15.0, 7.0, 9.0, 8.0, 4.0, 1.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034759521484375, -0.033621788024902344, -0.03248405456542969, -0.03134632110595703, -0.030208587646484375, -0.02907085418701172, -0.027933120727539062, -0.026795387268066406, -0.02565765380859375, -0.024519920349121094, -0.023382186889648438, -0.02224445343017578, -0.021106719970703125, -0.01996898651123047, -0.018831253051757812, -0.017693519592285156, -0.0165557861328125, -0.015418052673339844, -0.014280319213867188, -0.013142585754394531, -0.012004852294921875, -0.010867118835449219, -0.009729385375976562, -0.008591651916503906, -0.00745391845703125, -0.006316184997558594, -0.0051784515380859375, -0.004040718078613281, -0.002902984619140625, -0.0017652511596679688, -0.0006275177001953125, 0.0005102157592773438, 0.00164794921875, 0.0027856826782226562, 0.0039234161376953125, 0.005061149597167969, 0.006198883056640625, 0.007336616516113281, 0.008474349975585938, 0.009612083435058594, 0.01074981689453125, 0.011887550354003906, 0.013025283813476562, 0.014163017272949219, 0.015300750732421875, 0.01643848419189453, 0.017576217651367188, 0.018713951110839844, 0.0198516845703125, 0.020989418029785156, 0.022127151489257812, 0.02326488494873047, 0.024402618408203125, 0.02554035186767578, 0.026678085327148438, 0.027815818786621094, 0.02895355224609375, 0.030091285705566406, 0.031229019165039062, 0.03236675262451172, 0.033504486083984375, 0.03464221954345703, 0.03577995300292969, 0.036917686462402344, 0.038055419921875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 4.0, 6.0, 4.0, 7.0, 7.0, 11.0, 14.0, 16.0, 22.0, 24.0, 48.0, 53.0, 85.0, 88.0, 92.0, 103.0, 87.0, 80.0, 54.0, 51.0, 27.0, 21.0, 26.0, 11.0, 13.0, 5.0, 9.0, 12.0, 6.0, 7.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.531839370727539e-05, -1.471489667892456e-05, -1.411139965057373e-05, -1.35079026222229e-05, -1.290440559387207e-05, -1.230090856552124e-05, -1.169741153717041e-05, -1.109391450881958e-05, -1.049041748046875e-05, -9.88692045211792e-06, -9.28342342376709e-06, -8.67992639541626e-06, -8.07642936706543e-06, -7.4729323387146e-06, -6.8694353103637695e-06, -6.2659382820129395e-06, -5.662441253662109e-06, -5.058944225311279e-06, -4.455447196960449e-06, -3.851950168609619e-06, -3.248453140258789e-06, -2.644956111907959e-06, -2.041459083557129e-06, -1.4379620552062988e-06, -8.344650268554688e-07, -2.3096799850463867e-07, 3.725290298461914e-07, 9.760260581970215e-07, 1.5795230865478516e-06, 2.1830201148986816e-06, 2.7865171432495117e-06, 3.390014171600342e-06, 3.993511199951172e-06, 4.597008228302002e-06, 5.200505256652832e-06, 5.804002285003662e-06, 6.407499313354492e-06, 7.010996341705322e-06, 7.614493370056152e-06, 8.217990398406982e-06, 8.821487426757812e-06, 9.424984455108643e-06, 1.0028481483459473e-05, 1.0631978511810303e-05, 1.1235475540161133e-05, 1.1838972568511963e-05, 1.2442469596862793e-05, 1.3045966625213623e-05, 1.3649463653564453e-05, 1.4252960681915283e-05, 1.4856457710266113e-05, 1.5459954738616943e-05, 1.6063451766967773e-05, 1.6666948795318604e-05, 1.7270445823669434e-05, 1.7873942852020264e-05, 1.8477439880371094e-05, 1.9080936908721924e-05, 1.9684433937072754e-05, 2.0287930965423584e-05, 2.0891427993774414e-05, 2.1494925022125244e-05, 2.2098422050476074e-05, 2.2701919078826904e-05, 2.3305416107177734e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 4.0, 10.0, 12.0, 16.0, 23.0, 33.0, 36.0, 52.0, 100.0, 149.0, 267.0, 445.0, 803.0, 1574.0, 3428.0, 8035.0, 21706.0, 72809.0, 416582.0, 412823.0, 72797.0, 21791.0, 8140.0, 3464.0, 1519.0, 763.0, 424.0, 262.0, 152.0, 117.0, 92.0, 36.0, 19.0, 19.0, 7.0, 10.0, 7.0, 5.0, 10.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0295562744140625, -0.02860283851623535, -0.027649402618408203, -0.026695966720581055, -0.025742530822753906, -0.024789094924926758, -0.02383565902709961, -0.02288222312927246, -0.021928787231445312, -0.020975351333618164, -0.020021915435791016, -0.019068479537963867, -0.01811504364013672, -0.01716160774230957, -0.016208171844482422, -0.015254735946655273, -0.014301300048828125, -0.013347864151000977, -0.012394428253173828, -0.01144099235534668, -0.010487556457519531, -0.009534120559692383, -0.008580684661865234, -0.007627248764038086, -0.0066738128662109375, -0.005720376968383789, -0.004766941070556641, -0.003813505172729492, -0.0028600692749023438, -0.0019066333770751953, -0.0009531974792480469, 2.384185791015625e-07, 0.00095367431640625, 0.0019071102142333984, 0.002860546112060547, 0.0038139820098876953, 0.004767417907714844, 0.005720853805541992, 0.006674289703369141, 0.007627725601196289, 0.008581161499023438, 0.009534597396850586, 0.010488033294677734, 0.011441469192504883, 0.012394905090332031, 0.01334834098815918, 0.014301776885986328, 0.015255212783813477, 0.016208648681640625, 0.017162084579467773, 0.018115520477294922, 0.01906895637512207, 0.02002239227294922, 0.020975828170776367, 0.021929264068603516, 0.022882699966430664, 0.023836135864257812, 0.02478957176208496, 0.02574300765991211, 0.026696443557739258, 0.027649879455566406, 0.028603315353393555, 0.029556751251220703, 0.03051018714904785, 0.031463623046875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 3.0, 6.0, 6.0, 2.0, 17.0, 8.0, 23.0, 20.0, 27.0, 30.0, 43.0, 54.0, 61.0, 92.0, 84.0, 94.0, 74.0, 76.0, 64.0, 48.0, 45.0, 27.0, 21.0, 10.0, 15.0, 5.0, 14.0, 13.0, 5.0, 3.0, 2.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034423828125, -0.033111572265625, -0.03179931640625, -0.030487060546875, -0.0291748046875, -0.027862548828125, -0.02655029296875, -0.025238037109375, -0.02392578125, -0.022613525390625, -0.02130126953125, -0.019989013671875, -0.0186767578125, -0.017364501953125, -0.01605224609375, -0.014739990234375, -0.013427734375, -0.012115478515625, -0.01080322265625, -0.009490966796875, -0.0081787109375, -0.006866455078125, -0.00555419921875, -0.004241943359375, -0.0029296875, -0.001617431640625, -0.00030517578125, 0.001007080078125, 0.0023193359375, 0.003631591796875, 0.00494384765625, 0.006256103515625, 0.007568359375, 0.008880615234375, 0.01019287109375, 0.011505126953125, 0.0128173828125, 0.014129638671875, 0.01544189453125, 0.016754150390625, 0.01806640625, 0.019378662109375, 0.02069091796875, 0.022003173828125, 0.0233154296875, 0.024627685546875, 0.02593994140625, 0.027252197265625, 0.028564453125, 0.029876708984375, 0.03118896484375, 0.032501220703125, 0.0338134765625, 0.035125732421875, 0.03643798828125, 0.037750244140625, 0.0390625, 0.040374755859375, 0.04168701171875, 0.042999267578125, 0.0443115234375, 0.045623779296875, 0.04693603515625, 0.048248291015625, 0.049560546875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 7.0, 18.0, 29.0, 70.0, 205.0, 399.0, 148.0, 75.0, 29.0, 11.0, 4.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.105802059173584, -2.052506923675537, -1.9992116689682007, -1.9459164142608643, -1.8926211595535278, -1.8393259048461914, -1.7860307693481445, -1.732735514640808, -1.6794402599334717, -1.6261450052261353, -1.5728498697280884, -1.519554615020752, -1.4662593603134155, -1.412964105606079, -1.3596689701080322, -1.3063737154006958, -1.253078579902649, -1.1997833251953125, -1.1464881896972656, -1.0931929349899292, -1.0398976802825928, -0.9866024851799011, -0.9333072900772095, -0.880012035369873, -0.8267168402671814, -0.7734216451644897, -0.7201263904571533, -0.6668311953544617, -0.61353600025177, -0.5602407455444336, -0.5069455504417419, -0.4536503255367279, -0.4003552198410034, -0.3470599949359894, -0.29376477003097534, -0.2404695749282837, -0.18717435002326965, -0.13387912511825562, -0.08058393001556396, -0.027288705110549927, 0.02600651979446411, 0.07930173724889755, 0.132596954703331, 0.18589216470718384, 0.23918738961219788, 0.2924826145172119, 0.34577780961990356, 0.3990730345249176, 0.45236825942993164, 0.5056634545326233, 0.5589587092399597, 0.6122539043426514, 0.6655491590499878, 0.7188443541526794, 0.7721395492553711, 0.8254348039627075, 0.8787299990653992, 0.9320251941680908, 0.9853204488754272, 1.0386157035827637, 1.0919108390808105, 1.145206093788147, 1.1985013484954834, 1.2517964839935303, 1.3050917387008667]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 4.0, 8.0, 4.0, 9.0, 8.0, 11.0, 14.0, 19.0, 20.0, 28.0, 22.0, 29.0, 28.0, 49.0, 59.0, 80.0, 94.0, 89.0, 78.0, 50.0, 37.0, 40.0, 32.0, 23.0, 27.0, 16.0, 23.0, 13.0, 21.0, 10.0, 10.0, 7.0, 11.0, 7.0, 4.0, 2.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.8954162001609802, -0.8705326318740845, -0.845649003982544, -0.8207653760910034, -0.7958818078041077, -0.7709982395172119, -0.7461146116256714, -0.7212309837341309, -0.6963474154472351, -0.6714638471603394, -0.6465802192687988, -0.6216965913772583, -0.5968130230903625, -0.5719294548034668, -0.5470458269119263, -0.5221621990203857, -0.49727863073349, -0.47239503264427185, -0.4475114345550537, -0.42262783646583557, -0.39774423837661743, -0.3728606402873993, -0.34797704219818115, -0.323093444108963, -0.2982098460197449, -0.27332624793052673, -0.2484426498413086, -0.22355905175209045, -0.19867545366287231, -0.17379185557365417, -0.14890825748443604, -0.1240246593952179, -0.09914106130599976, -0.07425746321678162, -0.04937386512756348, -0.024490267038345337, 0.00039333105087280273, 0.025276929140090942, 0.05016052722930908, 0.07504412531852722, 0.09992772340774536, 0.1248113214969635, 0.14969491958618164, 0.17457851767539978, 0.19946211576461792, 0.22434571385383606, 0.2492293119430542, 0.27411291003227234, 0.2989965081214905, 0.3238801062107086, 0.34876370429992676, 0.3736473023891449, 0.39853090047836304, 0.4234144985675812, 0.4482980966567993, 0.47318169474601746, 0.4980652928352356, 0.5229488611221313, 0.5478324890136719, 0.5727161169052124, 0.5975996851921082, 0.6224832534790039, 0.6473668813705444, 0.672250509262085, 0.6971340775489807]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 10.0, 13.0, 10.0, 21.0, 38.0, 55.0, 83.0, 155.0, 250.0, 396.0, 760.0, 1435.0, 2897.0, 6542.0, 17188.0, 54241.0, 223531.0, 1077675.0, 2029715.0, 600563.0, 122850.0, 33320.0, 12165.0, 4974.0, 2381.0, 1245.0, 649.0, 371.0, 255.0, 163.0, 105.0, 75.0, 45.0, 38.0, 19.0, 17.0, 6.0, 11.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.099365234375, -0.0961923599243164, -0.09301948547363281, -0.08984661102294922, -0.08667373657226562, -0.08350086212158203, -0.08032798767089844, -0.07715511322021484, -0.07398223876953125, -0.07080936431884766, -0.06763648986816406, -0.06446361541748047, -0.061290740966796875, -0.05811786651611328, -0.05494499206542969, -0.051772117614746094, -0.0485992431640625, -0.045426368713378906, -0.04225349426269531, -0.03908061981201172, -0.035907745361328125, -0.03273487091064453, -0.029561996459960938, -0.026389122009277344, -0.02321624755859375, -0.020043373107910156, -0.016870498657226562, -0.013697624206542969, -0.010524749755859375, -0.007351875305175781, -0.0041790008544921875, -0.0010061264038085938, 0.002166748046875, 0.005339622497558594, 0.008512496948242188, 0.011685371398925781, 0.014858245849609375, 0.01803112030029297, 0.021203994750976562, 0.024376869201660156, 0.02754974365234375, 0.030722618103027344, 0.03389549255371094, 0.03706836700439453, 0.040241241455078125, 0.04341411590576172, 0.04658699035644531, 0.049759864807128906, 0.0529327392578125, 0.056105613708496094, 0.05927848815917969, 0.06245136260986328, 0.06562423706054688, 0.06879711151123047, 0.07196998596191406, 0.07514286041259766, 0.07831573486328125, 0.08148860931396484, 0.08466148376464844, 0.08783435821533203, 0.09100723266601562, 0.09418010711669922, 0.09735298156738281, 0.1005258560180664, 0.10369873046875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 3.0, 3.0, 4.0, 3.0, 7.0, 8.0, 7.0, 12.0, 10.0, 13.0, 17.0, 24.0, 20.0, 22.0, 32.0, 33.0, 28.0, 37.0, 44.0, 38.0, 42.0, 41.0, 39.0, 46.0, 50.0, 50.0, 37.0, 36.0, 36.0, 31.0, 29.0, 34.0, 24.0, 26.0, 18.0, 24.0, 9.0, 11.0, 12.0, 7.0, 14.0, 5.0, 2.0, 1.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04644775390625, -0.044939517974853516, -0.04343128204345703, -0.04192304611206055, -0.04041481018066406, -0.03890657424926758, -0.037398338317871094, -0.03589010238647461, -0.034381866455078125, -0.03287363052368164, -0.031365394592285156, -0.029857158660888672, -0.028348922729492188, -0.026840686798095703, -0.02533245086669922, -0.023824214935302734, -0.02231597900390625, -0.020807743072509766, -0.01929950714111328, -0.017791271209716797, -0.016283035278320312, -0.014774799346923828, -0.013266563415527344, -0.01175832748413086, -0.010250091552734375, -0.00874185562133789, -0.007233619689941406, -0.005725383758544922, -0.0042171478271484375, -0.002708911895751953, -0.0012006759643554688, 0.0003075599670410156, 0.0018157958984375, 0.0033240318298339844, 0.004832267761230469, 0.006340503692626953, 0.007848739624023438, 0.009356975555419922, 0.010865211486816406, 0.01237344741821289, 0.013881683349609375, 0.01538991928100586, 0.016898155212402344, 0.018406391143798828, 0.019914627075195312, 0.021422863006591797, 0.02293109893798828, 0.024439334869384766, 0.02594757080078125, 0.027455806732177734, 0.02896404266357422, 0.030472278594970703, 0.03198051452636719, 0.03348875045776367, 0.034996986389160156, 0.03650522232055664, 0.038013458251953125, 0.03952169418334961, 0.041029930114746094, 0.04253816604614258, 0.04404640197753906, 0.04555463790893555, 0.04706287384033203, 0.048571109771728516, 0.050079345703125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 6.0, 14.0, 15.0, 20.0, 40.0, 44.0, 88.0, 108.0, 175.0, 262.0, 508.0, 1131.0, 3232.0, 16470.0, 776648.0, 3353766.0, 34159.0, 4675.0, 1392.0, 663.0, 318.0, 176.0, 110.0, 83.0, 52.0, 24.0, 28.0, 16.0, 12.0, 15.0, 8.0, 3.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.434326171875, -0.4223060607910156, -0.41028594970703125, -0.3982658386230469, -0.3862457275390625, -0.3742256164550781, -0.36220550537109375, -0.3501853942871094, -0.338165283203125, -0.3261451721191406, -0.31412506103515625, -0.3021049499511719, -0.2900848388671875, -0.2780647277832031, -0.26604461669921875, -0.2540245056152344, -0.24200439453125, -0.22998428344726562, -0.21796417236328125, -0.20594406127929688, -0.1939239501953125, -0.18190383911132812, -0.16988372802734375, -0.15786361694335938, -0.145843505859375, -0.13382339477539062, -0.12180328369140625, -0.10978317260742188, -0.0977630615234375, -0.08574295043945312, -0.07372283935546875, -0.061702728271484375, -0.0496826171875, -0.037662506103515625, -0.02564239501953125, -0.013622283935546875, -0.0016021728515625, 0.010417938232421875, 0.02243804931640625, 0.034458160400390625, 0.046478271484375, 0.058498382568359375, 0.07051849365234375, 0.08253860473632812, 0.0945587158203125, 0.10657882690429688, 0.11859893798828125, 0.13061904907226562, 0.14263916015625, 0.15465927124023438, 0.16667938232421875, 0.17869949340820312, 0.1907196044921875, 0.20273971557617188, 0.21475982666015625, 0.22677993774414062, 0.238800048828125, 0.2508201599121094, 0.26284027099609375, 0.2748603820800781, 0.2868804931640625, 0.2989006042480469, 0.31092071533203125, 0.3229408264160156, 0.3349609375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 5.0, 5.0, 2.0, 9.0, 11.0, 19.0, 17.0, 25.0, 49.0, 43.0, 48.0, 78.0, 129.0, 163.0, 189.0, 273.0, 369.0, 402.0, 450.0, 400.0, 321.0, 269.0, 184.0, 149.0, 108.0, 73.0, 81.0, 45.0, 36.0, 32.0, 22.0, 17.0, 16.0, 6.0, 10.0, 2.0, 2.0, 7.0, 2.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1507568359375, -0.1457843780517578, -0.14081192016601562, -0.13583946228027344, -0.13086700439453125, -0.12589454650878906, -0.12092208862304688, -0.11594963073730469, -0.1109771728515625, -0.10600471496582031, -0.10103225708007812, -0.09605979919433594, -0.09108734130859375, -0.08611488342285156, -0.08114242553710938, -0.07616996765136719, -0.071197509765625, -0.06622505187988281, -0.061252593994140625, -0.05628013610839844, -0.05130767822265625, -0.04633522033691406, -0.041362762451171875, -0.03639030456542969, -0.0314178466796875, -0.026445388793945312, -0.021472930908203125, -0.016500473022460938, -0.01152801513671875, -0.0065555572509765625, -0.001583099365234375, 0.0033893585205078125, 0.00836181640625, 0.013334274291992188, 0.018306732177734375, 0.023279190063476562, 0.02825164794921875, 0.03322410583496094, 0.038196563720703125, 0.04316902160644531, 0.0481414794921875, 0.05311393737792969, 0.058086395263671875, 0.06305885314941406, 0.06803131103515625, 0.07300376892089844, 0.07797622680664062, 0.08294868469238281, 0.087921142578125, 0.09289360046386719, 0.09786605834960938, 0.10283851623535156, 0.10781097412109375, 0.11278343200683594, 0.11775588989257812, 0.12272834777832031, 0.1277008056640625, 0.1326732635498047, 0.13764572143554688, 0.14261817932128906, 0.14759063720703125, 0.15256309509277344, 0.15753555297851562, 0.1625080108642578, 0.16748046875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 11.0, 7.0, 7.0, 17.0, 37.0, 88.0, 161.0, 213.0, 223.0, 115.0, 69.0, 23.0, 10.0, 6.0, 7.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.9089221954345703, -3.8128654956817627, -3.716808557510376, -3.6207518577575684, -3.5246949195861816, -3.428638219833374, -3.3325815200805664, -3.2365245819091797, -3.140467882156372, -3.0444111824035645, -2.9483542442321777, -2.85229754447937, -2.7562408447265625, -2.660183906555176, -2.564127206802368, -2.4680705070495605, -2.372013568878174, -2.275956869125366, -2.1798999309539795, -2.083843231201172, -1.9877864122390747, -1.8917295932769775, -1.79567289352417, -1.6996160745620728, -1.6035592555999756, -1.5075024366378784, -1.4114456176757812, -1.3153889179229736, -1.2193320989608765, -1.1232752799987793, -1.0272185802459717, -0.9311617612838745, -0.8351047039031982, -0.7390478849411011, -0.6429911255836487, -0.5469343662261963, -0.4508775472640991, -0.35482075810432434, -0.25876396894454956, -0.16270720958709717, -0.066650390625, 0.02940639853477478, 0.12546318769454956, 0.22151997685432434, 0.3175767660140991, 0.4136335551738739, 0.5096903443336487, 0.6057471036911011, 0.7018039226531982, 0.7978607416152954, 0.8939175009727478, 0.9899742603302002, 1.0860310792922974, 1.1820878982543945, 1.2781445980072021, 1.3742014169692993, 1.4702582359313965, 1.5663150548934937, 1.6623718738555908, 1.7584285736083984, 1.8544853925704956, 1.9505422115325928, 2.0465989112854004, 2.142655849456787, 2.2387125492095947]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 4.0, 7.0, 3.0, 11.0, 8.0, 8.0, 13.0, 15.0, 13.0, 11.0, 24.0, 24.0, 36.0, 25.0, 25.0, 33.0, 34.0, 26.0, 45.0, 46.0, 46.0, 52.0, 43.0, 46.0, 43.0, 45.0, 26.0, 43.0, 26.0, 26.0, 21.0, 30.0, 17.0, 17.0, 13.0, 16.0, 10.0, 10.0, 10.0, 10.0, 10.0, 6.0, 10.0, 3.0, 3.0, 1.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.8835044503211975, -0.854857861995697, -0.8262112140655518, -0.7975646257400513, -0.7689180374145508, -0.7402713894844055, -0.711624801158905, -0.6829781532287598, -0.6543315649032593, -0.6256849765777588, -0.5970383286476135, -0.568391740322113, -0.5397450923919678, -0.5110985040664673, -0.4824519157409668, -0.4538052976131439, -0.42515867948532104, -0.39651206135749817, -0.3678654432296753, -0.3392188549041748, -0.31057223677635193, -0.28192561864852905, -0.25327903032302856, -0.2246324121952057, -0.1959857940673828, -0.16733917593955994, -0.13869257271289825, -0.11004596203565598, -0.0813993513584137, -0.05275273323059082, -0.024106130003929138, 0.004540473222732544, 0.033187150955200195, 0.061833761632442474, 0.09048037230968475, 0.11912698298692703, 0.1477735936641693, 0.1764202117919922, 0.20506681501865387, 0.23371341824531555, 0.2623600363731384, 0.2910066545009613, 0.3196532726287842, 0.34829986095428467, 0.37694647908210754, 0.4055930972099304, 0.4342396855354309, 0.4628863036632538, 0.49153292179107666, 0.5201795101165771, 0.5488261580467224, 0.5774727463722229, 0.6061193943023682, 0.6347659826278687, 0.6634125709533691, 0.6920591592788696, 0.7207058072090149, 0.7493523955345154, 0.7779990434646606, 0.8066456317901611, 0.8352922201156616, 0.8639388680458069, 0.8925854563713074, 0.9212321043014526, 0.9498786926269531]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 4.0, 7.0, 6.0, 10.0, 16.0, 25.0, 43.0, 62.0, 75.0, 127.0, 195.0, 298.0, 429.0, 691.0, 1036.0, 1720.0, 3027.0, 5328.0, 10033.0, 20578.0, 45123.0, 112434.0, 395497.0, 288356.0, 88842.0, 37225.0, 17237.0, 8750.0, 4583.0, 2639.0, 1540.0, 903.0, 605.0, 346.0, 239.0, 164.0, 121.0, 76.0, 43.0, 38.0, 28.0, 26.0, 11.0, 9.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0731201171875, -0.07096195220947266, -0.06880378723144531, -0.06664562225341797, -0.06448745727539062, -0.06232929229736328, -0.06017112731933594, -0.058012962341308594, -0.05585479736328125, -0.053696632385253906, -0.05153846740722656, -0.04938030242919922, -0.047222137451171875, -0.04506397247314453, -0.04290580749511719, -0.040747642517089844, -0.0385894775390625, -0.036431312561035156, -0.03427314758300781, -0.03211498260498047, -0.029956817626953125, -0.02779865264892578, -0.025640487670898438, -0.023482322692871094, -0.02132415771484375, -0.019165992736816406, -0.017007827758789062, -0.014849662780761719, -0.012691497802734375, -0.010533332824707031, -0.008375167846679688, -0.006217002868652344, -0.004058837890625, -0.0019006729125976562, 0.0002574920654296875, 0.0024156570434570312, 0.004573822021484375, 0.006731986999511719, 0.008890151977539062, 0.011048316955566406, 0.01320648193359375, 0.015364646911621094, 0.017522811889648438, 0.01968097686767578, 0.021839141845703125, 0.02399730682373047, 0.026155471801757812, 0.028313636779785156, 0.0304718017578125, 0.032629966735839844, 0.03478813171386719, 0.03694629669189453, 0.039104461669921875, 0.04126262664794922, 0.04342079162597656, 0.045578956604003906, 0.04773712158203125, 0.049895286560058594, 0.05205345153808594, 0.05421161651611328, 0.056369781494140625, 0.05852794647216797, 0.06068611145019531, 0.06284427642822266, 0.06500244140625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 4.0, 4.0, 6.0, 9.0, 5.0, 11.0, 14.0, 8.0, 10.0, 21.0, 21.0, 20.0, 36.0, 41.0, 40.0, 39.0, 44.0, 42.0, 56.0, 45.0, 39.0, 47.0, 41.0, 45.0, 47.0, 31.0, 36.0, 34.0, 35.0, 24.0, 21.0, 26.0, 12.0, 16.0, 16.0, 11.0, 8.0, 8.0, 4.0, 5.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0726318359375, -0.07026100158691406, -0.06789016723632812, -0.06551933288574219, -0.06314849853515625, -0.06077766418457031, -0.058406829833984375, -0.05603599548339844, -0.0536651611328125, -0.05129432678222656, -0.048923492431640625, -0.04655265808105469, -0.04418182373046875, -0.04181098937988281, -0.039440155029296875, -0.03706932067871094, -0.034698486328125, -0.03232765197753906, -0.029956817626953125, -0.027585983276367188, -0.02521514892578125, -0.022844314575195312, -0.020473480224609375, -0.018102645874023438, -0.0157318115234375, -0.013360977172851562, -0.010990142822265625, -0.008619308471679688, -0.00624847412109375, -0.0038776397705078125, -0.001506805419921875, 0.0008640289306640625, 0.00323486328125, 0.0056056976318359375, 0.007976531982421875, 0.010347366333007812, 0.01271820068359375, 0.015089035034179688, 0.017459869384765625, 0.019830703735351562, 0.0222015380859375, 0.024572372436523438, 0.026943206787109375, 0.029314041137695312, 0.03168487548828125, 0.03405570983886719, 0.036426544189453125, 0.03879737854003906, 0.041168212890625, 0.04353904724121094, 0.045909881591796875, 0.04828071594238281, 0.05065155029296875, 0.05302238464355469, 0.055393218994140625, 0.05776405334472656, 0.0601348876953125, 0.06250572204589844, 0.06487655639648438, 0.06724739074707031, 0.06961822509765625, 0.07198905944824219, 0.07435989379882812, 0.07673072814941406, 0.0791015625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 6.0, 8.0, 13.0, 20.0, 38.0, 59.0, 133.0, 227.0, 400.0, 1135.0, 4488.0, 33634.0, 924628.0, 74031.0, 7163.0, 1577.0, 537.0, 221.0, 108.0, 53.0, 29.0, 15.0, 12.0, 9.0, 5.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.255859375, -0.24847412109375, -0.2410888671875, -0.23370361328125, -0.226318359375, -0.21893310546875, -0.2115478515625, -0.20416259765625, -0.19677734375, -0.18939208984375, -0.1820068359375, -0.17462158203125, -0.167236328125, -0.15985107421875, -0.1524658203125, -0.14508056640625, -0.1376953125, -0.13031005859375, -0.1229248046875, -0.11553955078125, -0.108154296875, -0.10076904296875, -0.0933837890625, -0.08599853515625, -0.07861328125, -0.07122802734375, -0.0638427734375, -0.05645751953125, -0.049072265625, -0.04168701171875, -0.0343017578125, -0.02691650390625, -0.01953125, -0.01214599609375, -0.0047607421875, 0.00262451171875, 0.010009765625, 0.01739501953125, 0.0247802734375, 0.03216552734375, 0.03955078125, 0.04693603515625, 0.0543212890625, 0.06170654296875, 0.069091796875, 0.07647705078125, 0.0838623046875, 0.09124755859375, 0.0986328125, 0.10601806640625, 0.1134033203125, 0.12078857421875, 0.128173828125, 0.13555908203125, 0.1429443359375, 0.15032958984375, 0.15771484375, 0.16510009765625, 0.1724853515625, 0.17987060546875, 0.187255859375, 0.19464111328125, 0.2020263671875, 0.20941162109375, 0.216796875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 2.0, 2.0, 3.0, 12.0, 7.0, 4.0, 8.0, 9.0, 10.0, 10.0, 14.0, 16.0, 22.0, 25.0, 29.0, 34.0, 41.0, 47.0, 72.0, 66.0, 78.0, 84.0, 69.0, 81.0, 50.0, 38.0, 23.0, 25.0, 24.0, 20.0, 16.0, 13.0, 12.0, 11.0, 5.0, 6.0, 3.0, 3.0, 3.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34814453125, -0.3368034362792969, -0.32546234130859375, -0.3141212463378906, -0.3027801513671875, -0.2914390563964844, -0.28009796142578125, -0.2687568664550781, -0.257415771484375, -0.24607467651367188, -0.23473358154296875, -0.22339248657226562, -0.2120513916015625, -0.20071029663085938, -0.18936920166015625, -0.17802810668945312, -0.16668701171875, -0.15534591674804688, -0.14400482177734375, -0.13266372680664062, -0.1213226318359375, -0.10998153686523438, -0.09864044189453125, -0.08729934692382812, -0.075958251953125, -0.06461715698242188, -0.05327606201171875, -0.041934967041015625, -0.0305938720703125, -0.019252777099609375, -0.00791168212890625, 0.003429412841796875, 0.0147705078125, 0.026111602783203125, 0.03745269775390625, 0.048793792724609375, 0.0601348876953125, 0.07147598266601562, 0.08281707763671875, 0.09415817260742188, 0.105499267578125, 0.11684036254882812, 0.12818145751953125, 0.13952255249023438, 0.1508636474609375, 0.16220474243164062, 0.17354583740234375, 0.18488693237304688, 0.19622802734375, 0.20756912231445312, 0.21891021728515625, 0.23025131225585938, 0.2415924072265625, 0.2529335021972656, 0.26427459716796875, 0.2756156921386719, 0.286956787109375, 0.2982978820800781, 0.30963897705078125, 0.3209800720214844, 0.3323211669921875, 0.3436622619628906, 0.35500335693359375, 0.3663444519042969, 0.377685546875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 6.0, 5.0, 2.0, 9.0, 11.0, 6.0, 20.0, 14.0, 18.0, 37.0, 42.0, 50.0, 76.0, 117.0, 166.0, 279.0, 464.0, 1062.0, 2347.0, 6899.0, 30214.0, 762292.0, 211221.0, 23247.0, 5779.0, 2014.0, 858.0, 469.0, 249.0, 163.0, 116.0, 74.0, 62.0, 36.0, 28.0, 25.0, 20.0, 15.0, 9.0, 7.0, 10.0, 3.0, 4.0, 1.0, 7.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04010009765625, -0.03871345520019531, -0.037326812744140625, -0.03594017028808594, -0.03455352783203125, -0.03316688537597656, -0.031780242919921875, -0.030393600463867188, -0.0290069580078125, -0.027620315551757812, -0.026233673095703125, -0.024847030639648438, -0.02346038818359375, -0.022073745727539062, -0.020687103271484375, -0.019300460815429688, -0.017913818359375, -0.016527175903320312, -0.015140533447265625, -0.013753890991210938, -0.01236724853515625, -0.010980606079101562, -0.009593963623046875, -0.008207321166992188, -0.0068206787109375, -0.0054340362548828125, -0.004047393798828125, -0.0026607513427734375, -0.00127410888671875, 0.0001125335693359375, 0.001499176025390625, 0.0028858184814453125, 0.0042724609375, 0.0056591033935546875, 0.007045745849609375, 0.008432388305664062, 0.00981903076171875, 0.011205673217773438, 0.012592315673828125, 0.013978958129882812, 0.0153656005859375, 0.016752243041992188, 0.018138885498046875, 0.019525527954101562, 0.02091217041015625, 0.022298812866210938, 0.023685455322265625, 0.025072097778320312, 0.026458740234375, 0.027845382690429688, 0.029232025146484375, 0.030618667602539062, 0.03200531005859375, 0.03339195251464844, 0.034778594970703125, 0.03616523742675781, 0.0375518798828125, 0.03893852233886719, 0.040325164794921875, 0.04171180725097656, 0.04309844970703125, 0.04448509216308594, 0.045871734619140625, 0.04725837707519531, 0.04864501953125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 6.0, 9.0, 9.0, 9.0, 11.0, 11.0, 19.0, 24.0, 20.0, 30.0, 33.0, 49.0, 54.0, 63.0, 87.0, 70.0, 72.0, 72.0, 63.0, 57.0, 32.0, 44.0, 32.0, 29.0, 16.0, 18.0, 8.0, 13.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 6.0, 2.0, 5.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4185905456542969e-05, -1.3763085007667542e-05, -1.3340264558792114e-05, -1.2917444109916687e-05, -1.249462366104126e-05, -1.2071803212165833e-05, -1.1648982763290405e-05, -1.1226162314414978e-05, -1.080334186553955e-05, -1.0380521416664124e-05, -9.957700967788696e-06, -9.534880518913269e-06, -9.112060070037842e-06, -8.689239621162415e-06, -8.266419172286987e-06, -7.84359872341156e-06, -7.420778274536133e-06, -6.9979578256607056e-06, -6.575137376785278e-06, -6.152316927909851e-06, -5.729496479034424e-06, -5.306676030158997e-06, -4.883855581283569e-06, -4.461035132408142e-06, -4.038214683532715e-06, -3.6153942346572876e-06, -3.1925737857818604e-06, -2.769753336906433e-06, -2.346932888031006e-06, -1.9241124391555786e-06, -1.5012919902801514e-06, -1.0784715414047241e-06, -6.556510925292969e-07, -2.3283064365386963e-07, 1.8998980522155762e-07, 6.128102540969849e-07, 1.0356307029724121e-06, 1.4584511518478394e-06, 1.8812716007232666e-06, 2.304092049598694e-06, 2.726912498474121e-06, 3.1497329473495483e-06, 3.5725533962249756e-06, 3.995373845100403e-06, 4.41819429397583e-06, 4.841014742851257e-06, 5.2638351917266846e-06, 5.686655640602112e-06, 6.109476089477539e-06, 6.532296538352966e-06, 6.9551169872283936e-06, 7.377937436103821e-06, 7.800757884979248e-06, 8.223578333854675e-06, 8.646398782730103e-06, 9.06921923160553e-06, 9.492039680480957e-06, 9.914860129356384e-06, 1.0337680578231812e-05, 1.0760501027107239e-05, 1.1183321475982666e-05, 1.1606141924858093e-05, 1.202896237373352e-05, 1.2451782822608948e-05, 1.2874603271484375e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 5.0, 7.0, 9.0, 13.0, 18.0, 29.0, 60.0, 132.0, 290.0, 878.0, 3826.0, 24295.0, 889860.0, 115957.0, 10274.0, 1957.0, 527.0, 202.0, 88.0, 41.0, 28.0, 22.0, 15.0, 5.0, 9.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0736083984375, -0.07149219512939453, -0.06937599182128906, -0.0672597885131836, -0.06514358520507812, -0.06302738189697266, -0.06091117858886719, -0.05879497528076172, -0.05667877197265625, -0.05456256866455078, -0.05244636535644531, -0.050330162048339844, -0.048213958740234375, -0.046097755432128906, -0.04398155212402344, -0.04186534881591797, -0.0397491455078125, -0.03763294219970703, -0.03551673889160156, -0.033400535583496094, -0.031284332275390625, -0.029168128967285156, -0.027051925659179688, -0.02493572235107422, -0.02281951904296875, -0.02070331573486328, -0.018587112426757812, -0.016470909118652344, -0.014354705810546875, -0.012238502502441406, -0.010122299194335938, -0.008006095886230469, -0.005889892578125, -0.0037736892700195312, -0.0016574859619140625, 0.00045871734619140625, 0.002574920654296875, 0.004691123962402344, 0.0068073272705078125, 0.008923530578613281, 0.01103973388671875, 0.013155937194824219, 0.015272140502929688, 0.017388343811035156, 0.019504547119140625, 0.021620750427246094, 0.023736953735351562, 0.02585315704345703, 0.0279693603515625, 0.03008556365966797, 0.03220176696777344, 0.034317970275878906, 0.036434173583984375, 0.038550376892089844, 0.04066658020019531, 0.04278278350830078, 0.04489898681640625, 0.04701519012451172, 0.04913139343261719, 0.051247596740722656, 0.053363800048828125, 0.055480003356933594, 0.05759620666503906, 0.05971240997314453, 0.06182861328125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 4.0, 4.0, 4.0, 9.0, 10.0, 9.0, 7.0, 9.0, 11.0, 9.0, 15.0, 15.0, 28.0, 54.0, 58.0, 84.0, 107.0, 110.0, 119.0, 80.0, 59.0, 47.0, 18.0, 19.0, 23.0, 24.0, 10.0, 8.0, 11.0, 9.0, 10.0, 9.0, 6.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.04913330078125, -0.047570228576660156, -0.04600715637207031, -0.04444408416748047, -0.042881011962890625, -0.04131793975830078, -0.03975486755371094, -0.038191795349121094, -0.03662872314453125, -0.035065650939941406, -0.03350257873535156, -0.03193950653076172, -0.030376434326171875, -0.02881336212158203, -0.027250289916992188, -0.025687217712402344, -0.0241241455078125, -0.022561073303222656, -0.020998001098632812, -0.01943492889404297, -0.017871856689453125, -0.01630878448486328, -0.014745712280273438, -0.013182640075683594, -0.01161956787109375, -0.010056495666503906, -0.008493423461914062, -0.006930351257324219, -0.005367279052734375, -0.0038042068481445312, -0.0022411346435546875, -0.0006780624389648438, 0.000885009765625, 0.0024480819702148438, 0.0040111541748046875, 0.005574226379394531, 0.007137298583984375, 0.008700370788574219, 0.010263442993164062, 0.011826515197753906, 0.01338958740234375, 0.014952659606933594, 0.016515731811523438, 0.01807880401611328, 0.019641876220703125, 0.02120494842529297, 0.022768020629882812, 0.024331092834472656, 0.0258941650390625, 0.027457237243652344, 0.029020309448242188, 0.03058338165283203, 0.032146453857421875, 0.03370952606201172, 0.03527259826660156, 0.036835670471191406, 0.03839874267578125, 0.039961814880371094, 0.04152488708496094, 0.04308795928955078, 0.044651031494140625, 0.04621410369873047, 0.04777717590332031, 0.049340248107910156, 0.0509033203125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 4.0, 8.0, 9.0, 18.0, 43.0, 80.0, 268.0, 363.0, 107.0, 38.0, 33.0, 14.0, 10.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0455381870269775, -1.9872790575027466, -1.9290199279785156, -1.8707609176635742, -1.8125017881393433, -1.7542426586151123, -1.695983648300171, -1.63772451877594, -1.579465389251709, -1.521206259727478, -1.462947130203247, -1.4046881198883057, -1.3464289903640747, -1.2881698608398438, -1.2299108505249023, -1.1716517210006714, -1.1133925914764404, -1.0551334619522095, -0.9968743920326233, -0.9386153221130371, -0.8803561925888062, -0.8220970630645752, -0.763837993144989, -0.7055789232254028, -0.6473197937011719, -0.5890606641769409, -0.5308015942573547, -0.47254249453544617, -0.4142833948135376, -0.35602429509162903, -0.29776519536972046, -0.2395060956478119, -0.18124699592590332, -0.12298789620399475, -0.06472879648208618, -0.006469696760177612, 0.05178940296173096, 0.11004850268363953, 0.1683076024055481, 0.22656670212745667, 0.28482580184936523, 0.3430849015712738, 0.4013440012931824, 0.45960310101509094, 0.5178622007369995, 0.5761213302612305, 0.6343804001808167, 0.6926394701004028, 0.7508985996246338, 0.8091577291488647, 0.8674167990684509, 0.9256758689880371, 0.9839349985122681, 1.042194128036499, 1.1004531383514404, 1.1587122678756714, 1.2169713973999023, 1.2752305269241333, 1.3334896564483643, 1.3917486667633057, 1.4500077962875366, 1.5082669258117676, 1.566525936126709, 1.62478506565094, 1.683044195175171]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 1.0, 3.0, 6.0, 8.0, 4.0, 10.0, 10.0, 11.0, 17.0, 25.0, 21.0, 20.0, 41.0, 45.0, 63.0, 73.0, 87.0, 88.0, 71.0, 78.0, 51.0, 46.0, 32.0, 24.0, 25.0, 26.0, 17.0, 10.0, 7.0, 16.0, 11.0, 9.0, 5.0, 11.0, 6.0, 3.0, 3.0, 1.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.0160033702850342, -0.9856521487236023, -0.9553009271621704, -0.9249496459960938, -0.8945984244346619, -0.86424720287323, -0.8338959813117981, -0.8035447597503662, -0.7731934785842896, -0.7428422570228577, -0.7124910354614258, -0.6821397542953491, -0.6517885327339172, -0.6214373111724854, -0.5910860896110535, -0.5607348680496216, -0.5303835868835449, -0.500032365322113, -0.46968111395835876, -0.4393298923969269, -0.4089786410331726, -0.3786274194717407, -0.34827619791030884, -0.31792494654655457, -0.28757375478744507, -0.2572225332260132, -0.2268712818622589, -0.19652006030082703, -0.16616880893707275, -0.13581758737564087, -0.10546635091304779, -0.07511511445045471, -0.04476386308670044, -0.01441262848675251, 0.01593860611319542, 0.0462898388504982, 0.07664107531309128, 0.10699230432510376, 0.13734354078769684, 0.16769477725028992, 0.198046013712883, 0.22839725017547607, 0.25874847173690796, 0.28909972310066223, 0.3194509446620941, 0.3498021960258484, 0.3801534175872803, 0.41050463914871216, 0.44085589051246643, 0.4712071120738983, 0.5015583634376526, 0.5319095849990845, 0.5622608065605164, 0.5926120281219482, 0.6229633092880249, 0.6533145308494568, 0.6836657524108887, 0.7140169739723206, 0.7443681955337524, 0.7747194766998291, 0.805070698261261, 0.8354219198226929, 0.8657731413841248, 0.8961243629455566, 0.9264756441116333]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 8.0, 7.0, 18.0, 15.0, 11.0, 25.0, 21.0, 12.0, 24.0, 26.0, 29.0, 33.0, 15.0, 43.0, 65.0, 124.0, 151.0, 70.0, 39.0, 30.0, 36.0, 23.0, 20.0, 24.0, 23.0, 23.0, 15.0, 10.0, 8.0, 8.0, 11.0, 8.0, 8.0, 5.0, 5.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0712890625, -0.06891536712646484, -0.06654167175292969, -0.06416797637939453, -0.061794281005859375, -0.05942058563232422, -0.05704689025878906, -0.054673194885253906, -0.05229949951171875, -0.049925804138183594, -0.04755210876464844, -0.04517841339111328, -0.042804718017578125, -0.04043102264404297, -0.03805732727050781, -0.035683631896972656, -0.0333099365234375, -0.030936241149902344, -0.028562545776367188, -0.02618885040283203, -0.023815155029296875, -0.02144145965576172, -0.019067764282226562, -0.016694068908691406, -0.01432037353515625, -0.011946678161621094, -0.009572982788085938, -0.007199287414550781, -0.004825592041015625, -0.0024518966674804688, -7.82012939453125e-05, 0.0022954940795898438, 0.004669189453125, 0.007042884826660156, 0.009416580200195312, 0.011790275573730469, 0.014163970947265625, 0.01653766632080078, 0.018911361694335938, 0.021285057067871094, 0.02365875244140625, 0.026032447814941406, 0.028406143188476562, 0.03077983856201172, 0.033153533935546875, 0.03552722930908203, 0.03790092468261719, 0.040274620056152344, 0.0426483154296875, 0.045022010803222656, 0.04739570617675781, 0.04976940155029297, 0.052143096923828125, 0.05451679229736328, 0.05689048767089844, 0.059264183044433594, 0.06163787841796875, 0.0640115737915039, 0.06638526916503906, 0.06875896453857422, 0.07113265991210938, 0.07350635528564453, 0.07588005065917969, 0.07825374603271484, 0.08062744140625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 2.0, 6.0, 3.0, 4.0, 1.0, 7.0, 1.0, 5.0, 5.0, 9.0, 20.0, 13.0, 25.0, 33.0, 45.0, 53.0, 103.0, 132.0, 247.0, 489.0, 1103.0, 2891.0, 9028.0, 154523.0, 8198933.0, 13901.0, 3907.0, 1548.0, 671.0, 303.0, 194.0, 97.0, 63.0, 56.0, 39.0, 22.0, 25.0, 23.0, 9.0, 7.0, 7.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 3.0, 5.0, 2.0, 2.0], "bins": [-0.4251953363418579, -0.4119632840156555, -0.3987312316894531, -0.3854992091655731, -0.3722671568393707, -0.35903510451316833, -0.34580308198928833, -0.33257102966308594, -0.31933897733688354, -0.30610692501068115, -0.29287487268447876, -0.27964285016059875, -0.26641079783439636, -0.25317874550819397, -0.23994670808315277, -0.22671467065811157, -0.21348261833190918, -0.2002505660057068, -0.1870185285806656, -0.1737864911556244, -0.160554438829422, -0.1473223865032196, -0.1340903490781784, -0.12085830420255661, -0.10762625932693481, -0.09439421445131302, -0.08116216957569122, -0.06793012470006943, -0.05469807982444763, -0.041466034948825836, -0.02823399007320404, -0.015001945197582245, -0.0017699003219604492, 0.011462144553661346, 0.024694189429283142, 0.03792623430490494, 0.05115827918052673, 0.06439032405614853, 0.07762236893177032, 0.09085441380739212, 0.10408645868301392, 0.11731850355863571, 0.1305505484342575, 0.1437825858592987, 0.1570146381855011, 0.1702466905117035, 0.1834787279367447, 0.1967107653617859, 0.20994281768798828, 0.22317487001419067, 0.23640690743923187, 0.24963894486427307, 0.26287099719047546, 0.27610304951667786, 0.28933507204055786, 0.30256712436676025, 0.31579917669296265, 0.32903122901916504, 0.34226328134536743, 0.35549530386924744, 0.36872735619544983, 0.3819594085216522, 0.3951914310455322, 0.4084234833717346, 0.421655535697937]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 6.0, 4.0, 7.0, 1.0, 3.0, 7.0, 4.0, 5.0, 6.0, 4.0, 1.0, 7.0, 2.0, 4.0, 4.0, 3.0, 4.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8421979546546936, -0.8183676600456238, -0.794537365436554, -0.7707071304321289, -0.7468768358230591, -0.7230465412139893, -0.6992162466049194, -0.6753859519958496, -0.6515556573867798, -0.62772536277771, -0.6038950681686401, -0.5800647735595703, -0.5562345385551453, -0.5324042439460754, -0.5085739493370056, -0.4847436547279358, -0.46091341972351074, -0.4370831251144409, -0.4132528603076935, -0.38942256569862366, -0.3655923008918762, -0.3417620062828064, -0.3179317116737366, -0.29410141706466675, -0.2702711522579193, -0.24644087255001068, -0.22261059284210205, -0.19878029823303223, -0.1749500185251236, -0.15111973881721497, -0.12728944420814514, -0.10345916450023651, -0.0796288251876831, -0.05579854175448418, -0.03196825832128525, -0.00813797116279602, 0.01569230854511261, 0.03952258825302124, 0.06335288286209106, 0.0871831625699997, 0.11101344227790833, 0.13484372198581696, 0.15867400169372559, 0.1825042963027954, 0.20633457601070404, 0.23016485571861267, 0.2539951503276825, 0.27782541513442993, 0.30165570974349976, 0.3254860043525696, 0.349316269159317, 0.37314656376838684, 0.3969768285751343, 0.4208071231842041, 0.4446374177932739, 0.46846771240234375, 0.4922979772090912, 0.5161282420158386, 0.5399585366249084, 0.5637888312339783, 0.5876191258430481, 0.6114493608474731, 0.635279655456543, 0.6591099500656128, 0.6829402446746826]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 11.0, 13.0, 17.0, 22.0, 40.0, 56.0, 71.0, 92.0, 96.0, 118.0, 97.0, 102.0, 85.0, 66.0, 38.0, 35.0, 16.0, 11.0, 8.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0726318359375, -0.06878089904785156, -0.06492996215820312, -0.06107902526855469, -0.05722808837890625, -0.05337715148925781, -0.049526214599609375, -0.04567527770996094, -0.0418243408203125, -0.03797340393066406, -0.034122467041015625, -0.030271530151367188, -0.02642059326171875, -0.022569656372070312, -0.018718719482421875, -0.014867782592773438, -0.011016845703125, -0.0071659088134765625, -0.003314971923828125, 0.0005359649658203125, 0.00438690185546875, 0.008237838745117188, 0.012088775634765625, 0.015939712524414062, 0.0197906494140625, 0.023641586303710938, 0.027492523193359375, 0.03134346008300781, 0.03519439697265625, 0.03904533386230469, 0.042896270751953125, 0.04674720764160156, 0.05059814453125, 0.05444908142089844, 0.058300018310546875, 0.06215095520019531, 0.06600189208984375, 0.06985282897949219, 0.07370376586914062, 0.07755470275878906, 0.0814056396484375, 0.08525657653808594, 0.08910751342773438, 0.09295845031738281, 0.09680938720703125, 0.10066032409667969, 0.10451126098632812, 0.10836219787597656, 0.112213134765625, 0.11606407165527344, 0.11991500854492188, 0.12376594543457031, 0.12761688232421875, 0.1314678192138672, 0.13531875610351562, 0.13916969299316406, 0.1430206298828125, 0.14687156677246094, 0.15072250366210938, 0.1545734405517578, 0.15842437744140625, 0.1622753143310547, 0.16612625122070312, 0.16997718811035156, 0.173828125]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 7.0, 2.0, 4.0, 16.0, 22.0, 32.0, 50.0, 72.0, 175.0, 334.0, 817.0, 2804.0, 12739.0, 75737.0, 306130.0, 103090.0, 16722.0, 3654.0, 1044.0, 381.0, 191.0, 93.0, 62.0, 35.0, 23.0, 5.0, 8.0, 4.0, 3.0, 1.0, 6.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.78271484375, -0.7553253173828125, -0.727935791015625, -0.7005462646484375, -0.67315673828125, -0.6457672119140625, -0.618377685546875, -0.5909881591796875, -0.5635986328125, -0.5362091064453125, -0.508819580078125, -0.4814300537109375, -0.45404052734375, -0.4266510009765625, -0.399261474609375, -0.3718719482421875, -0.344482421875, -0.3170928955078125, -0.289703369140625, -0.2623138427734375, -0.23492431640625, -0.2075347900390625, -0.180145263671875, -0.1527557373046875, -0.1253662109375, -0.0979766845703125, -0.070587158203125, -0.0431976318359375, -0.01580810546875, 0.0115814208984375, 0.038970947265625, 0.0663604736328125, 0.09375, 0.1211395263671875, 0.148529052734375, 0.1759185791015625, 0.20330810546875, 0.2306976318359375, 0.258087158203125, 0.2854766845703125, 0.3128662109375, 0.3402557373046875, 0.367645263671875, 0.3950347900390625, 0.42242431640625, 0.4498138427734375, 0.477203369140625, 0.5045928955078125, 0.531982421875, 0.5593719482421875, 0.586761474609375, 0.6141510009765625, 0.64154052734375, 0.6689300537109375, 0.696319580078125, 0.7237091064453125, 0.7510986328125, 0.7784881591796875, 0.805877685546875, 0.8332672119140625, 0.86065673828125, 0.8880462646484375, 0.915435791015625, 0.9428253173828125, 0.97021484375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 7.0, 4.0, 4.0, 7.0, 15.0, 8.0, 17.0, 16.0, 14.0, 32.0, 26.0, 39.0, 56.0, 61.0, 47.0, 52.0, 77.0, 61.0, 59.0, 76.0, 56.0, 47.0, 39.0, 35.0, 26.0, 27.0, 17.0, 18.0, 9.0, 13.0, 6.0, 9.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0771484375, -0.07456493377685547, -0.07198143005371094, -0.0693979263305664, -0.06681442260742188, -0.06423091888427734, -0.06164741516113281, -0.05906391143798828, -0.05648040771484375, -0.05389690399169922, -0.05131340026855469, -0.048729896545410156, -0.046146392822265625, -0.043562889099121094, -0.04097938537597656, -0.03839588165283203, -0.0358123779296875, -0.03322887420654297, -0.030645370483398438, -0.028061866760253906, -0.025478363037109375, -0.022894859313964844, -0.020311355590820312, -0.01772785186767578, -0.01514434814453125, -0.012560844421386719, -0.009977340698242188, -0.007393836975097656, -0.004810333251953125, -0.0022268295288085938, 0.0003566741943359375, 0.0029401779174804688, 0.005523681640625, 0.008107185363769531, 0.010690689086914062, 0.013274192810058594, 0.015857696533203125, 0.018441200256347656, 0.021024703979492188, 0.02360820770263672, 0.02619171142578125, 0.02877521514892578, 0.03135871887207031, 0.033942222595214844, 0.036525726318359375, 0.039109230041503906, 0.04169273376464844, 0.04427623748779297, 0.0468597412109375, 0.04944324493408203, 0.05202674865722656, 0.054610252380371094, 0.057193756103515625, 0.059777259826660156, 0.06236076354980469, 0.06494426727294922, 0.06752777099609375, 0.07011127471923828, 0.07269477844238281, 0.07527828216552734, 0.07786178588867188, 0.0804452896118164, 0.08302879333496094, 0.08561229705810547, 0.08819580078125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 5.0, 13.0, 18.0, 30.0, 88.0, 122.0, 93.0, 51.0, 22.0, 11.0, 11.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8101673722267151, -0.7868161201477051, -0.7634648680686951, -0.7401136159896851, -0.7167624235153198, -0.6934111714363098, -0.6700599193572998, -0.6467086672782898, -0.6233574151992798, -0.6000061631202698, -0.5766549110412598, -0.5533036589622498, -0.5299524068832397, -0.5066012144088745, -0.4832499623298645, -0.4598987102508545, -0.4365474581718445, -0.4131962060928345, -0.38984495401382446, -0.36649373173713684, -0.34314247965812683, -0.3197912275791168, -0.2964400053024292, -0.2730887532234192, -0.24973750114440918, -0.22638624906539917, -0.20303501188755035, -0.17968377470970154, -0.15633252263069153, -0.13298127055168152, -0.1096300333738327, -0.08627879619598389, -0.0629274845123291, -0.03957623988389969, -0.016224995255470276, 0.007126249372959137, 0.03047749400138855, 0.05382873862981796, 0.07717998325824738, 0.10053122043609619, 0.1238824725151062, 0.1472337245941162, 0.17058496177196503, 0.19393619894981384, 0.21728745102882385, 0.24063870310783386, 0.2639899253845215, 0.2873411774635315, 0.3106924295425415, 0.3340436816215515, 0.3573949337005615, 0.38074615597724915, 0.40409740805625916, 0.42744866013526917, 0.4507998824119568, 0.4741511344909668, 0.4975023865699768, 0.5208536386489868, 0.5442048907279968, 0.5675561428070068, 0.5909073352813721, 0.6142585873603821, 0.6376098394393921, 0.6609610915184021, 0.6843123435974121]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 0.0, 4.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 5.0, 5.0, 7.0, 6.0, 4.0, 8.0, 12.0, 18.0, 34.0, 55.0, 63.0, 63.0, 65.0, 52.0, 21.0, 14.0, 12.0, 6.0, 4.0, 1.0, 4.0, 3.0, 3.0, 1.0, 3.0, 0.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4378100037574768, -0.4249344766139984, -0.41205894947052, -0.39918339252471924, -0.38630786538124084, -0.37343233823776245, -0.36055681109428406, -0.34768128395080566, -0.3348057270050049, -0.3219301998615265, -0.3090546727180481, -0.2961791157722473, -0.2833035886287689, -0.2704280614852905, -0.25755253434181213, -0.24467700719833374, -0.23180148005485535, -0.21892595291137695, -0.20605041086673737, -0.19317488372325897, -0.18029934167861938, -0.167423814535141, -0.1545482873916626, -0.1416727602481842, -0.12879721820354462, -0.11592168360948563, -0.10304614901542664, -0.09017062187194824, -0.07729508727788925, -0.06441955268383026, -0.05154402554035187, -0.03866849094629288, -0.025792956352233887, -0.012917423620820045, -4.1890889406204224e-05, 0.012833639979362488, 0.02570917457342148, 0.03858470916748047, 0.05146023631095886, 0.06433577090501785, 0.07721130549907684, 0.09008684009313583, 0.10296237468719482, 0.11583790183067322, 0.1287134289741516, 0.1415889710187912, 0.1544644981622696, 0.16734004020690918, 0.18021556735038757, 0.19309109449386597, 0.20596663653850555, 0.21884216368198395, 0.23171770572662354, 0.24459323287010193, 0.2574687600135803, 0.2703442871570587, 0.2832198143005371, 0.2960953414440155, 0.3089708685874939, 0.3218464255332947, 0.33472195267677307, 0.34759747982025146, 0.36047300696372986, 0.37334853410720825, 0.38622409105300903]}, "eval/loss": 0.309664785861969, "eval/wer": 0.09321697738992463, "eval/runtime": 583.4014, "eval/samples_per_second": 4.529, "eval/steps_per_second": 0.567, "train/train_runtime": 27349.9818, "train/train_samples_per_second": 5.217, "train/train_steps_per_second": 0.082, "train/total_flos": 0.0, "train/train_loss": 1.4829948718221064} \ No newline at end of file +{"train/loss": 0.1199, "train/learning_rate": 6.936416184971098e-07, "train/epoch": 5.0, "train/global_step": 2230, "_runtime": 28158, "_timestamp": 1647994913, "_step": 2235, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 12.0, 56.0, 279.0, 497.0, 140.0, 30.0, 5.0], "bins": [-7.940925598144531, -7.809273719787598, -7.677621841430664, -7.5459699630737305, -7.414318084716797, -7.282666206359863, -7.15101432800293, -7.019362449645996, -6.8877105712890625, -6.756058692932129, -6.624406814575195, -6.492754936218262, -6.361103057861328, -6.2294511795043945, -6.097799301147461, -5.966147422790527, -5.834495544433594, -5.70284366607666, -5.571191787719727, -5.439539909362793, -5.307888031005859, -5.176236152648926, -5.044584274291992, -4.912932395935059, -4.781280517578125, -4.649628639221191, -4.517976760864258, -4.386324882507324, -4.254673004150391, -4.123021125793457, -3.9913692474365234, -3.85971736907959, -3.728065013885498, -3.5964131355285645, -3.464761257171631, -3.3331093788146973, -3.2014575004577637, -3.06980562210083, -2.9381537437438965, -2.806501865386963, -2.6748499870300293, -2.5431981086730957, -2.411546230316162, -2.2798943519592285, -2.148242473602295, -2.0165905952453613, -1.8849387168884277, -1.7532868385314941, -1.62163507938385, -1.4899832010269165, -1.358331322669983, -1.2266794443130493, -1.0950275659561157, -0.9633756875991821, -0.8317238092422485, -0.7000719308853149, -0.5684200525283813, -0.43676817417144775, -0.30511629581451416, -0.17346441745758057, -0.04181253910064697, 0.08983933925628662, 0.22149121761322021, 0.3531430959701538, 0.4847949743270874]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 5.0, 3.0, 6.0, 2.0, 5.0, 9.0, 10.0, 15.0, 12.0, 17.0, 16.0, 22.0, 29.0, 39.0, 28.0, 36.0, 29.0, 35.0, 38.0, 45.0, 62.0, 45.0, 49.0, 48.0, 51.0, 40.0, 45.0, 43.0, 33.0, 29.0, 31.0, 30.0, 21.0, 16.0, 17.0, 14.0, 10.0, 9.0, 5.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4662081003189087, -0.44751691818237305, -0.4288257360458374, -0.41013455390930176, -0.3914433717727661, -0.37275218963623047, -0.35406097769737244, -0.3353697955608368, -0.31667861342430115, -0.2979874312877655, -0.27929624915122986, -0.2606050670146942, -0.24191386997699738, -0.22322268784046173, -0.2045314908027649, -0.18584030866622925, -0.1671491265296936, -0.14845794439315796, -0.12976676225662231, -0.11107556521892548, -0.09238438308238983, -0.07369320094585419, -0.055002011358737946, -0.036310821771621704, -0.01761963963508606, 0.0010715462267398834, 0.019762732088565826, 0.03845391795039177, 0.05714510381221771, 0.07583628594875336, 0.0945274755358696, 0.11321866512298584, 0.13190990686416626, 0.1506010890007019, 0.16929227113723755, 0.1879834681749344, 0.20667465031147003, 0.22536583244800568, 0.24405702948570251, 0.26274821162223816, 0.2814393937587738, 0.30013057589530945, 0.3188217580318451, 0.33751294016838074, 0.35620415210723877, 0.3748953342437744, 0.39358651638031006, 0.4122776985168457, 0.43096888065338135, 0.449660062789917, 0.46835124492645264, 0.4870424270629883, 0.5057336091995239, 0.5244247913360596, 0.5431159734725952, 0.5618071556091309, 0.5804983377456665, 0.5991895198822021, 0.6178807020187378, 0.6365718841552734, 0.6552630662918091, 0.6739542484283447, 0.6926454305648804, 0.711336612701416, 0.7300278544425964]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 0.0, 2.0, 4.0, 6.0, 8.0, 7.0, 15.0, 12.0, 27.0, 27.0, 51.0, 58.0, 97.0, 154.0, 252.0, 420.0, 743.0, 1437.0, 3148.0, 8260.0, 35352.0, 952590.0, 3075218.0, 95395.0, 12498.0, 4388.0, 1911.0, 942.0, 493.0, 251.0, 183.0, 104.0, 56.0, 47.0, 33.0, 32.0, 8.0, 18.0, 9.0, 7.0, 7.0, 3.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.841796875, -2.753509521484375, -2.66522216796875, -2.576934814453125, -2.4886474609375, -2.400360107421875, -2.31207275390625, -2.223785400390625, -2.135498046875, -2.047210693359375, -1.95892333984375, -1.870635986328125, -1.7823486328125, -1.694061279296875, -1.60577392578125, -1.517486572265625, -1.42919921875, -1.340911865234375, -1.25262451171875, -1.164337158203125, -1.0760498046875, -0.987762451171875, -0.89947509765625, -0.811187744140625, -0.722900390625, -0.634613037109375, -0.54632568359375, -0.458038330078125, -0.3697509765625, -0.281463623046875, -0.19317626953125, -0.104888916015625, -0.0166015625, 0.071685791015625, 0.15997314453125, 0.248260498046875, 0.3365478515625, 0.424835205078125, 0.51312255859375, 0.601409912109375, 0.689697265625, 0.777984619140625, 0.86627197265625, 0.954559326171875, 1.0428466796875, 1.131134033203125, 1.21942138671875, 1.307708740234375, 1.39599609375, 1.484283447265625, 1.57257080078125, 1.660858154296875, 1.7491455078125, 1.837432861328125, 1.92572021484375, 2.014007568359375, 2.102294921875, 2.190582275390625, 2.27886962890625, 2.367156982421875, 2.4554443359375, 2.543731689453125, 2.63201904296875, 2.720306396484375, 2.80859375]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 7.0, 8.0, 10.0, 4.0, 10.0, 13.0, 10.0, 15.0, 26.0, 12.0, 29.0, 26.0, 29.0, 19.0, 31.0, 37.0, 31.0, 38.0, 52.0, 48.0, 44.0, 45.0, 49.0, 38.0, 35.0, 44.0, 37.0, 35.0, 36.0, 31.0, 20.0, 26.0, 24.0, 19.0, 10.0, 16.0, 10.0, 9.0, 7.0, 6.0, 5.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.87841796875, -0.8500137329101562, -0.8216094970703125, -0.7932052612304688, -0.764801025390625, -0.7363967895507812, -0.7079925537109375, -0.6795883178710938, -0.65118408203125, -0.6227798461914062, -0.5943756103515625, -0.5659713745117188, -0.537567138671875, -0.5091629028320312, -0.4807586669921875, -0.45235443115234375, -0.4239501953125, -0.39554595947265625, -0.3671417236328125, -0.33873748779296875, -0.310333251953125, -0.28192901611328125, -0.2535247802734375, -0.22512054443359375, -0.19671630859375, -0.16831207275390625, -0.1399078369140625, -0.11150360107421875, -0.083099365234375, -0.05469512939453125, -0.0262908935546875, 0.00211334228515625, 0.030517578125, 0.05892181396484375, 0.0873260498046875, 0.11573028564453125, 0.144134521484375, 0.17253875732421875, 0.2009429931640625, 0.22934722900390625, 0.25775146484375, 0.28615570068359375, 0.3145599365234375, 0.34296417236328125, 0.371368408203125, 0.39977264404296875, 0.4281768798828125, 0.45658111572265625, 0.4849853515625, 0.5133895874023438, 0.5417938232421875, 0.5701980590820312, 0.598602294921875, 0.6270065307617188, 0.6554107666015625, 0.6838150024414062, 0.71221923828125, 0.7406234741210938, 0.7690277099609375, 0.7974319458007812, 0.825836181640625, 0.8542404174804688, 0.8826446533203125, 0.9110488891601562, 0.939453125]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 4.0, 13.0, 18.0, 28.0, 46.0, 120.0, 245.0, 876.0, 3459606.0, 732161.0, 799.0, 164.0, 90.0, 37.0, 28.0, 21.0, 6.0, 3.0, 6.0, 2.0, 0.0, 5.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-22.125, -21.6102294921875, -21.095458984375, -20.5806884765625, -20.06591796875, -19.5511474609375, -19.036376953125, -18.5216064453125, -18.0068359375, -17.4920654296875, -16.977294921875, -16.4625244140625, -15.94775390625, -15.4329833984375, -14.918212890625, -14.4034423828125, -13.888671875, -13.3739013671875, -12.859130859375, -12.3443603515625, -11.82958984375, -11.3148193359375, -10.800048828125, -10.2852783203125, -9.7705078125, -9.2557373046875, -8.740966796875, -8.2261962890625, -7.71142578125, -7.1966552734375, -6.681884765625, -6.1671142578125, -5.65234375, -5.1375732421875, -4.622802734375, -4.1080322265625, -3.59326171875, -3.0784912109375, -2.563720703125, -2.0489501953125, -1.5341796875, -1.0194091796875, -0.504638671875, 0.0101318359375, 0.52490234375, 1.0396728515625, 1.554443359375, 2.0692138671875, 2.583984375, 3.0987548828125, 3.613525390625, 4.1282958984375, 4.64306640625, 5.1578369140625, 5.672607421875, 6.1873779296875, 6.7021484375, 7.2169189453125, 7.731689453125, 8.2464599609375, 8.76123046875, 9.2760009765625, 9.790771484375, 10.3055419921875, 10.8203125]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 7.0, 15.0, 14.0, 27.0, 67.0, 102.0, 190.0, 681.0, 1946.0, 665.0, 165.0, 80.0, 41.0, 27.0, 20.0, 9.0, 7.0, 2.0, 4.0, 2.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2822265625, -1.2540359497070312, -1.2258453369140625, -1.1976547241210938, -1.169464111328125, -1.1412734985351562, -1.1130828857421875, -1.0848922729492188, -1.05670166015625, -1.0285110473632812, -1.0003204345703125, -0.9721298217773438, -0.943939208984375, -0.9157485961914062, -0.8875579833984375, -0.8593673706054688, -0.8311767578125, -0.8029861450195312, -0.7747955322265625, -0.7466049194335938, -0.718414306640625, -0.6902236938476562, -0.6620330810546875, -0.6338424682617188, -0.60565185546875, -0.5774612426757812, -0.5492706298828125, -0.5210800170898438, -0.492889404296875, -0.46469879150390625, -0.4365081787109375, -0.40831756591796875, -0.380126953125, -0.35193634033203125, -0.3237457275390625, -0.29555511474609375, -0.267364501953125, -0.23917388916015625, -0.2109832763671875, -0.18279266357421875, -0.15460205078125, -0.12641143798828125, -0.0982208251953125, -0.07003021240234375, -0.041839599609375, -0.01364898681640625, 0.0145416259765625, 0.04273223876953125, 0.0709228515625, 0.09911346435546875, 0.1273040771484375, 0.15549468994140625, 0.183685302734375, 0.21187591552734375, 0.2400665283203125, 0.26825714111328125, 0.29644775390625, 0.32463836669921875, 0.3528289794921875, 0.38101959228515625, 0.409210205078125, 0.43740081787109375, 0.4655914306640625, 0.49378204345703125, 0.52197265625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 2.0, 7.0, 11.0, 11.0, 8.0, 12.0, 24.0, 24.0, 36.0, 47.0, 53.0, 70.0, 79.0, 89.0, 98.0, 87.0, 70.0, 58.0, 48.0, 44.0, 30.0, 24.0, 14.0, 18.0, 13.0, 10.0, 7.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9769927263259888, -0.9347792863845825, -0.8925658464431763, -0.8503524661064148, -0.8081390261650085, -0.7659255862236023, -0.7237122058868408, -0.6814987659454346, -0.6392853260040283, -0.5970718860626221, -0.5548584461212158, -0.5126450657844543, -0.4704316258430481, -0.42821818590164185, -0.386004775762558, -0.3437913656234741, -0.30157792568206787, -0.2593644857406616, -0.21715107560157776, -0.1749376505613327, -0.13272422552108765, -0.09051080048084259, -0.048297375440597534, -0.006083965301513672, 0.03612947463989258, 0.07834289968013763, 0.12055632472038269, 0.16276974976062775, 0.2049831748008728, 0.24719659984111786, 0.2894100248813629, 0.3316234350204468, 0.3738369941711426, 0.41605043411254883, 0.4582638442516327, 0.5004772543907166, 0.5426906943321228, 0.584904134273529, 0.6271175146102905, 0.6693309545516968, 0.711544394493103, 0.7537578344345093, 0.7959712743759155, 0.838184654712677, 0.8803980946540833, 0.9226115345954895, 0.964824914932251, 1.0070383548736572, 1.0492517948150635, 1.0914652347564697, 1.133678674697876, 1.1758921146392822, 1.2181055545806885, 1.2603188753128052, 1.3025323152542114, 1.3447457551956177, 1.386959195137024, 1.4291726350784302, 1.4713860750198364, 1.5135995149612427, 1.5558128356933594, 1.5980262756347656, 1.6402397155761719, 1.6824531555175781, 1.7246665954589844]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 10.0, 8.0, 11.0, 10.0, 11.0, 15.0, 19.0, 12.0, 19.0, 28.0, 28.0, 28.0, 23.0, 36.0, 41.0, 44.0, 36.0, 31.0, 44.0, 47.0, 41.0, 46.0, 37.0, 35.0, 35.0, 35.0, 34.0, 33.0, 26.0, 28.0, 29.0, 26.0, 15.0, 15.0, 17.0, 13.0, 14.0, 10.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7832375168800354, -0.7575938701629639, -0.7319502830505371, -0.7063066363334656, -0.680662989616394, -0.6550193428993225, -0.629375696182251, -0.6037321090698242, -0.5780884623527527, -0.5524448156356812, -0.5268012285232544, -0.5011575818061829, -0.47551393508911133, -0.4498702883720398, -0.42422667145729065, -0.3985830545425415, -0.37293940782546997, -0.34729576110839844, -0.3216521441936493, -0.29600852727890015, -0.2703648805618286, -0.24472124874591827, -0.21907761693000793, -0.1934339851140976, -0.16779035329818726, -0.14214672148227692, -0.11650308966636658, -0.09085945785045624, -0.0652158260345459, -0.03957219421863556, -0.01392856240272522, 0.01171506941318512, 0.037358641624450684, 0.06300227344036102, 0.08864590525627136, 0.1142895370721817, 0.13993316888809204, 0.16557680070400238, 0.19122043251991272, 0.21686406433582306, 0.2425076961517334, 0.26815134286880493, 0.2937949597835541, 0.3194385766983032, 0.34508222341537476, 0.3707258701324463, 0.39636948704719543, 0.4220131039619446, 0.4476567506790161, 0.47330039739608765, 0.4989440143108368, 0.5245876312255859, 0.5502312779426575, 0.575874924659729, 0.6015185117721558, 0.6271621584892273, 0.6528058052062988, 0.6784494519233704, 0.7040930986404419, 0.7297366857528687, 0.7553803324699402, 0.7810239791870117, 0.8066675662994385, 0.83231121301651, 0.8579548597335815]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 4.0, 12.0, 8.0, 31.0, 29.0, 40.0, 50.0, 84.0, 139.0, 185.0, 251.0, 369.0, 555.0, 753.0, 1155.0, 1643.0, 2561.0, 3756.0, 5780.0, 8996.0, 14705.0, 24379.0, 43156.0, 80441.0, 171793.0, 311438.0, 179636.0, 84756.0, 44890.0, 25105.0, 14985.0, 9146.0, 5832.0, 3889.0, 2508.0, 1682.0, 1156.0, 848.0, 535.0, 408.0, 258.0, 189.0, 131.0, 87.0, 62.0, 44.0, 25.0, 19.0, 20.0, 11.0, 9.0, 6.0, 6.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.397216796875, -0.3850059509277344, -0.37279510498046875, -0.3605842590332031, -0.3483734130859375, -0.3361625671386719, -0.32395172119140625, -0.3117408752441406, -0.299530029296875, -0.2873191833496094, -0.27510833740234375, -0.2628974914550781, -0.2506866455078125, -0.23847579956054688, -0.22626495361328125, -0.21405410766601562, -0.20184326171875, -0.18963241577148438, -0.17742156982421875, -0.16521072387695312, -0.1529998779296875, -0.14078903198242188, -0.12857818603515625, -0.11636734008789062, -0.104156494140625, -0.09194564819335938, -0.07973480224609375, -0.06752395629882812, -0.0553131103515625, -0.043102264404296875, -0.03089141845703125, -0.018680572509765625, -0.0064697265625, 0.005741119384765625, 0.01795196533203125, 0.030162811279296875, 0.0423736572265625, 0.054584503173828125, 0.06679534912109375, 0.07900619506835938, 0.091217041015625, 0.10342788696289062, 0.11563873291015625, 0.12784957885742188, 0.1400604248046875, 0.15227127075195312, 0.16448211669921875, 0.17669296264648438, 0.18890380859375, 0.20111465454101562, 0.21332550048828125, 0.22553634643554688, 0.2377471923828125, 0.24995803833007812, 0.26216888427734375, 0.2743797302246094, 0.286590576171875, 0.2988014221191406, 0.31101226806640625, 0.3232231140136719, 0.3354339599609375, 0.3476448059082031, 0.35985565185546875, 0.3720664978027344, 0.38427734375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 6.0, 2.0, 8.0, 6.0, 8.0, 9.0, 7.0, 14.0, 15.0, 21.0, 21.0, 18.0, 28.0, 31.0, 33.0, 24.0, 31.0, 38.0, 44.0, 43.0, 27.0, 45.0, 46.0, 45.0, 40.0, 46.0, 23.0, 39.0, 32.0, 41.0, 31.0, 36.0, 26.0, 21.0, 19.0, 13.0, 10.0, 9.0, 10.0, 10.0, 6.0, 9.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.467529296875, -0.4515571594238281, -0.43558502197265625, -0.4196128845214844, -0.4036407470703125, -0.3876686096191406, -0.37169647216796875, -0.3557243347167969, -0.339752197265625, -0.3237800598144531, -0.30780792236328125, -0.2918357849121094, -0.2758636474609375, -0.2598915100097656, -0.24391937255859375, -0.22794723510742188, -0.21197509765625, -0.19600296020507812, -0.18003082275390625, -0.16405868530273438, -0.1480865478515625, -0.13211441040039062, -0.11614227294921875, -0.10017013549804688, -0.084197998046875, -0.06822586059570312, -0.05225372314453125, -0.036281585693359375, -0.0203094482421875, -0.004337310791015625, 0.01163482666015625, 0.027606964111328125, 0.0435791015625, 0.059551239013671875, 0.07552337646484375, 0.09149551391601562, 0.1074676513671875, 0.12343978881835938, 0.13941192626953125, 0.15538406372070312, 0.171356201171875, 0.18732833862304688, 0.20330047607421875, 0.21927261352539062, 0.2352447509765625, 0.2512168884277344, 0.26718902587890625, 0.2831611633300781, 0.29913330078125, 0.3151054382324219, 0.33107757568359375, 0.3470497131347656, 0.3630218505859375, 0.3789939880371094, 0.39496612548828125, 0.4109382629394531, 0.426910400390625, 0.4428825378417969, 0.45885467529296875, 0.4748268127441406, 0.4907989501953125, 0.5067710876464844, 0.5227432250976562, 0.5387153625488281, 0.5546875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 10.0, 11.0, 15.0, 19.0, 25.0, 40.0, 50.0, 87.0, 121.0, 226.0, 393.0, 770.0, 1604.0, 4019.0, 11302.0, 38684.0, 175614.0, 592346.0, 167750.0, 37173.0, 10984.0, 3846.0, 1645.0, 757.0, 422.0, 216.0, 130.0, 82.0, 70.0, 45.0, 36.0, 21.0, 11.0, 4.0, 9.0, 4.0, 4.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6591796875, -0.6368255615234375, -0.614471435546875, -0.5921173095703125, -0.56976318359375, -0.5474090576171875, -0.525054931640625, -0.5027008056640625, -0.4803466796875, -0.4579925537109375, -0.435638427734375, -0.4132843017578125, -0.39093017578125, -0.3685760498046875, -0.346221923828125, -0.3238677978515625, -0.301513671875, -0.2791595458984375, -0.256805419921875, -0.2344512939453125, -0.21209716796875, -0.1897430419921875, -0.167388916015625, -0.1450347900390625, -0.1226806640625, -0.1003265380859375, -0.077972412109375, -0.0556182861328125, -0.03326416015625, -0.0109100341796875, 0.011444091796875, 0.0337982177734375, 0.05615234375, 0.0785064697265625, 0.100860595703125, 0.1232147216796875, 0.14556884765625, 0.1679229736328125, 0.190277099609375, 0.2126312255859375, 0.2349853515625, 0.2573394775390625, 0.279693603515625, 0.3020477294921875, 0.32440185546875, 0.3467559814453125, 0.369110107421875, 0.3914642333984375, 0.413818359375, 0.4361724853515625, 0.458526611328125, 0.4808807373046875, 0.50323486328125, 0.5255889892578125, 0.547943115234375, 0.5702972412109375, 0.5926513671875, 0.6150054931640625, 0.637359619140625, 0.6597137451171875, 0.68206787109375, 0.7044219970703125, 0.726776123046875, 0.7491302490234375, 0.771484375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 8.0, 2.0, 3.0, 5.0, 4.0, 9.0, 3.0, 15.0, 16.0, 16.0, 11.0, 18.0, 21.0, 20.0, 22.0, 34.0, 28.0, 31.0, 40.0, 30.0, 30.0, 52.0, 46.0, 31.0, 36.0, 37.0, 42.0, 42.0, 39.0, 35.0, 29.0, 35.0, 33.0, 25.0, 22.0, 22.0, 16.0, 12.0, 18.0, 12.0, 11.0, 10.0, 9.0, 7.0, 8.0, 4.0, 3.0, 3.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.97998046875, -0.9475173950195312, -0.9150543212890625, -0.8825912475585938, -0.850128173828125, -0.8176651000976562, -0.7852020263671875, -0.7527389526367188, -0.72027587890625, -0.6878128051757812, -0.6553497314453125, -0.6228866577148438, -0.590423583984375, -0.5579605102539062, -0.5254974365234375, -0.49303436279296875, -0.4605712890625, -0.42810821533203125, -0.3956451416015625, -0.36318206787109375, -0.330718994140625, -0.29825592041015625, -0.2657928466796875, -0.23332977294921875, -0.20086669921875, -0.16840362548828125, -0.1359405517578125, -0.10347747802734375, -0.071014404296875, -0.03855133056640625, -0.0060882568359375, 0.02637481689453125, 0.058837890625, 0.09130096435546875, 0.1237640380859375, 0.15622711181640625, 0.188690185546875, 0.22115325927734375, 0.2536163330078125, 0.28607940673828125, 0.31854248046875, 0.35100555419921875, 0.3834686279296875, 0.41593170166015625, 0.448394775390625, 0.48085784912109375, 0.5133209228515625, 0.5457839965820312, 0.5782470703125, 0.6107101440429688, 0.6431732177734375, 0.6756362915039062, 0.708099365234375, 0.7405624389648438, 0.7730255126953125, 0.8054885864257812, 0.83795166015625, 0.8704147338867188, 0.9028778076171875, 0.9353408813476562, 0.967803955078125, 1.0002670288085938, 1.0327301025390625, 1.0651931762695312, 1.09765625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 2.0, 5.0, 10.0, 9.0, 11.0, 20.0, 26.0, 41.0, 63.0, 89.0, 133.0, 236.0, 383.0, 614.0, 1075.0, 2224.0, 4633.0, 10843.0, 30540.0, 125972.0, 622456.0, 185615.0, 38995.0, 13142.0, 5604.0, 2588.0, 1322.0, 717.0, 435.0, 263.0, 167.0, 99.0, 58.0, 57.0, 30.0, 29.0, 14.0, 12.0, 6.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1253662109375, -0.12152099609375, -0.11767578125, -0.11383056640625, -0.1099853515625, -0.10614013671875, -0.102294921875, -0.09844970703125, -0.0946044921875, -0.09075927734375, -0.0869140625, -0.08306884765625, -0.0792236328125, -0.07537841796875, -0.071533203125, -0.06768798828125, -0.0638427734375, -0.05999755859375, -0.05615234375, -0.05230712890625, -0.0484619140625, -0.04461669921875, -0.040771484375, -0.03692626953125, -0.0330810546875, -0.02923583984375, -0.025390625, -0.02154541015625, -0.0177001953125, -0.01385498046875, -0.010009765625, -0.00616455078125, -0.0023193359375, 0.00152587890625, 0.00537109375, 0.00921630859375, 0.0130615234375, 0.01690673828125, 0.020751953125, 0.02459716796875, 0.0284423828125, 0.03228759765625, 0.0361328125, 0.03997802734375, 0.0438232421875, 0.04766845703125, 0.051513671875, 0.05535888671875, 0.0592041015625, 0.06304931640625, 0.06689453125, 0.07073974609375, 0.0745849609375, 0.07843017578125, 0.082275390625, 0.08612060546875, 0.0899658203125, 0.09381103515625, 0.09765625, 0.10150146484375, 0.1053466796875, 0.10919189453125, 0.113037109375, 0.11688232421875, 0.1207275390625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 3.0, 8.0, 7.0, 22.0, 24.0, 38.0, 94.0, 202.0, 280.0, 168.0, 66.0, 29.0, 17.0, 17.0, 6.0, 8.0, 4.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014853477478027344, -0.0001431051641702652, -0.00013767555356025696, -0.00013224594295024872, -0.00012681633234024048, -0.00012138672173023224, -0.000115957111120224, -0.00011052750051021576, -0.00010509788990020752, -9.966827929019928e-05, -9.423866868019104e-05, -8.88090580701828e-05, -8.337944746017456e-05, -7.794983685016632e-05, -7.252022624015808e-05, -6.709061563014984e-05, -6.16610050201416e-05, -5.623139441013336e-05, -5.080178380012512e-05, -4.537217319011688e-05, -3.994256258010864e-05, -3.45129519701004e-05, -2.9083341360092163e-05, -2.3653730750083923e-05, -1.8224120140075684e-05, -1.2794509530067444e-05, -7.364898920059204e-06, -1.9352883100509644e-06, 3.4943222999572754e-06, 8.923932909965515e-06, 1.4353543519973755e-05, 1.9783154129981995e-05, 2.5212764739990234e-05, 3.0642375349998474e-05, 3.6071985960006714e-05, 4.1501596570014954e-05, 4.693120718002319e-05, 5.236081779003143e-05, 5.779042840003967e-05, 6.322003901004791e-05, 6.864964962005615e-05, 7.407926023006439e-05, 7.950887084007263e-05, 8.493848145008087e-05, 9.036809206008911e-05, 9.579770267009735e-05, 0.00010122731328010559, 0.00010665692389011383, 0.00011208653450012207, 0.00011751614511013031, 0.00012294575572013855, 0.0001283753663301468, 0.00013380497694015503, 0.00013923458755016327, 0.0001446641981601715, 0.00015009380877017975, 0.000155523419380188, 0.00016095302999019623, 0.00016638264060020447, 0.0001718122512102127, 0.00017724186182022095, 0.0001826714724302292, 0.00018810108304023743, 0.00019353069365024567, 0.0001989603042602539]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 2.0, 3.0, 6.0, 9.0, 12.0, 12.0, 20.0, 26.0, 44.0, 53.0, 93.0, 163.0, 472.0, 1708.0, 9062.0, 84776.0, 867065.0, 74046.0, 8568.0, 1576.0, 383.0, 185.0, 83.0, 46.0, 38.0, 23.0, 15.0, 7.0, 10.0, 16.0, 8.0, 1.0, 1.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.255126953125, -0.24584197998046875, -0.2365570068359375, -0.22727203369140625, -0.217987060546875, -0.20870208740234375, -0.1994171142578125, -0.19013214111328125, -0.18084716796875, -0.17156219482421875, -0.1622772216796875, -0.15299224853515625, -0.143707275390625, -0.13442230224609375, -0.1251373291015625, -0.11585235595703125, -0.1065673828125, -0.09728240966796875, -0.0879974365234375, -0.07871246337890625, -0.069427490234375, -0.06014251708984375, -0.0508575439453125, -0.04157257080078125, -0.03228759765625, -0.02300262451171875, -0.0137176513671875, -0.00443267822265625, 0.004852294921875, 0.01413726806640625, 0.0234222412109375, 0.03270721435546875, 0.0419921875, 0.05127716064453125, 0.0605621337890625, 0.06984710693359375, 0.079132080078125, 0.08841705322265625, 0.0977020263671875, 0.10698699951171875, 0.11627197265625, 0.12555694580078125, 0.1348419189453125, 0.14412689208984375, 0.153411865234375, 0.16269683837890625, 0.1719818115234375, 0.18126678466796875, 0.1905517578125, 0.19983673095703125, 0.2091217041015625, 0.21840667724609375, 0.227691650390625, 0.23697662353515625, 0.2462615966796875, 0.25554656982421875, 0.26483154296875, 0.27411651611328125, 0.2834014892578125, 0.29268646240234375, 0.301971435546875, 0.31125640869140625, 0.3205413818359375, 0.32982635498046875, 0.339111328125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 8.0, 0.0, 3.0, 5.0, 6.0, 3.0, 6.0, 9.0, 7.0, 14.0, 17.0, 20.0, 32.0, 38.0, 49.0, 77.0, 86.0, 109.0, 104.0, 98.0, 79.0, 57.0, 52.0, 40.0, 15.0, 7.0, 9.0, 12.0, 5.0, 6.0, 7.0, 7.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0423583984375, -0.040851593017578125, -0.03934478759765625, -0.037837982177734375, -0.0363311767578125, -0.034824371337890625, -0.03331756591796875, -0.031810760498046875, -0.030303955078125, -0.028797149658203125, -0.02729034423828125, -0.025783538818359375, -0.0242767333984375, -0.022769927978515625, -0.02126312255859375, -0.019756317138671875, -0.01824951171875, -0.016742706298828125, -0.01523590087890625, -0.013729095458984375, -0.0122222900390625, -0.010715484619140625, -0.00920867919921875, -0.007701873779296875, -0.006195068359375, -0.004688262939453125, -0.00318145751953125, -0.001674652099609375, -0.0001678466796875, 0.001338958740234375, 0.00284576416015625, 0.004352569580078125, 0.005859375, 0.007366180419921875, 0.00887298583984375, 0.010379791259765625, 0.0118865966796875, 0.013393402099609375, 0.01490020751953125, 0.016407012939453125, 0.017913818359375, 0.019420623779296875, 0.02092742919921875, 0.022434234619140625, 0.0239410400390625, 0.025447845458984375, 0.02695465087890625, 0.028461456298828125, 0.02996826171875, 0.031475067138671875, 0.03298187255859375, 0.034488677978515625, 0.0359954833984375, 0.037502288818359375, 0.03900909423828125, 0.040515899658203125, 0.042022705078125, 0.043529510498046875, 0.04503631591796875, 0.046543121337890625, 0.0480499267578125, 0.049556732177734375, 0.05106353759765625, 0.052570343017578125, 0.0540771484375]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 6.0, 10.0, 13.0, 48.0, 138.0, 300.0, 284.0, 140.0, 53.0, 13.0, 6.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7234145402908325, -1.645379662513733, -1.5673447847366333, -1.4893099069595337, -1.411275029182434, -1.3332401514053345, -1.2552051544189453, -1.1771702766418457, -1.099135398864746, -1.0211005210876465, -0.9430656433105469, -0.8650307655334473, -0.7869958877563477, -0.708961009979248, -0.6309260725975037, -0.552891194820404, -0.4748563766479492, -0.3968214988708496, -0.31878662109375, -0.240751713514328, -0.1627168357372284, -0.08468195796012878, -0.006647050380706787, 0.07138782739639282, 0.14942270517349243, 0.22745758295059204, 0.30549246072769165, 0.38352736830711365, 0.46156224608421326, 0.5395971536636353, 0.6176320314407349, 0.6956669092178345, 0.7737016677856445, 0.8517365455627441, 0.9297714233398438, 1.0078063011169434, 1.085841178894043, 1.1638760566711426, 1.2419109344482422, 1.3199458122253418, 1.3979806900024414, 1.476015567779541, 1.5540504455566406, 1.6320853233337402, 1.7101202011108398, 1.7881550788879395, 1.866189956665039, 1.9442248344421387, 2.0222597122192383, 2.100294589996338, 2.1783294677734375, 2.256364345550537, 2.3343992233276367, 2.4124341011047363, 2.490468978881836, 2.5685038566589355, 2.6465389728546143, 2.724573850631714, 2.8026087284088135, 2.880643606185913, 2.9586784839630127, 3.0367133617401123, 3.114748239517212, 3.1927831172943115, 3.270817995071411]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 7.0, 5.0, 6.0, 10.0, 6.0, 13.0, 22.0, 14.0, 22.0, 17.0, 27.0, 28.0, 24.0, 36.0, 47.0, 33.0, 30.0, 47.0, 44.0, 42.0, 52.0, 45.0, 36.0, 32.0, 32.0, 45.0, 42.0, 34.0, 36.0, 32.0, 35.0, 24.0, 14.0, 12.0, 13.0, 11.0, 11.0, 10.0, 1.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.49540552496910095, -0.47856956720352173, -0.4617336094379425, -0.4448976516723633, -0.42806169390678406, -0.41122573614120483, -0.394389808177948, -0.3775538206100464, -0.36071789264678955, -0.3438819348812103, -0.3270459771156311, -0.3102100193500519, -0.29337406158447266, -0.27653810381889343, -0.2597021460533142, -0.24286620318889618, -0.22603023052215576, -0.20919427275657654, -0.19235831499099731, -0.1755223572254181, -0.15868639945983887, -0.14185044169425964, -0.1250144988298416, -0.10817854106426239, -0.09134258329868317, -0.07450662553310394, -0.05767067149281502, -0.04083471745252609, -0.02399875968694687, -0.007162801921367645, 0.009673148393630981, 0.026509106159210205, 0.043345093727111816, 0.06018105149269104, 0.07701700925827026, 0.09385295957326889, 0.11068891733884811, 0.12752488255500793, 0.14436082541942596, 0.1611967831850052, 0.1780327409505844, 0.19486869871616364, 0.21170465648174286, 0.2285405993461609, 0.2453765571117401, 0.26221251487731934, 0.27904847264289856, 0.2958844304084778, 0.312720388174057, 0.32955634593963623, 0.34639230370521545, 0.3632282614707947, 0.3800642192363739, 0.3969001770019531, 0.41373610496520996, 0.4305720925331116, 0.4474080204963684, 0.46424397826194763, 0.48107993602752686, 0.4979158937931061, 0.5147518515586853, 0.5315877795219421, 0.5484237670898438, 0.5652596950531006, 0.5820956826210022]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 6.0, 8.0, 12.0, 19.0, 17.0, 45.0, 47.0, 66.0, 95.0, 139.0, 223.0, 298.0, 400.0, 542.0, 805.0, 1194.0, 1783.0, 2511.0, 3643.0, 5385.0, 8093.0, 12271.0, 18494.0, 28566.0, 44604.0, 73856.0, 133460.0, 280382.0, 183934.0, 92881.0, 54460.0, 34101.0, 21735.0, 14236.0, 9588.0, 6459.0, 4417.0, 3087.0, 2124.0, 1389.0, 975.0, 658.0, 496.0, 311.0, 253.0, 135.0, 122.0, 72.0, 58.0, 38.0, 29.0, 13.0, 8.0, 9.0, 4.0, 5.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.1849365234375, -0.17910385131835938, -0.17327117919921875, -0.16743850708007812, -0.1616058349609375, -0.15577316284179688, -0.14994049072265625, -0.14410781860351562, -0.138275146484375, -0.13244247436523438, -0.12660980224609375, -0.12077713012695312, -0.1149444580078125, -0.10911178588867188, -0.10327911376953125, -0.09744644165039062, -0.09161376953125, -0.08578109741210938, -0.07994842529296875, -0.07411575317382812, -0.0682830810546875, -0.062450408935546875, -0.05661773681640625, -0.050785064697265625, -0.044952392578125, -0.039119720458984375, -0.03328704833984375, -0.027454376220703125, -0.0216217041015625, -0.015789031982421875, -0.00995635986328125, -0.004123687744140625, 0.001708984375, 0.007541656494140625, 0.01337432861328125, 0.019207000732421875, 0.0250396728515625, 0.030872344970703125, 0.03670501708984375, 0.042537689208984375, 0.048370361328125, 0.054203033447265625, 0.06003570556640625, 0.06586837768554688, 0.0717010498046875, 0.07753372192382812, 0.08336639404296875, 0.08919906616210938, 0.09503173828125, 0.10086441040039062, 0.10669708251953125, 0.11252975463867188, 0.1183624267578125, 0.12419509887695312, 0.13002777099609375, 0.13586044311523438, 0.141693115234375, 0.14752578735351562, 0.15335845947265625, 0.15919113159179688, 0.1650238037109375, 0.17085647583007812, 0.17668914794921875, 0.18252182006835938, 0.1883544921875]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 5.0, 4.0, 9.0, 10.0, 15.0, 11.0, 17.0, 23.0, 22.0, 12.0, 27.0, 16.0, 20.0, 21.0, 24.0, 36.0, 17.0, 36.0, 28.0, 41.0, 52.0, 61.0, 45.0, 36.0, 38.0, 33.0, 45.0, 31.0, 28.0, 22.0, 35.0, 24.0, 24.0, 18.0, 21.0, 17.0, 11.0, 11.0, 10.0, 9.0, 8.0, 7.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.353515625, -3.24029541015625, -3.1270751953125, -3.01385498046875, -2.900634765625, -2.78741455078125, -2.6741943359375, -2.56097412109375, -2.44775390625, -2.33453369140625, -2.2213134765625, -2.10809326171875, -1.994873046875, -1.88165283203125, -1.7684326171875, -1.65521240234375, -1.5419921875, -1.42877197265625, -1.3155517578125, -1.20233154296875, -1.089111328125, -0.97589111328125, -0.8626708984375, -0.74945068359375, -0.63623046875, -0.52301025390625, -0.4097900390625, -0.29656982421875, -0.183349609375, -0.07012939453125, 0.0430908203125, 0.15631103515625, 0.26953125, 0.38275146484375, 0.4959716796875, 0.60919189453125, 0.722412109375, 0.83563232421875, 0.9488525390625, 1.06207275390625, 1.17529296875, 1.28851318359375, 1.4017333984375, 1.51495361328125, 1.628173828125, 1.74139404296875, 1.8546142578125, 1.96783447265625, 2.0810546875, 2.19427490234375, 2.3074951171875, 2.42071533203125, 2.533935546875, 2.64715576171875, 2.7603759765625, 2.87359619140625, 2.98681640625, 3.10003662109375, 3.2132568359375, 3.32647705078125, 3.439697265625, 3.55291748046875, 3.6661376953125, 3.77935791015625, 3.892578125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 2.0, 3.0, 2.0, 4.0, 4.0, 12.0, 9.0, 18.0, 22.0, 19.0, 22.0, 28.0, 30.0, 32.0, 46.0, 62.0, 80.0, 105.0, 150.0, 305.0, 827.0, 15270.0, 1017048.0, 12811.0, 744.0, 322.0, 138.0, 109.0, 56.0, 55.0, 43.0, 34.0, 23.0, 28.0, 19.0, 11.0, 12.0, 10.0, 5.0, 14.0, 4.0, 4.0, 4.0, 2.0, 5.0, 0.0, 1.0, 2.0, 0.0, 3.0], "bins": [-3.357421875, -3.265411376953125, -3.17340087890625, -3.081390380859375, -2.9893798828125, -2.897369384765625, -2.80535888671875, -2.713348388671875, -2.621337890625, -2.529327392578125, -2.43731689453125, -2.345306396484375, -2.2532958984375, -2.161285400390625, -2.06927490234375, -1.977264404296875, -1.88525390625, -1.793243408203125, -1.70123291015625, -1.609222412109375, -1.5172119140625, -1.425201416015625, -1.33319091796875, -1.241180419921875, -1.149169921875, -1.057159423828125, -0.96514892578125, -0.873138427734375, -0.7811279296875, -0.689117431640625, -0.59710693359375, -0.505096435546875, -0.4130859375, -0.321075439453125, -0.22906494140625, -0.137054443359375, -0.0450439453125, 0.046966552734375, 0.13897705078125, 0.230987548828125, 0.322998046875, 0.415008544921875, 0.50701904296875, 0.599029541015625, 0.6910400390625, 0.783050537109375, 0.87506103515625, 0.967071533203125, 1.05908203125, 1.151092529296875, 1.24310302734375, 1.335113525390625, 1.4271240234375, 1.519134521484375, 1.61114501953125, 1.703155517578125, 1.795166015625, 1.887176513671875, 1.97918701171875, 2.071197509765625, 2.1632080078125, 2.255218505859375, 2.34722900390625, 2.439239501953125, 2.53125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 1.0, 3.0, 2.0, 4.0, 5.0, 13.0, 12.0, 16.0, 20.0, 14.0, 26.0, 27.0, 17.0, 28.0, 37.0, 31.0, 35.0, 39.0, 28.0, 46.0, 40.0, 52.0, 53.0, 36.0, 47.0, 45.0, 33.0, 42.0, 28.0, 32.0, 29.0, 27.0, 22.0, 23.0, 19.0, 11.0, 9.0, 10.0, 7.0, 13.0, 4.0, 3.0, 5.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-4.75390625, -4.6231689453125, -4.492431640625, -4.3616943359375, -4.23095703125, -4.1002197265625, -3.969482421875, -3.8387451171875, -3.7080078125, -3.5772705078125, -3.446533203125, -3.3157958984375, -3.18505859375, -3.0543212890625, -2.923583984375, -2.7928466796875, -2.662109375, -2.5313720703125, -2.400634765625, -2.2698974609375, -2.13916015625, -2.0084228515625, -1.877685546875, -1.7469482421875, -1.6162109375, -1.4854736328125, -1.354736328125, -1.2239990234375, -1.09326171875, -0.9625244140625, -0.831787109375, -0.7010498046875, -0.5703125, -0.4395751953125, -0.308837890625, -0.1781005859375, -0.04736328125, 0.0833740234375, 0.214111328125, 0.3448486328125, 0.4755859375, 0.6063232421875, 0.737060546875, 0.8677978515625, 0.99853515625, 1.1292724609375, 1.260009765625, 1.3907470703125, 1.521484375, 1.6522216796875, 1.782958984375, 1.9136962890625, 2.04443359375, 2.1751708984375, 2.305908203125, 2.4366455078125, 2.5673828125, 2.6981201171875, 2.828857421875, 2.9595947265625, 3.09033203125, 3.2210693359375, 3.351806640625, 3.4825439453125, 3.61328125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 6.0, 6.0, 11.0, 17.0, 22.0, 25.0, 34.0, 49.0, 116.0, 174.0, 272.0, 488.0, 868.0, 1627.0, 3866.0, 14039.0, 894249.0, 116665.0, 9632.0, 3118.0, 1449.0, 718.0, 424.0, 255.0, 154.0, 74.0, 55.0, 35.0, 38.0, 18.0, 15.0, 12.0, 3.0, 5.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.2314453125, -0.22517013549804688, -0.21889495849609375, -0.21261978149414062, -0.2063446044921875, -0.20006942749023438, -0.19379425048828125, -0.18751907348632812, -0.181243896484375, -0.17496871948242188, -0.16869354248046875, -0.16241836547851562, -0.1561431884765625, -0.14986801147460938, -0.14359283447265625, -0.13731765747070312, -0.13104248046875, -0.12476730346679688, -0.11849212646484375, -0.11221694946289062, -0.1059417724609375, -0.09966659545898438, -0.09339141845703125, -0.08711624145507812, -0.080841064453125, -0.07456588745117188, -0.06829071044921875, -0.062015533447265625, -0.0557403564453125, -0.049465179443359375, -0.04319000244140625, -0.036914825439453125, -0.0306396484375, -0.024364471435546875, -0.01808929443359375, -0.011814117431640625, -0.0055389404296875, 0.000736236572265625, 0.00701141357421875, 0.013286590576171875, 0.019561767578125, 0.025836944580078125, 0.03211212158203125, 0.038387298583984375, 0.0446624755859375, 0.050937652587890625, 0.05721282958984375, 0.06348800659179688, 0.06976318359375, 0.07603836059570312, 0.08231353759765625, 0.08858871459960938, 0.0948638916015625, 0.10113906860351562, 0.10741424560546875, 0.11368942260742188, 0.119964599609375, 0.12623977661132812, 0.13251495361328125, 0.13879013061523438, 0.1450653076171875, 0.15134048461914062, 0.15761566162109375, 0.16389083862304688, 0.170166015625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 7.0, 8.0, 17.0, 32.0, 215.0, 595.0, 67.0, 20.0, 9.0, 7.0, 8.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5510787963867188e-05, -2.436526119709015e-05, -2.321973443031311e-05, -2.2074207663536072e-05, -2.0928680896759033e-05, -1.9783154129981995e-05, -1.8637627363204956e-05, -1.7492100596427917e-05, -1.634657382965088e-05, -1.520104706287384e-05, -1.4055520296096802e-05, -1.2909993529319763e-05, -1.1764466762542725e-05, -1.0618939995765686e-05, -9.473413228988647e-06, -8.327886462211609e-06, -7.18235969543457e-06, -6.036832928657532e-06, -4.891306161880493e-06, -3.7457793951034546e-06, -2.600252628326416e-06, -1.4547258615493774e-06, -3.0919909477233887e-07, 8.363276720046997e-07, 1.9818544387817383e-06, 3.127381205558777e-06, 4.2729079723358154e-06, 5.418434739112854e-06, 6.563961505889893e-06, 7.709488272666931e-06, 8.85501503944397e-06, 1.0000541806221008e-05, 1.1146068572998047e-05, 1.2291595339775085e-05, 1.3437122106552124e-05, 1.4582648873329163e-05, 1.57281756401062e-05, 1.687370240688324e-05, 1.801922917366028e-05, 1.9164755940437317e-05, 2.0310282707214355e-05, 2.1455809473991394e-05, 2.2601336240768433e-05, 2.374686300754547e-05, 2.489238977432251e-05, 2.603791654109955e-05, 2.7183443307876587e-05, 2.8328970074653625e-05, 2.9474496841430664e-05, 3.06200236082077e-05, 3.176555037498474e-05, 3.291107714176178e-05, 3.405660390853882e-05, 3.520213067531586e-05, 3.6347657442092896e-05, 3.7493184208869934e-05, 3.863871097564697e-05, 3.978423774242401e-05, 4.092976450920105e-05, 4.207529127597809e-05, 4.322081804275513e-05, 4.4366344809532166e-05, 4.5511871576309204e-05, 4.665739834308624e-05, 4.780292510986328e-05]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 12.0, 21.0, 24.0, 21.0, 49.0, 80.0, 103.0, 195.0, 479.0, 973.0, 2485.0, 10857.0, 992173.0, 34409.0, 4017.0, 1347.0, 625.0, 278.0, 170.0, 57.0, 54.0, 38.0, 37.0, 17.0, 12.0, 3.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.3642578125, -0.353759765625, -0.34326171875, -0.332763671875, -0.322265625, -0.311767578125, -0.30126953125, -0.290771484375, -0.2802734375, -0.269775390625, -0.25927734375, -0.248779296875, -0.23828125, -0.227783203125, -0.21728515625, -0.206787109375, -0.1962890625, -0.185791015625, -0.17529296875, -0.164794921875, -0.154296875, -0.143798828125, -0.13330078125, -0.122802734375, -0.1123046875, -0.101806640625, -0.09130859375, -0.080810546875, -0.0703125, -0.059814453125, -0.04931640625, -0.038818359375, -0.0283203125, -0.017822265625, -0.00732421875, 0.003173828125, 0.013671875, 0.024169921875, 0.03466796875, 0.045166015625, 0.0556640625, 0.066162109375, 0.07666015625, 0.087158203125, 0.09765625, 0.108154296875, 0.11865234375, 0.129150390625, 0.1396484375, 0.150146484375, 0.16064453125, 0.171142578125, 0.181640625, 0.192138671875, 0.20263671875, 0.213134765625, 0.2236328125, 0.234130859375, 0.24462890625, 0.255126953125, 0.265625, 0.276123046875, 0.28662109375, 0.297119140625, 0.3076171875]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 15.0, 33.0, 88.0, 694.0, 93.0, 32.0, 20.0, 6.0, 4.0, 4.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.145263671875, -0.14129066467285156, -0.13731765747070312, -0.1333446502685547, -0.12937164306640625, -0.1253986358642578, -0.12142562866210938, -0.11745262145996094, -0.1134796142578125, -0.10950660705566406, -0.10553359985351562, -0.10156059265136719, -0.09758758544921875, -0.09361457824707031, -0.08964157104492188, -0.08566856384277344, -0.081695556640625, -0.07772254943847656, -0.07374954223632812, -0.06977653503417969, -0.06580352783203125, -0.06183052062988281, -0.057857513427734375, -0.05388450622558594, -0.0499114990234375, -0.04593849182128906, -0.041965484619140625, -0.03799247741699219, -0.03401947021484375, -0.030046463012695312, -0.026073455810546875, -0.022100448608398438, -0.01812744140625, -0.014154434204101562, -0.010181427001953125, -0.0062084197998046875, -0.00223541259765625, 0.0017375946044921875, 0.005710601806640625, 0.009683609008789062, 0.0136566162109375, 0.017629623413085938, 0.021602630615234375, 0.025575637817382812, 0.02954864501953125, 0.03352165222167969, 0.037494659423828125, 0.04146766662597656, 0.045440673828125, 0.04941368103027344, 0.053386688232421875, 0.05735969543457031, 0.06133270263671875, 0.06530570983886719, 0.06927871704101562, 0.07325172424316406, 0.0772247314453125, 0.08119773864746094, 0.08517074584960938, 0.08914375305175781, 0.09311676025390625, 0.09708976745605469, 0.10106277465820312, 0.10503578186035156, 0.1090087890625]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 26.0, 929.0, 67.0, 0.0, 0.0, 1.0], "bins": [-40.947471618652344, -40.26072311401367, -39.573974609375, -38.887229919433594, -38.20048141479492, -37.51373291015625, -36.82698440551758, -36.140235900878906, -35.453487396240234, -34.76673889160156, -34.07999038696289, -33.39324188232422, -32.70649719238281, -32.01974868774414, -31.33300018310547, -30.646251678466797, -29.959505081176758, -29.272756576538086, -28.586009979248047, -27.899261474609375, -27.212512969970703, -26.52576446533203, -25.839017868041992, -25.15226936340332, -24.46552276611328, -23.77877426147461, -23.09202766418457, -22.4052791595459, -21.718530654907227, -21.031784057617188, -20.345035552978516, -19.658287048339844, -18.971540451049805, -18.284791946411133, -17.598045349121094, -16.911296844482422, -16.22454833984375, -15.537800788879395, -14.851053237915039, -14.164304733276367, -13.477556228637695, -12.79080867767334, -12.104060173034668, -11.417312622070312, -10.73056411743164, -10.043816566467285, -9.35706901550293, -8.670320510864258, -7.9835734367370605, -7.296825408935547, -6.610077857971191, -5.923329830169678, -5.236581802368164, -4.54983377456665, -3.863086223602295, -3.1763381958007812, -2.4895901679992676, -1.8028422594070435, -1.1160943508148193, -0.42934656143188477, 0.2574014663696289, 0.9441494941711426, 1.630897045135498, 2.3176450729370117, 3.0043931007385254]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 5.0, 5.0, 2.0, 8.0, 7.0, 12.0, 12.0, 14.0, 18.0, 22.0, 21.0, 28.0, 25.0, 21.0, 26.0, 33.0, 38.0, 40.0, 43.0, 43.0, 41.0, 40.0, 46.0, 50.0, 37.0, 35.0, 47.0, 24.0, 43.0, 27.0, 20.0, 29.0, 26.0, 24.0, 17.0, 17.0, 11.0, 8.0, 8.0, 12.0, 5.0, 4.0, 3.0, 1.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.156064033508301, -5.960081100463867, -5.764098644256592, -5.568115711212158, -5.372132778167725, -5.176150321960449, -4.980167388916016, -4.784184455871582, -4.588201999664307, -4.392219066619873, -4.196236610412598, -4.000253677368164, -3.8042709827423096, -3.608288288116455, -3.4123053550720215, -3.216322660446167, -3.0203397274017334, -2.824357032775879, -2.6283740997314453, -2.432391405105591, -2.2364087104797363, -2.0404257774353027, -1.8444430828094482, -1.6484603881835938, -1.4524775743484497, -1.2564947605133057, -1.0605120658874512, -0.8645292520523071, -0.6685464978218079, -0.4725637435913086, -0.27658092975616455, -0.08059823513031006, 0.11538457870483398, 0.31136733293533325, 0.5073500871658325, 0.7033329010009766, 0.8993156552314758, 1.095298409461975, 1.2912812232971191, 1.4872639179229736, 1.6832467317581177, 1.8792295455932617, 2.075212240219116, 2.2711949348449707, 2.4671778678894043, 2.663160562515259, 2.8591432571411133, 3.055126190185547, 3.2511088848114014, 3.447091579437256, 3.6430745124816895, 3.839057207107544, 4.035039901733398, 4.231022834777832, 4.427005767822266, 4.622988224029541, 4.818971157073975, 5.014954090118408, 5.210936546325684, 5.406919479370117, 5.602902412414551, 5.798884868621826, 5.99486780166626, 6.190850257873535, 6.386833190917969]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 1.0, 4.0, 2.0, 6.0, 4.0, 10.0, 8.0, 14.0, 13.0, 18.0, 24.0, 22.0, 26.0, 24.0, 50.0, 47.0, 87.0, 184.0, 441.0, 1176.0, 4386.0, 21286.0, 874982.0, 3238203.0, 43019.0, 7062.0, 1899.0, 622.0, 256.0, 109.0, 60.0, 41.0, 36.0, 35.0, 21.0, 19.0, 19.0, 17.0, 13.0, 8.0, 5.0, 5.0, 3.0, 7.0, 3.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.84375, -1.782623291015625, -1.72149658203125, -1.660369873046875, -1.5992431640625, -1.538116455078125, -1.47698974609375, -1.415863037109375, -1.354736328125, -1.293609619140625, -1.23248291015625, -1.171356201171875, -1.1102294921875, -1.049102783203125, -0.98797607421875, -0.926849365234375, -0.86572265625, -0.804595947265625, -0.74346923828125, -0.682342529296875, -0.6212158203125, -0.560089111328125, -0.49896240234375, -0.437835693359375, -0.376708984375, -0.315582275390625, -0.25445556640625, -0.193328857421875, -0.1322021484375, -0.071075439453125, -0.00994873046875, 0.051177978515625, 0.1123046875, 0.173431396484375, 0.23455810546875, 0.295684814453125, 0.3568115234375, 0.417938232421875, 0.47906494140625, 0.540191650390625, 0.601318359375, 0.662445068359375, 0.72357177734375, 0.784698486328125, 0.8458251953125, 0.906951904296875, 0.96807861328125, 1.029205322265625, 1.09033203125, 1.151458740234375, 1.21258544921875, 1.273712158203125, 1.3348388671875, 1.395965576171875, 1.45709228515625, 1.518218994140625, 1.579345703125, 1.640472412109375, 1.70159912109375, 1.762725830078125, 1.8238525390625, 1.884979248046875, 1.94610595703125, 2.007232666015625, 2.068359375]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 11.0, 14.0, 9.0, 14.0, 15.0, 17.0, 20.0, 29.0, 35.0, 44.0, 47.0, 39.0, 52.0, 54.0, 61.0, 56.0, 50.0, 67.0, 56.0, 51.0, 57.0, 40.0, 38.0, 32.0, 24.0, 14.0, 19.0, 12.0, 9.0, 7.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.447998046875, -0.4272346496582031, -0.40647125244140625, -0.3857078552246094, -0.3649444580078125, -0.3441810607910156, -0.32341766357421875, -0.3026542663574219, -0.281890869140625, -0.2611274719238281, -0.24036407470703125, -0.21960067749023438, -0.1988372802734375, -0.17807388305664062, -0.15731048583984375, -0.13654708862304688, -0.11578369140625, -0.09502029418945312, -0.07425689697265625, -0.053493499755859375, -0.0327301025390625, -0.011966705322265625, 0.00879669189453125, 0.029560089111328125, 0.050323486328125, 0.07108688354492188, 0.09185028076171875, 0.11261367797851562, 0.1333770751953125, 0.15414047241210938, 0.17490386962890625, 0.19566726684570312, 0.2164306640625, 0.23719406127929688, 0.25795745849609375, 0.2787208557128906, 0.2994842529296875, 0.3202476501464844, 0.34101104736328125, 0.3617744445800781, 0.382537841796875, 0.4033012390136719, 0.42406463623046875, 0.4448280334472656, 0.4655914306640625, 0.4863548278808594, 0.5071182250976562, 0.5278816223144531, 0.54864501953125, 0.5694084167480469, 0.5901718139648438, 0.6109352111816406, 0.6316986083984375, 0.6524620056152344, 0.6732254028320312, 0.6939888000488281, 0.714752197265625, 0.7355155944824219, 0.7562789916992188, 0.7770423889160156, 0.7978057861328125, 0.8185691833496094, 0.8393325805664062, 0.8600959777832031, 0.880859375]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 8.0, 22.0, 101.0, 4193788.0, 310.0, 37.0, 11.0, 11.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.2421875, -13.4971923828125, -11.752197265625, -10.0072021484375, -8.26220703125, -6.5172119140625, -4.772216796875, -3.0272216796875, -1.2822265625, 0.4627685546875, 2.207763671875, 3.9527587890625, 5.69775390625, 7.4427490234375, 9.187744140625, 10.9327392578125, 12.677734375, 14.4227294921875, 16.167724609375, 17.9127197265625, 19.65771484375, 21.4027099609375, 23.147705078125, 24.8927001953125, 26.6376953125, 28.3826904296875, 30.127685546875, 31.8726806640625, 33.61767578125, 35.3626708984375, 37.107666015625, 38.8526611328125, 40.59765625, 42.3426513671875, 44.087646484375, 45.8326416015625, 47.57763671875, 49.3226318359375, 51.067626953125, 52.8126220703125, 54.5576171875, 56.3026123046875, 58.047607421875, 59.7926025390625, 61.53759765625, 63.2825927734375, 65.027587890625, 66.7725830078125, 68.517578125, 70.2625732421875, 72.007568359375, 73.7525634765625, 75.49755859375, 77.2425537109375, 78.987548828125, 80.7325439453125, 82.4775390625, 84.2225341796875, 85.967529296875, 87.7125244140625, 89.45751953125, 91.2025146484375, 92.947509765625, 94.6925048828125, 96.4375]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 5.0, 7.0, 21.0, 21.0, 30.0, 39.0, 74.0, 127.0, 311.0, 957.0, 1422.0, 588.0, 196.0, 113.0, 62.0, 38.0, 26.0, 17.0, 10.0, 6.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.296875, -0.282928466796875, -0.26898193359375, -0.255035400390625, -0.2410888671875, -0.227142333984375, -0.21319580078125, -0.199249267578125, -0.185302734375, -0.171356201171875, -0.15740966796875, -0.143463134765625, -0.1295166015625, -0.115570068359375, -0.10162353515625, -0.087677001953125, -0.07373046875, -0.059783935546875, -0.04583740234375, -0.031890869140625, -0.0179443359375, -0.003997802734375, 0.00994873046875, 0.023895263671875, 0.037841796875, 0.051788330078125, 0.06573486328125, 0.079681396484375, 0.0936279296875, 0.107574462890625, 0.12152099609375, 0.135467529296875, 0.1494140625, 0.163360595703125, 0.17730712890625, 0.191253662109375, 0.2052001953125, 0.219146728515625, 0.23309326171875, 0.247039794921875, 0.260986328125, 0.274932861328125, 0.28887939453125, 0.302825927734375, 0.3167724609375, 0.330718994140625, 0.34466552734375, 0.358612060546875, 0.37255859375, 0.386505126953125, 0.40045166015625, 0.414398193359375, 0.4283447265625, 0.442291259765625, 0.45623779296875, 0.470184326171875, 0.484130859375, 0.498077392578125, 0.51202392578125, 0.525970458984375, 0.5399169921875, 0.553863525390625, 0.56781005859375, 0.581756591796875, 0.595703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 5.0, 4.0, 9.0, 15.0, 27.0, 42.0, 60.0, 104.0, 142.0, 186.0, 165.0, 99.0, 57.0, 31.0, 26.0, 23.0, 12.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5449100136756897, -0.5015302300453186, -0.4581504464149475, -0.4147706627845764, -0.3713908791542053, -0.32801109552383423, -0.28463128209114075, -0.24125149846076965, -0.19787171483039856, -0.15449193120002747, -0.11111214011907578, -0.06773234903812408, -0.02435256540775299, 0.019027218222618103, 0.06240701675415039, 0.10578680038452148, 0.14916658401489258, 0.19254636764526367, 0.23592615127563477, 0.27930593490600586, 0.32268571853637695, 0.36606550216674805, 0.40944531559944153, 0.4528250992298126, 0.4962048828601837, 0.5395846962928772, 0.5829644799232483, 0.6263442635536194, 0.6697240471839905, 0.7131038308143616, 0.7564836144447327, 0.7998633980751038, 0.8432432413101196, 0.8866230249404907, 0.9300028085708618, 0.9733825922012329, 1.016762375831604, 1.060142159461975, 1.1035219430923462, 1.1469017267227173, 1.1902815103530884, 1.2336612939834595, 1.2770410776138306, 1.3204208612442017, 1.3638006448745728, 1.4071804285049438, 1.450560212135315, 1.493939995765686, 1.5373198986053467, 1.5806996822357178, 1.6240794658660889, 1.66745924949646, 1.710839033126831, 1.7542188167572021, 1.7975986003875732, 1.8409783840179443, 1.8843581676483154, 1.9277379512786865, 1.9711177349090576, 2.0144975185394287, 2.0578773021698, 2.101257085800171, 2.144636869430542, 2.188016653060913, 2.231396436691284]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 5.0, 3.0, 6.0, 10.0, 10.0, 11.0, 15.0, 19.0, 23.0, 24.0, 32.0, 35.0, 34.0, 31.0, 29.0, 32.0, 49.0, 38.0, 44.0, 48.0, 57.0, 48.0, 34.0, 43.0, 50.0, 33.0, 27.0, 40.0, 30.0, 24.0, 20.0, 18.0, 16.0, 17.0, 8.0, 11.0, 12.0, 4.0, 5.0, 3.0, 3.0, 1.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5113065838813782, -0.49378257989883423, -0.47625860571861267, -0.4587346315383911, -0.44121062755584717, -0.4236866235733032, -0.40616264939308167, -0.3886386752128601, -0.37111467123031616, -0.3535906672477722, -0.33606669306755066, -0.3185427188873291, -0.30101871490478516, -0.2834947109222412, -0.26597073674201965, -0.2484467476606369, -0.23092275857925415, -0.2133987694978714, -0.19587478041648865, -0.1783507913351059, -0.16082680225372314, -0.1433028131723404, -0.12577882409095764, -0.10825483500957489, -0.09073084592819214, -0.07320685684680939, -0.055682867765426636, -0.038158878684043884, -0.020634889602661133, -0.0031109005212783813, 0.01441308856010437, 0.03193707764148712, 0.0494610071182251, 0.06698499619960785, 0.0845089852809906, 0.10203297436237335, 0.1195569634437561, 0.13708095252513885, 0.1546049416065216, 0.17212893068790436, 0.1896529197692871, 0.20717690885066986, 0.2247008979320526, 0.24222488701343536, 0.2597488760948181, 0.27727288007736206, 0.2947968542575836, 0.3123208284378052, 0.3298448324203491, 0.34736883640289307, 0.3648928105831146, 0.3824167847633362, 0.3999407887458801, 0.4174647927284241, 0.43498876690864563, 0.4525127410888672, 0.47003674507141113, 0.4875607490539551, 0.505084753036499, 0.5226086974143982, 0.5401327013969421, 0.5576567053794861, 0.5751806497573853, 0.5927046537399292, 0.6102286577224731]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 9.0, 11.0, 11.0, 20.0, 30.0, 35.0, 60.0, 91.0, 157.0, 229.0, 345.0, 525.0, 852.0, 1356.0, 2300.0, 3898.0, 7022.0, 13536.0, 28545.0, 64499.0, 172676.0, 395900.0, 211852.0, 76748.0, 32839.0, 15962.0, 8160.0, 4315.0, 2485.0, 1489.0, 932.0, 587.0, 385.0, 228.0, 147.0, 100.0, 73.0, 49.0, 35.0, 23.0, 19.0, 9.0, 10.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.293212890625, -0.28421783447265625, -0.2752227783203125, -0.26622772216796875, -0.257232666015625, -0.24823760986328125, -0.2392425537109375, -0.23024749755859375, -0.22125244140625, -0.21225738525390625, -0.2032623291015625, -0.19426727294921875, -0.185272216796875, -0.17627716064453125, -0.1672821044921875, -0.15828704833984375, -0.1492919921875, -0.14029693603515625, -0.1313018798828125, -0.12230682373046875, -0.113311767578125, -0.10431671142578125, -0.0953216552734375, -0.08632659912109375, -0.07733154296875, -0.06833648681640625, -0.0593414306640625, -0.05034637451171875, -0.041351318359375, -0.03235626220703125, -0.0233612060546875, -0.01436614990234375, -0.00537109375, 0.00362396240234375, 0.0126190185546875, 0.02161407470703125, 0.030609130859375, 0.03960418701171875, 0.0485992431640625, 0.05759429931640625, 0.06658935546875, 0.07558441162109375, 0.0845794677734375, 0.09357452392578125, 0.102569580078125, 0.11156463623046875, 0.1205596923828125, 0.12955474853515625, 0.1385498046875, 0.14754486083984375, 0.1565399169921875, 0.16553497314453125, 0.174530029296875, 0.18352508544921875, 0.1925201416015625, 0.20151519775390625, 0.21051025390625, 0.21950531005859375, 0.2285003662109375, 0.23749542236328125, 0.246490478515625, 0.25548553466796875, 0.2644805908203125, 0.27347564697265625, 0.282470703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 5.0, 2.0, 8.0, 10.0, 9.0, 17.0, 12.0, 21.0, 24.0, 31.0, 41.0, 33.0, 31.0, 36.0, 36.0, 34.0, 57.0, 59.0, 59.0, 41.0, 53.0, 45.0, 51.0, 41.0, 34.0, 35.0, 43.0, 30.0, 20.0, 19.0, 18.0, 7.0, 18.0, 3.0, 9.0, 3.0, 3.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.339111328125, -0.32689666748046875, -0.3146820068359375, -0.30246734619140625, -0.290252685546875, -0.27803802490234375, -0.2658233642578125, -0.25360870361328125, -0.24139404296875, -0.22917938232421875, -0.2169647216796875, -0.20475006103515625, -0.192535400390625, -0.18032073974609375, -0.1681060791015625, -0.15589141845703125, -0.1436767578125, -0.13146209716796875, -0.1192474365234375, -0.10703277587890625, -0.094818115234375, -0.08260345458984375, -0.0703887939453125, -0.05817413330078125, -0.04595947265625, -0.03374481201171875, -0.0215301513671875, -0.00931549072265625, 0.002899169921875, 0.01511383056640625, 0.0273284912109375, 0.03954315185546875, 0.0517578125, 0.06397247314453125, 0.0761871337890625, 0.08840179443359375, 0.100616455078125, 0.11283111572265625, 0.1250457763671875, 0.13726043701171875, 0.14947509765625, 0.16168975830078125, 0.1739044189453125, 0.18611907958984375, 0.198333740234375, 0.21054840087890625, 0.2227630615234375, 0.23497772216796875, 0.2471923828125, 0.25940704345703125, 0.2716217041015625, 0.28383636474609375, 0.296051025390625, 0.30826568603515625, 0.3204803466796875, 0.33269500732421875, 0.34490966796875, 0.35712432861328125, 0.3693389892578125, 0.38155364990234375, 0.393768310546875, 0.40598297119140625, 0.4181976318359375, 0.43041229248046875, 0.442626953125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 2.0, 3.0, 4.0, 4.0, 6.0, 14.0, 11.0, 8.0, 22.0, 33.0, 49.0, 95.0, 123.0, 216.0, 392.0, 681.0, 1404.0, 3334.0, 8996.0, 28500.0, 113722.0, 499199.0, 299948.0, 63492.0, 17577.0, 5957.0, 2388.0, 1051.0, 529.0, 297.0, 171.0, 100.0, 68.0, 47.0, 26.0, 30.0, 14.0, 10.0, 9.0, 9.0, 6.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.392578125, -0.3812980651855469, -0.37001800537109375, -0.3587379455566406, -0.3474578857421875, -0.3361778259277344, -0.32489776611328125, -0.3136177062988281, -0.302337646484375, -0.2910575866699219, -0.27977752685546875, -0.2684974670410156, -0.2572174072265625, -0.24593734741210938, -0.23465728759765625, -0.22337722778320312, -0.21209716796875, -0.20081710815429688, -0.18953704833984375, -0.17825698852539062, -0.1669769287109375, -0.15569686889648438, -0.14441680908203125, -0.13313674926757812, -0.121856689453125, -0.11057662963867188, -0.09929656982421875, -0.08801651000976562, -0.0767364501953125, -0.06545639038085938, -0.05417633056640625, -0.042896270751953125, -0.0316162109375, -0.020336151123046875, -0.00905609130859375, 0.002223968505859375, 0.0135040283203125, 0.024784088134765625, 0.03606414794921875, 0.047344207763671875, 0.058624267578125, 0.06990432739257812, 0.08118438720703125, 0.09246444702148438, 0.1037445068359375, 0.11502456665039062, 0.12630462646484375, 0.13758468627929688, 0.14886474609375, 0.16014480590820312, 0.17142486572265625, 0.18270492553710938, 0.1939849853515625, 0.20526504516601562, 0.21654510498046875, 0.22782516479492188, 0.239105224609375, 0.2503852844238281, 0.26166534423828125, 0.2729454040527344, 0.2842254638671875, 0.2955055236816406, 0.30678558349609375, 0.3180656433105469, 0.329345703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 4.0, 8.0, 6.0, 10.0, 15.0, 10.0, 16.0, 14.0, 17.0, 17.0, 21.0, 32.0, 30.0, 32.0, 28.0, 33.0, 43.0, 42.0, 54.0, 40.0, 29.0, 47.0, 50.0, 30.0, 33.0, 33.0, 34.0, 29.0, 13.0, 19.0, 22.0, 21.0, 26.0, 16.0, 20.0, 14.0, 20.0, 9.0, 16.0, 13.0, 3.0, 12.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.57666015625, -0.5589218139648438, -0.5411834716796875, -0.5234451293945312, -0.505706787109375, -0.48796844482421875, -0.4702301025390625, -0.45249176025390625, -0.43475341796875, -0.41701507568359375, -0.3992767333984375, -0.38153839111328125, -0.363800048828125, -0.34606170654296875, -0.3283233642578125, -0.31058502197265625, -0.2928466796875, -0.27510833740234375, -0.2573699951171875, -0.23963165283203125, -0.221893310546875, -0.20415496826171875, -0.1864166259765625, -0.16867828369140625, -0.15093994140625, -0.13320159912109375, -0.1154632568359375, -0.09772491455078125, -0.079986572265625, -0.06224822998046875, -0.0445098876953125, -0.02677154541015625, -0.009033203125, 0.00870513916015625, 0.0264434814453125, 0.04418182373046875, 0.061920166015625, 0.07965850830078125, 0.0973968505859375, 0.11513519287109375, 0.13287353515625, 0.15061187744140625, 0.1683502197265625, 0.18608856201171875, 0.203826904296875, 0.22156524658203125, 0.2393035888671875, 0.25704193115234375, 0.2747802734375, 0.29251861572265625, 0.3102569580078125, 0.32799530029296875, 0.345733642578125, 0.36347198486328125, 0.3812103271484375, 0.39894866943359375, 0.41668701171875, 0.43442535400390625, 0.4521636962890625, 0.46990203857421875, 0.487640380859375, 0.5053787231445312, 0.5231170654296875, 0.5408554077148438, 0.55859375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 9.0, 12.0, 10.0, 20.0, 33.0, 41.0, 46.0, 79.0, 118.0, 180.0, 309.0, 586.0, 1259.0, 2802.0, 7479.0, 25836.0, 123278.0, 604784.0, 222153.0, 41322.0, 10983.0, 3818.0, 1578.0, 833.0, 389.0, 247.0, 121.0, 85.0, 50.0, 27.0, 16.0, 12.0, 17.0, 7.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.1011962890625, -0.09857845306396484, -0.09596061706542969, -0.09334278106689453, -0.09072494506835938, -0.08810710906982422, -0.08548927307128906, -0.0828714370727539, -0.08025360107421875, -0.0776357650756836, -0.07501792907714844, -0.07240009307861328, -0.06978225708007812, -0.06716442108154297, -0.06454658508300781, -0.061928749084472656, -0.0593109130859375, -0.056693077087402344, -0.05407524108886719, -0.05145740509033203, -0.048839569091796875, -0.04622173309326172, -0.04360389709472656, -0.040986061096191406, -0.03836822509765625, -0.035750389099121094, -0.03313255310058594, -0.03051471710205078, -0.027896881103515625, -0.02527904510498047, -0.022661209106445312, -0.020043373107910156, -0.017425537109375, -0.014807701110839844, -0.012189865112304688, -0.009572029113769531, -0.006954193115234375, -0.004336357116699219, -0.0017185211181640625, 0.0008993148803710938, 0.00351715087890625, 0.006134986877441406, 0.008752822875976562, 0.011370658874511719, 0.013988494873046875, 0.01660633087158203, 0.019224166870117188, 0.021842002868652344, 0.0244598388671875, 0.027077674865722656, 0.029695510864257812, 0.03231334686279297, 0.034931182861328125, 0.03754901885986328, 0.04016685485839844, 0.042784690856933594, 0.04540252685546875, 0.048020362854003906, 0.05063819885253906, 0.05325603485107422, 0.055873870849609375, 0.05849170684814453, 0.06110954284667969, 0.06372737884521484, 0.06634521484375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 6.0, 4.0, 10.0, 10.0, 10.0, 20.0, 24.0, 29.0, 38.0, 47.0, 88.0, 100.0, 136.0, 122.0, 86.0, 71.0, 53.0, 34.0, 36.0, 20.0, 9.0, 4.0, 6.0, 11.0, 3.0, 5.0, 10.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.404783248901367e-05, -4.2280182242393494e-05, -4.0512531995773315e-05, -3.874488174915314e-05, -3.697723150253296e-05, -3.520958125591278e-05, -3.34419310092926e-05, -3.1674280762672424e-05, -2.9906630516052246e-05, -2.8138980269432068e-05, -2.637133002281189e-05, -2.460367977619171e-05, -2.2836029529571533e-05, -2.1068379282951355e-05, -1.9300729036331177e-05, -1.7533078789711e-05, -1.576542854309082e-05, -1.3997778296470642e-05, -1.2230128049850464e-05, -1.0462477803230286e-05, -8.694827556610107e-06, -6.927177309989929e-06, -5.159527063369751e-06, -3.3918768167495728e-06, -1.6242265701293945e-06, 1.434236764907837e-07, 1.911073923110962e-06, 3.67872416973114e-06, 5.446374416351318e-06, 7.214024662971497e-06, 8.981674909591675e-06, 1.0749325156211853e-05, 1.2516975402832031e-05, 1.428462564945221e-05, 1.6052275896072388e-05, 1.7819926142692566e-05, 1.9587576389312744e-05, 2.1355226635932922e-05, 2.31228768825531e-05, 2.489052712917328e-05, 2.6658177375793457e-05, 2.8425827622413635e-05, 3.0193477869033813e-05, 3.196112811565399e-05, 3.372877836227417e-05, 3.549642860889435e-05, 3.7264078855514526e-05, 3.9031729102134705e-05, 4.079937934875488e-05, 4.256702959537506e-05, 4.433467984199524e-05, 4.610233008861542e-05, 4.7869980335235596e-05, 4.9637630581855774e-05, 5.140528082847595e-05, 5.317293107509613e-05, 5.494058132171631e-05, 5.670823156833649e-05, 5.8475881814956665e-05, 6.024353206157684e-05, 6.201118230819702e-05, 6.37788325548172e-05, 6.554648280143738e-05, 6.731413304805756e-05, 6.908178329467773e-05]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 8.0, 2.0, 7.0, 3.0, 4.0, 2.0, 5.0, 10.0, 25.0, 13.0, 21.0, 23.0, 22.0, 37.0, 51.0, 70.0, 241.0, 14388.0, 1029056.0, 4094.0, 149.0, 79.0, 48.0, 25.0, 34.0, 28.0, 15.0, 10.0, 14.0, 12.0, 7.0, 10.0, 6.0, 4.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.396484375, -0.38385772705078125, -0.3712310791015625, -0.35860443115234375, -0.345977783203125, -0.33335113525390625, -0.3207244873046875, -0.30809783935546875, -0.29547119140625, -0.28284454345703125, -0.2702178955078125, -0.25759124755859375, -0.244964599609375, -0.23233795166015625, -0.2197113037109375, -0.20708465576171875, -0.1944580078125, -0.18183135986328125, -0.1692047119140625, -0.15657806396484375, -0.143951416015625, -0.13132476806640625, -0.1186981201171875, -0.10607147216796875, -0.09344482421875, -0.08081817626953125, -0.0681915283203125, -0.05556488037109375, -0.042938232421875, -0.03031158447265625, -0.0176849365234375, -0.00505828857421875, 0.007568359375, 0.02019500732421875, 0.0328216552734375, 0.04544830322265625, 0.058074951171875, 0.07070159912109375, 0.0833282470703125, 0.09595489501953125, 0.10858154296875, 0.12120819091796875, 0.1338348388671875, 0.14646148681640625, 0.159088134765625, 0.17171478271484375, 0.1843414306640625, 0.19696807861328125, 0.2095947265625, 0.22222137451171875, 0.2348480224609375, 0.24747467041015625, 0.260101318359375, 0.27272796630859375, 0.2853546142578125, 0.29798126220703125, 0.31060791015625, 0.32323455810546875, 0.3358612060546875, 0.34848785400390625, 0.361114501953125, 0.37374114990234375, 0.3863677978515625, 0.39899444580078125, 0.41162109375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 1.0, 3.0, 4.0, 6.0, 14.0, 8.0, 7.0, 8.0, 13.0, 19.0, 27.0, 33.0, 33.0, 46.0, 49.0, 49.0, 55.0, 67.0, 53.0, 73.0, 59.0, 52.0, 61.0, 47.0, 34.0, 27.0, 24.0, 26.0, 17.0, 17.0, 13.0, 10.0, 9.0, 7.0, 8.0, 4.0, 6.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0164337158203125, -0.015799522399902344, -0.015165328979492188, -0.014531135559082031, -0.013896942138671875, -0.013262748718261719, -0.012628555297851562, -0.011994361877441406, -0.01136016845703125, -0.010725975036621094, -0.010091781616210938, -0.009457588195800781, -0.008823394775390625, -0.008189201354980469, -0.0075550079345703125, -0.006920814514160156, -0.00628662109375, -0.005652427673339844, -0.0050182342529296875, -0.004384040832519531, -0.003749847412109375, -0.0031156539916992188, -0.0024814605712890625, -0.0018472671508789062, -0.00121307373046875, -0.0005788803100585938, 5.53131103515625e-05, 0.0006895065307617188, 0.001323699951171875, 0.0019578933715820312, 0.0025920867919921875, 0.0032262802124023438, 0.0038604736328125, 0.004494667053222656, 0.0051288604736328125, 0.005763053894042969, 0.006397247314453125, 0.007031440734863281, 0.0076656341552734375, 0.008299827575683594, 0.00893402099609375, 0.009568214416503906, 0.010202407836914062, 0.010836601257324219, 0.011470794677734375, 0.012104988098144531, 0.012739181518554688, 0.013373374938964844, 0.014007568359375, 0.014641761779785156, 0.015275955200195312, 0.01591014862060547, 0.016544342041015625, 0.01717853546142578, 0.017812728881835938, 0.018446922302246094, 0.01908111572265625, 0.019715309143066406, 0.020349502563476562, 0.02098369598388672, 0.021617889404296875, 0.02225208282470703, 0.022886276245117188, 0.023520469665527344, 0.0241546630859375]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 3.0, 11.0, 14.0, 26.0, 35.0, 62.0, 100.0, 150.0, 172.0, 146.0, 123.0, 51.0, 53.0, 20.0, 13.0, 9.0, 7.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.477413535118103, -0.4553607404232025, -0.4333079755306244, -0.4112551808357239, -0.38920241594314575, -0.36714962124824524, -0.3450968265533447, -0.3230440616607666, -0.3009912669658661, -0.2789384722709656, -0.25688570737838745, -0.23483291268348694, -0.21278013288974762, -0.1907273530960083, -0.1686745584011078, -0.14662177860736847, -0.12456899881362915, -0.10251621901988983, -0.08046343177556992, -0.05841064453125, -0.03635786473751068, -0.014305084943771362, 0.00774770975112915, 0.02980048954486847, 0.05185326933860779, 0.0739060491323471, 0.09595883637666702, 0.11801162362098694, 0.14006440341472626, 0.16211718320846558, 0.1841699779033661, 0.2062227576971054, 0.22827553749084473, 0.25032833218574524, 0.27238109707832336, 0.2944338917732239, 0.316486656665802, 0.3385394513607025, 0.360592246055603, 0.38264501094818115, 0.40469780564308167, 0.4267506003379822, 0.4488033652305603, 0.4708561599254608, 0.49290895462036133, 0.5149617195129395, 0.5370144844055176, 0.5590673089027405, 0.5811200737953186, 0.6031728386878967, 0.6252256631851196, 0.6472784280776978, 0.6693311929702759, 0.691383957862854, 0.7134367823600769, 0.735489547252655, 0.7575423717498779, 0.779595136642456, 0.801647961139679, 0.8237007260322571, 0.8457534909248352, 0.8678063154220581, 0.8898590803146362, 0.9119118452072144, 0.9339646100997925]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 6.0, 7.0, 8.0, 10.0, 17.0, 19.0, 29.0, 29.0, 44.0, 30.0, 31.0, 44.0, 48.0, 46.0, 45.0, 49.0, 62.0, 52.0, 56.0, 59.0, 45.0, 50.0, 33.0, 34.0, 34.0, 25.0, 23.0, 19.0, 13.0, 11.0, 4.0, 11.0, 2.0, 2.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.374891996383667, -0.3621973395347595, -0.34950268268585205, -0.3368080258369446, -0.3241133689880371, -0.31141871213912964, -0.29872405529022217, -0.2860293984413147, -0.2733347415924072, -0.26064008474349976, -0.24794542789459229, -0.23525077104568481, -0.22255611419677734, -0.20986145734786987, -0.1971667855978012, -0.18447212874889374, -0.17177745699882507, -0.1590828001499176, -0.14638814330101013, -0.13369348645210266, -0.1209988221526146, -0.10830416530370712, -0.09560950100421906, -0.08291484415531158, -0.07022018730640411, -0.05752553045749664, -0.044830869883298874, -0.032136209309101105, -0.019441552460193634, -0.006746895611286163, 0.005947768688201904, 0.018642425537109375, 0.03133705258369446, 0.04403170943260193, 0.0567263700067997, 0.06942103058099747, 0.08211568742990494, 0.09481034427881241, 0.10750500857830048, 0.12019966542720795, 0.13289432227611542, 0.1455889791250229, 0.15828363597393036, 0.17097830772399902, 0.1836729645729065, 0.19636762142181396, 0.20906227827072144, 0.2217569351196289, 0.23445159196853638, 0.24714624881744385, 0.2598409056663513, 0.2725355625152588, 0.28523021936416626, 0.29792487621307373, 0.3106195330619812, 0.32331418991088867, 0.33600884675979614, 0.3487035036087036, 0.3613981604576111, 0.37409281730651855, 0.386787474155426, 0.3994821310043335, 0.41217678785324097, 0.42487144470214844, 0.4375661313533783]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 5.0, 4.0, 8.0, 5.0, 9.0, 18.0, 22.0, 28.0, 32.0, 46.0, 72.0, 92.0, 150.0, 230.0, 318.0, 502.0, 839.0, 1501.0, 2586.0, 4830.0, 9223.0, 18370.0, 38922.0, 87838.0, 220991.0, 365720.0, 165878.0, 67388.0, 30787.0, 14913.0, 7735.0, 3978.0, 2174.0, 1242.0, 721.0, 466.0, 297.0, 182.0, 133.0, 93.0, 53.0, 41.0, 40.0, 26.0, 19.0, 9.0, 9.0, 7.0, 5.0, 2.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1292724609375, -0.12514877319335938, -0.12102508544921875, -0.11690139770507812, -0.1127777099609375, -0.10865402221679688, -0.10453033447265625, -0.10040664672851562, -0.096282958984375, -0.09215927124023438, -0.08803558349609375, -0.08391189575195312, -0.0797882080078125, -0.07566452026367188, -0.07154083251953125, -0.06741714477539062, -0.06329345703125, -0.059169769287109375, -0.05504608154296875, -0.050922393798828125, -0.0467987060546875, -0.042675018310546875, -0.03855133056640625, -0.034427642822265625, -0.030303955078125, -0.026180267333984375, -0.02205657958984375, -0.017932891845703125, -0.0138092041015625, -0.009685516357421875, -0.00556182861328125, -0.001438140869140625, 0.002685546875, 0.006809234619140625, 0.01093292236328125, 0.015056610107421875, 0.0191802978515625, 0.023303985595703125, 0.02742767333984375, 0.031551361083984375, 0.035675048828125, 0.039798736572265625, 0.04392242431640625, 0.048046112060546875, 0.0521697998046875, 0.056293487548828125, 0.06041717529296875, 0.06454086303710938, 0.06866455078125, 0.07278823852539062, 0.07691192626953125, 0.08103561401367188, 0.0851593017578125, 0.08928298950195312, 0.09340667724609375, 0.09753036499023438, 0.101654052734375, 0.10577774047851562, 0.10990142822265625, 0.11402511596679688, 0.1181488037109375, 0.12227249145507812, 0.12639617919921875, 0.13051986694335938, 0.1346435546875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 8.0, 4.0, 9.0, 9.0, 18.0, 17.0, 13.0, 23.0, 13.0, 34.0, 33.0, 26.0, 36.0, 36.0, 46.0, 43.0, 54.0, 64.0, 57.0, 49.0, 42.0, 45.0, 52.0, 38.0, 36.0, 31.0, 29.0, 26.0, 23.0, 13.0, 13.0, 11.0, 11.0, 9.0, 6.0, 8.0, 5.0, 7.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8779296875, -1.8259124755859375, -1.773895263671875, -1.7218780517578125, -1.66986083984375, -1.6178436279296875, -1.565826416015625, -1.5138092041015625, -1.4617919921875, -1.4097747802734375, -1.357757568359375, -1.3057403564453125, -1.25372314453125, -1.2017059326171875, -1.149688720703125, -1.0976715087890625, -1.045654296875, -0.9936370849609375, -0.941619873046875, -0.8896026611328125, -0.83758544921875, -0.7855682373046875, -0.733551025390625, -0.6815338134765625, -0.6295166015625, -0.5774993896484375, -0.525482177734375, -0.4734649658203125, -0.42144775390625, -0.3694305419921875, -0.317413330078125, -0.2653961181640625, -0.21337890625, -0.1613616943359375, -0.109344482421875, -0.0573272705078125, -0.00531005859375, 0.0467071533203125, 0.098724365234375, 0.1507415771484375, 0.2027587890625, 0.2547760009765625, 0.306793212890625, 0.3588104248046875, 0.41082763671875, 0.4628448486328125, 0.514862060546875, 0.5668792724609375, 0.618896484375, 0.6709136962890625, 0.722930908203125, 0.7749481201171875, 0.82696533203125, 0.8789825439453125, 0.930999755859375, 0.9830169677734375, 1.0350341796875, 1.0870513916015625, 1.139068603515625, 1.1910858154296875, 1.24310302734375, 1.2951202392578125, 1.347137451171875, 1.3991546630859375, 1.451171875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 6.0, 4.0, 2.0, 5.0, 7.0, 16.0, 14.0, 24.0, 30.0, 51.0, 45.0, 57.0, 65.0, 80.0, 343.0, 1045766.0, 1505.0, 156.0, 78.0, 53.0, 48.0, 47.0, 44.0, 29.0, 19.0, 20.0, 10.0, 11.0, 8.0, 7.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.91796875, -6.7298583984375, -6.541748046875, -6.3536376953125, -6.16552734375, -5.9774169921875, -5.789306640625, -5.6011962890625, -5.4130859375, -5.2249755859375, -5.036865234375, -4.8487548828125, -4.66064453125, -4.4725341796875, -4.284423828125, -4.0963134765625, -3.908203125, -3.7200927734375, -3.531982421875, -3.3438720703125, -3.15576171875, -2.9676513671875, -2.779541015625, -2.5914306640625, -2.4033203125, -2.2152099609375, -2.027099609375, -1.8389892578125, -1.65087890625, -1.4627685546875, -1.274658203125, -1.0865478515625, -0.8984375, -0.7103271484375, -0.522216796875, -0.3341064453125, -0.14599609375, 0.0421142578125, 0.230224609375, 0.4183349609375, 0.6064453125, 0.7945556640625, 0.982666015625, 1.1707763671875, 1.35888671875, 1.5469970703125, 1.735107421875, 1.9232177734375, 2.111328125, 2.2994384765625, 2.487548828125, 2.6756591796875, 2.86376953125, 3.0518798828125, 3.239990234375, 3.4281005859375, 3.6162109375, 3.8043212890625, 3.992431640625, 4.1805419921875, 4.36865234375, 4.5567626953125, 4.744873046875, 4.9329833984375, 5.12109375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 6.0, 4.0, 2.0, 4.0, 8.0, 18.0, 12.0, 27.0, 31.0, 50.0, 50.0, 50.0, 50.0, 66.0, 67.0, 79.0, 61.0, 58.0, 63.0, 49.0, 49.0, 48.0, 43.0, 27.0, 21.0, 19.0, 10.0, 11.0, 8.0, 8.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.755859375, -2.6807861328125, -2.605712890625, -2.5306396484375, -2.45556640625, -2.3804931640625, -2.305419921875, -2.2303466796875, -2.1552734375, -2.0802001953125, -2.005126953125, -1.9300537109375, -1.85498046875, -1.7799072265625, -1.704833984375, -1.6297607421875, -1.5546875, -1.4796142578125, -1.404541015625, -1.3294677734375, -1.25439453125, -1.1793212890625, -1.104248046875, -1.0291748046875, -0.9541015625, -0.8790283203125, -0.803955078125, -0.7288818359375, -0.65380859375, -0.5787353515625, -0.503662109375, -0.4285888671875, -0.353515625, -0.2784423828125, -0.203369140625, -0.1282958984375, -0.05322265625, 0.0218505859375, 0.096923828125, 0.1719970703125, 0.2470703125, 0.3221435546875, 0.397216796875, 0.4722900390625, 0.54736328125, 0.6224365234375, 0.697509765625, 0.7725830078125, 0.84765625, 0.9227294921875, 0.997802734375, 1.0728759765625, 1.14794921875, 1.2230224609375, 1.298095703125, 1.3731689453125, 1.4482421875, 1.5233154296875, 1.598388671875, 1.6734619140625, 1.74853515625, 1.8236083984375, 1.898681640625, 1.9737548828125, 2.048828125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 3.0, 4.0, 13.0, 6.0, 10.0, 11.0, 16.0, 28.0, 56.0, 119.0, 909.0, 47024.0, 995990.0, 3841.0, 290.0, 99.0, 41.0, 22.0, 18.0, 11.0, 15.0, 12.0, 3.0, 4.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2939453125, -0.2842254638671875, -0.274505615234375, -0.2647857666015625, -0.25506591796875, -0.2453460693359375, -0.235626220703125, -0.2259063720703125, -0.2161865234375, -0.2064666748046875, -0.196746826171875, -0.1870269775390625, -0.17730712890625, -0.1675872802734375, -0.157867431640625, -0.1481475830078125, -0.138427734375, -0.1287078857421875, -0.118988037109375, -0.1092681884765625, -0.09954833984375, -0.0898284912109375, -0.080108642578125, -0.0703887939453125, -0.0606689453125, -0.0509490966796875, -0.041229248046875, -0.0315093994140625, -0.02178955078125, -0.0120697021484375, -0.002349853515625, 0.0073699951171875, 0.01708984375, 0.0268096923828125, 0.036529541015625, 0.0462493896484375, 0.05596923828125, 0.0656890869140625, 0.075408935546875, 0.0851287841796875, 0.0948486328125, 0.1045684814453125, 0.114288330078125, 0.1240081787109375, 0.13372802734375, 0.1434478759765625, 0.153167724609375, 0.1628875732421875, 0.172607421875, 0.1823272705078125, 0.192047119140625, 0.2017669677734375, 0.21148681640625, 0.2212066650390625, 0.230926513671875, 0.2406463623046875, 0.2503662109375, 0.2600860595703125, 0.269805908203125, 0.2795257568359375, 0.28924560546875, 0.2989654541015625, 0.308685302734375, 0.3184051513671875, 0.328125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 2.0, 9.0, 11.0, 11.0, 22.0, 24.0, 53.0, 76.0, 184.0, 223.0, 162.0, 68.0, 49.0, 29.0, 21.0, 7.0, 9.0, 12.0, 7.0, 5.0, 5.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.110004425048828e-05, -2.0592473447322845e-05, -2.008490264415741e-05, -1.9577331840991974e-05, -1.9069761037826538e-05, -1.8562190234661102e-05, -1.8054619431495667e-05, -1.754704862833023e-05, -1.7039477825164795e-05, -1.653190702199936e-05, -1.6024336218833923e-05, -1.5516765415668488e-05, -1.5009194612503052e-05, -1.4501623809337616e-05, -1.399405300617218e-05, -1.3486482203006744e-05, -1.2978911399841309e-05, -1.2471340596675873e-05, -1.1963769793510437e-05, -1.1456198990345001e-05, -1.0948628187179565e-05, -1.044105738401413e-05, -9.933486580848694e-06, -9.425915777683258e-06, -8.918344974517822e-06, -8.410774171352386e-06, -7.90320336818695e-06, -7.395632565021515e-06, -6.888061761856079e-06, -6.380490958690643e-06, -5.8729201555252075e-06, -5.365349352359772e-06, -4.857778549194336e-06, -4.3502077460289e-06, -3.842636942863464e-06, -3.3350661396980286e-06, -2.8274953365325928e-06, -2.319924533367157e-06, -1.8123537302017212e-06, -1.3047829270362854e-06, -7.972121238708496e-07, -2.896413207054138e-07, 2.1792948246002197e-07, 7.255002856254578e-07, 1.2330710887908936e-06, 1.7406418919563293e-06, 2.248212695121765e-06, 2.755783498287201e-06, 3.2633543014526367e-06, 3.7709251046180725e-06, 4.278495907783508e-06, 4.786066710948944e-06, 5.29363751411438e-06, 5.801208317279816e-06, 6.3087791204452515e-06, 6.816349923610687e-06, 7.323920726776123e-06, 7.831491529941559e-06, 8.339062333106995e-06, 8.84663313627243e-06, 9.354203939437866e-06, 9.861774742603302e-06, 1.0369345545768738e-05, 1.0876916348934174e-05, 1.138448715209961e-05]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 7.0, 8.0, 7.0, 6.0, 10.0, 31.0, 43.0, 45.0, 147.0, 408.0, 2067.0, 22442.0, 948740.0, 69620.0, 3908.0, 698.0, 151.0, 80.0, 50.0, 24.0, 16.0, 14.0, 8.0, 4.0, 1.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.177734375, -0.1726055145263672, -0.16747665405273438, -0.16234779357910156, -0.15721893310546875, -0.15209007263183594, -0.14696121215820312, -0.1418323516845703, -0.1367034912109375, -0.1315746307373047, -0.12644577026367188, -0.12131690979003906, -0.11618804931640625, -0.11105918884277344, -0.10593032836914062, -0.10080146789550781, -0.095672607421875, -0.09054374694824219, -0.08541488647460938, -0.08028602600097656, -0.07515716552734375, -0.07002830505371094, -0.06489944458007812, -0.05977058410644531, -0.0546417236328125, -0.04951286315917969, -0.044384002685546875, -0.03925514221191406, -0.03412628173828125, -0.028997421264648438, -0.023868560791015625, -0.018739700317382812, -0.01361083984375, -0.008481979370117188, -0.003353118896484375, 0.0017757415771484375, 0.00690460205078125, 0.012033462524414062, 0.017162322998046875, 0.022291183471679688, 0.0274200439453125, 0.03254890441894531, 0.037677764892578125, 0.04280662536621094, 0.04793548583984375, 0.05306434631347656, 0.058193206787109375, 0.06332206726074219, 0.068450927734375, 0.07357978820800781, 0.07870864868164062, 0.08383750915527344, 0.08896636962890625, 0.09409523010253906, 0.09922409057617188, 0.10435295104980469, 0.1094818115234375, 0.11461067199707031, 0.11973953247070312, 0.12486839294433594, 0.12999725341796875, 0.13512611389160156, 0.14025497436523438, 0.1453838348388672, 0.1505126953125]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 1.0, 4.0, 9.0, 14.0, 17.0, 22.0, 28.0, 41.0, 65.0, 91.0, 110.0, 137.0, 141.0, 91.0, 48.0, 44.0, 30.0, 21.0, 25.0, 11.0, 13.0, 12.0, 5.0, 5.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0243988037109375, -0.023578405380249023, -0.022758007049560547, -0.02193760871887207, -0.021117210388183594, -0.020296812057495117, -0.01947641372680664, -0.018656015396118164, -0.017835617065429688, -0.01701521873474121, -0.016194820404052734, -0.015374422073364258, -0.014554023742675781, -0.013733625411987305, -0.012913227081298828, -0.012092828750610352, -0.011272430419921875, -0.010452032089233398, -0.009631633758544922, -0.008811235427856445, -0.007990837097167969, -0.007170438766479492, -0.006350040435791016, -0.005529642105102539, -0.0047092437744140625, -0.003888845443725586, -0.0030684471130371094, -0.002248048782348633, -0.0014276504516601562, -0.0006072521209716797, 0.00021314620971679688, 0.0010335445404052734, 0.00185394287109375, 0.0026743412017822266, 0.003494739532470703, 0.00431513786315918, 0.005135536193847656, 0.005955934524536133, 0.006776332855224609, 0.007596731185913086, 0.008417129516601562, 0.009237527847290039, 0.010057926177978516, 0.010878324508666992, 0.011698722839355469, 0.012519121170043945, 0.013339519500732422, 0.014159917831420898, 0.014980316162109375, 0.01580071449279785, 0.016621112823486328, 0.017441511154174805, 0.01826190948486328, 0.019082307815551758, 0.019902706146240234, 0.02072310447692871, 0.021543502807617188, 0.022363901138305664, 0.02318429946899414, 0.024004697799682617, 0.024825096130371094, 0.02564549446105957, 0.026465892791748047, 0.027286291122436523, 0.028106689453125]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 13.0, 35.0, 115.0, 333.0, 351.0, 114.0, 38.0, 9.0, 8.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8259516954421997, -0.7229790091514587, -0.6200063228607178, -0.5170336365699768, -0.41406095027923584, -0.3110882639884949, -0.2081155776977539, -0.10514289140701294, -0.0021702051162719727, 0.100802481174469, 0.20377516746520996, 0.3067478537559509, 0.4097205400466919, 0.5126932263374329, 0.6156659126281738, 0.7186385989189148, 0.8216112852096558, 0.9245839715003967, 1.0275566577911377, 1.1305294036865234, 1.2335020303726196, 1.3364746570587158, 1.4394474029541016, 1.5424201488494873, 1.6453927755355835, 1.7483654022216797, 1.8513381481170654, 1.9543108940124512, 2.057283401489258, 2.1602561473846436, 2.2632288932800293, 2.366201639175415, 2.469174385070801, 2.5721471309661865, 2.6751198768615723, 2.778092384338379, 2.8810651302337646, 2.9840378761291504, 3.087010383605957, 3.1899831295013428, 3.2929558753967285, 3.3959286212921143, 3.4989013671875, 3.6018738746643066, 3.7048466205596924, 3.807819366455078, 3.9107918739318848, 4.01376485824585, 4.116737365722656, 4.219709873199463, 4.322682857513428, 4.425655364990234, 4.528628349304199, 4.631600856781006, 4.7345733642578125, 4.837546348571777, 4.940518856048584, 5.043491363525391, 5.1464643478393555, 5.249436855316162, 5.352409362792969, 5.455382347106934, 5.55835485458374, 5.661327838897705, 5.764300346374512]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 8.0, 7.0, 6.0, 11.0, 12.0, 17.0, 15.0, 17.0, 19.0, 30.0, 24.0, 31.0, 43.0, 29.0, 30.0, 38.0, 35.0, 40.0, 43.0, 50.0, 57.0, 40.0, 48.0, 33.0, 42.0, 33.0, 42.0, 26.0, 33.0, 34.0, 30.0, 16.0, 14.0, 15.0, 9.0, 8.0, 10.0, 4.0, 5.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4271254539489746, -2.3518643379211426, -2.2766032218933105, -2.2013418674468994, -2.1260807514190674, -2.0508196353912354, -1.9755585193634033, -1.9002974033355713, -1.8250361680984497, -1.7497750520706177, -1.674513816833496, -1.599252700805664, -1.523991584777832, -1.4487303495407104, -1.3734692335128784, -1.2982079982757568, -1.2229468822479248, -1.1476857662200928, -1.0724245309829712, -0.9971634149551392, -0.9219022393226624, -0.8466410636901855, -0.7713799476623535, -0.6961187720298767, -0.6208575963973999, -0.5455964207649231, -0.4703352749347687, -0.39507412910461426, -0.31981295347213745, -0.24455177783966064, -0.16929063200950623, -0.0940294861793518, -0.018768310546875, 0.05649285018444061, 0.13175401091575623, 0.20701517164707184, 0.28227633237838745, 0.35753750801086426, 0.4327986538410187, 0.5080597996711731, 0.5833209753036499, 0.6585821509361267, 0.7338433265686035, 0.8091044425964355, 0.8843656182289124, 0.9596267938613892, 1.0348879098892212, 1.1101491451263428, 1.1854102611541748, 1.2606713771820068, 1.3359326124191284, 1.4111937284469604, 1.486454963684082, 1.561716079711914, 1.636977195739746, 1.7122383117675781, 1.7874995470046997, 1.8627606630325317, 1.9380218982696533, 2.0132830142974854, 2.0885441303253174, 2.1638054847717285, 2.2390666007995605, 2.3143277168273926, 2.3895888328552246]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 5.0, 3.0, 5.0, 5.0, 14.0, 10.0, 8.0, 13.0, 13.0, 18.0, 24.0, 26.0, 31.0, 31.0, 69.0, 130.0, 366.0, 1186.0, 4414.0, 29050.0, 3083652.0, 1051195.0, 18500.0, 3691.0, 1058.0, 363.0, 123.0, 64.0, 47.0, 37.0, 28.0, 30.0, 14.0, 13.0, 14.0, 13.0, 7.0, 9.0, 5.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.89453125, -1.836944580078125, -1.77935791015625, -1.721771240234375, -1.6641845703125, -1.606597900390625, -1.54901123046875, -1.491424560546875, -1.433837890625, -1.376251220703125, -1.31866455078125, -1.261077880859375, -1.2034912109375, -1.145904541015625, -1.08831787109375, -1.030731201171875, -0.97314453125, -0.915557861328125, -0.85797119140625, -0.800384521484375, -0.7427978515625, -0.685211181640625, -0.62762451171875, -0.570037841796875, -0.512451171875, -0.454864501953125, -0.39727783203125, -0.339691162109375, -0.2821044921875, -0.224517822265625, -0.16693115234375, -0.109344482421875, -0.0517578125, 0.005828857421875, 0.06341552734375, 0.121002197265625, 0.1785888671875, 0.236175537109375, 0.29376220703125, 0.351348876953125, 0.408935546875, 0.466522216796875, 0.52410888671875, 0.581695556640625, 0.6392822265625, 0.696868896484375, 0.75445556640625, 0.812042236328125, 0.86962890625, 0.927215576171875, 0.98480224609375, 1.042388916015625, 1.0999755859375, 1.157562255859375, 1.21514892578125, 1.272735595703125, 1.330322265625, 1.387908935546875, 1.44549560546875, 1.503082275390625, 1.5606689453125, 1.618255615234375, 1.67584228515625, 1.733428955078125, 1.791015625]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 13.0, 15.0, 18.0, 22.0, 23.0, 29.0, 40.0, 31.0, 43.0, 69.0, 74.0, 64.0, 54.0, 61.0, 84.0, 58.0, 54.0, 56.0, 45.0, 30.0, 35.0, 22.0, 16.0, 9.0, 9.0, 7.0, 5.0, 4.0, 2.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2958984375, -0.2823486328125, -0.268798828125, -0.2552490234375, -0.24169921875, -0.2281494140625, -0.214599609375, -0.2010498046875, -0.1875, -0.1739501953125, -0.160400390625, -0.1468505859375, -0.13330078125, -0.1197509765625, -0.106201171875, -0.0926513671875, -0.0791015625, -0.0655517578125, -0.052001953125, -0.0384521484375, -0.02490234375, -0.0113525390625, 0.002197265625, 0.0157470703125, 0.029296875, 0.0428466796875, 0.056396484375, 0.0699462890625, 0.08349609375, 0.0970458984375, 0.110595703125, 0.1241455078125, 0.1376953125, 0.1512451171875, 0.164794921875, 0.1783447265625, 0.19189453125, 0.2054443359375, 0.218994140625, 0.2325439453125, 0.24609375, 0.2596435546875, 0.273193359375, 0.2867431640625, 0.30029296875, 0.3138427734375, 0.327392578125, 0.3409423828125, 0.3544921875, 0.3680419921875, 0.381591796875, 0.3951416015625, 0.40869140625, 0.4222412109375, 0.435791015625, 0.4493408203125, 0.462890625, 0.4764404296875, 0.489990234375, 0.5035400390625, 0.51708984375, 0.5306396484375, 0.544189453125, 0.5577392578125, 0.5712890625]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 7.0, 5.0, 20.0, 40.0, 148.0, 432.0, 10353.0, 4181463.0, 1370.0, 298.0, 91.0, 29.0, 8.0, 4.0, 2.0, 4.0, 7.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.62890625, -5.37640380859375, -5.1239013671875, -4.87139892578125, -4.618896484375, -4.36639404296875, -4.1138916015625, -3.86138916015625, -3.60888671875, -3.35638427734375, -3.1038818359375, -2.85137939453125, -2.598876953125, -2.34637451171875, -2.0938720703125, -1.84136962890625, -1.5888671875, -1.33636474609375, -1.0838623046875, -0.83135986328125, -0.578857421875, -0.32635498046875, -0.0738525390625, 0.17864990234375, 0.43115234375, 0.68365478515625, 0.9361572265625, 1.18865966796875, 1.441162109375, 1.69366455078125, 1.9461669921875, 2.19866943359375, 2.451171875, 2.70367431640625, 2.9561767578125, 3.20867919921875, 3.461181640625, 3.71368408203125, 3.9661865234375, 4.21868896484375, 4.47119140625, 4.72369384765625, 4.9761962890625, 5.22869873046875, 5.481201171875, 5.73370361328125, 5.9862060546875, 6.23870849609375, 6.4912109375, 6.74371337890625, 6.9962158203125, 7.24871826171875, 7.501220703125, 7.75372314453125, 8.0062255859375, 8.25872802734375, 8.51123046875, 8.76373291015625, 9.0162353515625, 9.26873779296875, 9.521240234375, 9.77374267578125, 10.0262451171875, 10.27874755859375, 10.53125]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 4.0, 3.0, 7.0, 4.0, 8.0, 14.0, 12.0, 19.0, 30.0, 46.0, 68.0, 78.0, 149.0, 285.0, 612.0, 1065.0, 811.0, 360.0, 170.0, 89.0, 77.0, 39.0, 34.0, 26.0, 18.0, 13.0, 11.0, 7.0, 4.0, 4.0, 3.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2861328125, -0.2781181335449219, -0.27010345458984375, -0.2620887756347656, -0.2540740966796875, -0.24605941772460938, -0.23804473876953125, -0.23003005981445312, -0.222015380859375, -0.21400070190429688, -0.20598602294921875, -0.19797134399414062, -0.1899566650390625, -0.18194198608398438, -0.17392730712890625, -0.16591262817382812, -0.15789794921875, -0.14988327026367188, -0.14186859130859375, -0.13385391235351562, -0.1258392333984375, -0.11782455444335938, -0.10980987548828125, -0.10179519653320312, -0.093780517578125, -0.08576583862304688, -0.07775115966796875, -0.06973648071289062, -0.0617218017578125, -0.053707122802734375, -0.04569244384765625, -0.037677764892578125, -0.0296630859375, -0.021648406982421875, -0.01363372802734375, -0.005619049072265625, 0.0023956298828125, 0.010410308837890625, 0.01842498779296875, 0.026439666748046875, 0.034454345703125, 0.042469024658203125, 0.05048370361328125, 0.058498382568359375, 0.0665130615234375, 0.07452774047851562, 0.08254241943359375, 0.09055709838867188, 0.09857177734375, 0.10658645629882812, 0.11460113525390625, 0.12261581420898438, 0.1306304931640625, 0.13864517211914062, 0.14665985107421875, 0.15467453002929688, 0.162689208984375, 0.17070388793945312, 0.17871856689453125, 0.18673324584960938, 0.1947479248046875, 0.20276260375976562, 0.21077728271484375, 0.21879196166992188, 0.226806640625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 9.0, 17.0, 35.0, 44.0, 75.0, 125.0, 193.0, 187.0, 122.0, 68.0, 52.0, 26.0, 17.0, 11.0, 7.0, 2.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5024560689926147, -0.4691631495952606, -0.4358702003955841, -0.40257728099823, -0.36928433179855347, -0.33599141240119934, -0.3026984930038452, -0.2694055438041687, -0.23611262440681458, -0.20281969010829926, -0.16952675580978394, -0.1362338364124298, -0.10294090211391449, -0.06964796781539917, -0.036355048418045044, -0.003062114119529724, 0.030230820178985596, 0.06352375447750092, 0.09681668132543564, 0.13010960817337036, 0.16340254247188568, 0.196695476770401, 0.22998839616775513, 0.26328134536743164, 0.29657426476478577, 0.3298671841621399, 0.3631601333618164, 0.39645305275917053, 0.42974597215652466, 0.46303892135620117, 0.4963318407535553, 0.5296247601509094, 0.5629177093505859, 0.5962106585502625, 0.6295035481452942, 0.6627964973449707, 0.6960894465446472, 0.7293823957443237, 0.7626752853393555, 0.795968234539032, 0.8292611837387085, 0.862554132938385, 0.8958470225334167, 0.9291399717330933, 0.9624329209327698, 0.9957258701324463, 1.029018759727478, 1.0623116493225098, 1.095604658126831, 1.1288975477218628, 1.162190556526184, 1.1954834461212158, 1.2287763357162476, 1.2620693445205688, 1.2953622341156006, 1.3286551237106323, 1.361948013305664, 1.3952409029006958, 1.428533911705017, 1.4618268013000488, 1.4951196908950806, 1.5284126996994019, 1.5617055892944336, 1.5949984788894653, 1.6282914876937866]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 8.0, 4.0, 9.0, 16.0, 13.0, 13.0, 11.0, 24.0, 18.0, 21.0, 23.0, 39.0, 40.0, 48.0, 46.0, 49.0, 38.0, 44.0, 64.0, 46.0, 52.0, 38.0, 45.0, 52.0, 33.0, 28.0, 32.0, 43.0, 18.0, 13.0, 19.0, 13.0, 11.0, 9.0, 3.0, 8.0, 2.0, 3.0, 3.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3722960650920868, -0.35986608266830444, -0.3474361002445221, -0.33500614762306213, -0.3225761651992798, -0.31014618277549744, -0.2977162003517151, -0.2852862477302551, -0.2728562653064728, -0.26042628288269043, -0.24799631536006927, -0.23556633293628693, -0.22313636541366577, -0.21070638298988342, -0.19827640056610107, -0.18584643304347992, -0.17341645061969757, -0.16098646819591522, -0.14855650067329407, -0.13612651824951172, -0.12369655072689056, -0.11126656830310822, -0.09883659332990646, -0.08640661835670471, -0.07397664338350296, -0.06154666841030121, -0.04911669343709946, -0.03668671473860741, -0.024256739765405655, -0.011826764792203903, 0.000603213906288147, 0.013033188879489899, 0.02546316385269165, 0.0378931388258934, 0.050323113799095154, 0.0627530962228775, 0.07518306374549866, 0.087613046169281, 0.10004302114248276, 0.11247299611568451, 0.12490297108888626, 0.137332946062088, 0.14976292848587036, 0.16219289600849152, 0.17462287843227386, 0.18705284595489502, 0.19948282837867737, 0.21191281080245972, 0.22434277832508087, 0.23677276074886322, 0.24920272827148438, 0.2616327106952667, 0.2740626931190491, 0.28649264574050903, 0.2989226281642914, 0.31135261058807373, 0.3237825930118561, 0.3362125754356384, 0.3486425578594208, 0.36107251048088074, 0.3735024929046631, 0.38593247532844543, 0.3983624577522278, 0.41079241037368774, 0.4232223927974701]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 6.0, 4.0, 9.0, 8.0, 20.0, 23.0, 28.0, 47.0, 50.0, 75.0, 118.0, 175.0, 274.0, 399.0, 613.0, 966.0, 1692.0, 2866.0, 5055.0, 9299.0, 18621.0, 43428.0, 146776.0, 519884.0, 198565.0, 53478.0, 21740.0, 10668.0, 5629.0, 3165.0, 1802.0, 1067.0, 708.0, 461.0, 275.0, 172.0, 113.0, 84.0, 62.0, 36.0, 23.0, 23.0, 13.0, 9.0, 10.0, 5.0, 3.0, 9.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.18212890625, -0.17552947998046875, -0.1689300537109375, -0.16233062744140625, -0.155731201171875, -0.14913177490234375, -0.1425323486328125, -0.13593292236328125, -0.12933349609375, -0.12273406982421875, -0.1161346435546875, -0.10953521728515625, -0.102935791015625, -0.09633636474609375, -0.0897369384765625, -0.08313751220703125, -0.0765380859375, -0.06993865966796875, -0.0633392333984375, -0.05673980712890625, -0.050140380859375, -0.04354095458984375, -0.0369415283203125, -0.03034210205078125, -0.02374267578125, -0.01714324951171875, -0.0105438232421875, -0.00394439697265625, 0.002655029296875, 0.00925445556640625, 0.0158538818359375, 0.02245330810546875, 0.029052734375, 0.03565216064453125, 0.0422515869140625, 0.04885101318359375, 0.055450439453125, 0.06204986572265625, 0.0686492919921875, 0.07524871826171875, 0.08184814453125, 0.08844757080078125, 0.0950469970703125, 0.10164642333984375, 0.108245849609375, 0.11484527587890625, 0.1214447021484375, 0.12804412841796875, 0.1346435546875, 0.14124298095703125, 0.1478424072265625, 0.15444183349609375, 0.161041259765625, 0.16764068603515625, 0.1742401123046875, 0.18083953857421875, 0.18743896484375, 0.19403839111328125, 0.2006378173828125, 0.20723724365234375, 0.213836669921875, 0.22043609619140625, 0.2270355224609375, 0.23363494873046875, 0.240234375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 4.0, 5.0, 9.0, 6.0, 8.0, 17.0, 23.0, 23.0, 22.0, 33.0, 36.0, 47.0, 54.0, 57.0, 61.0, 60.0, 78.0, 61.0, 59.0, 52.0, 61.0, 48.0, 39.0, 35.0, 35.0, 24.0, 9.0, 11.0, 9.0, 5.0, 7.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26025390625, -0.2511138916015625, -0.241973876953125, -0.2328338623046875, -0.22369384765625, -0.2145538330078125, -0.205413818359375, -0.1962738037109375, -0.1871337890625, -0.1779937744140625, -0.168853759765625, -0.1597137451171875, -0.15057373046875, -0.1414337158203125, -0.132293701171875, -0.1231536865234375, -0.114013671875, -0.1048736572265625, -0.095733642578125, -0.0865936279296875, -0.07745361328125, -0.0683135986328125, -0.059173583984375, -0.0500335693359375, -0.0408935546875, -0.0317535400390625, -0.022613525390625, -0.0134735107421875, -0.00433349609375, 0.0048065185546875, 0.013946533203125, 0.0230865478515625, 0.0322265625, 0.0413665771484375, 0.050506591796875, 0.0596466064453125, 0.06878662109375, 0.0779266357421875, 0.087066650390625, 0.0962066650390625, 0.1053466796875, 0.1144866943359375, 0.123626708984375, 0.1327667236328125, 0.14190673828125, 0.1510467529296875, 0.160186767578125, 0.1693267822265625, 0.178466796875, 0.1876068115234375, 0.196746826171875, 0.2058868408203125, 0.21502685546875, 0.2241668701171875, 0.233306884765625, 0.2424468994140625, 0.2515869140625, 0.2607269287109375, 0.269866943359375, 0.2790069580078125, 0.28814697265625, 0.2972869873046875, 0.306427001953125, 0.3155670166015625, 0.32470703125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 2.0, 8.0, 2.0, 10.0, 23.0, 33.0, 45.0, 74.0, 154.0, 323.0, 810.0, 2030.0, 6321.0, 23856.0, 152287.0, 737888.0, 98991.0, 17819.0, 5017.0, 1637.0, 600.0, 282.0, 134.0, 63.0, 41.0, 26.0, 20.0, 12.0, 11.0, 11.0, 3.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.265625, -0.256591796875, -0.24755859375, -0.238525390625, -0.2294921875, -0.220458984375, -0.21142578125, -0.202392578125, -0.193359375, -0.184326171875, -0.17529296875, -0.166259765625, -0.1572265625, -0.148193359375, -0.13916015625, -0.130126953125, -0.12109375, -0.112060546875, -0.10302734375, -0.093994140625, -0.0849609375, -0.075927734375, -0.06689453125, -0.057861328125, -0.048828125, -0.039794921875, -0.03076171875, -0.021728515625, -0.0126953125, -0.003662109375, 0.00537109375, 0.014404296875, 0.0234375, 0.032470703125, 0.04150390625, 0.050537109375, 0.0595703125, 0.068603515625, 0.07763671875, 0.086669921875, 0.095703125, 0.104736328125, 0.11376953125, 0.122802734375, 0.1318359375, 0.140869140625, 0.14990234375, 0.158935546875, 0.16796875, 0.177001953125, 0.18603515625, 0.195068359375, 0.2041015625, 0.213134765625, 0.22216796875, 0.231201171875, 0.240234375, 0.249267578125, 0.25830078125, 0.267333984375, 0.2763671875, 0.285400390625, 0.29443359375, 0.303466796875, 0.3125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 8.0, 5.0, 8.0, 26.0, 16.0, 31.0, 30.0, 25.0, 44.0, 42.0, 49.0, 48.0, 58.0, 67.0, 70.0, 55.0, 62.0, 43.0, 43.0, 42.0, 36.0, 46.0, 36.0, 26.0, 19.0, 12.0, 12.0, 8.0, 10.0, 9.0, 3.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.50390625, -0.488800048828125, -0.47369384765625, -0.458587646484375, -0.4434814453125, -0.428375244140625, -0.41326904296875, -0.398162841796875, -0.383056640625, -0.367950439453125, -0.35284423828125, -0.337738037109375, -0.3226318359375, -0.307525634765625, -0.29241943359375, -0.277313232421875, -0.26220703125, -0.247100830078125, -0.23199462890625, -0.216888427734375, -0.2017822265625, -0.186676025390625, -0.17156982421875, -0.156463623046875, -0.141357421875, -0.126251220703125, -0.11114501953125, -0.096038818359375, -0.0809326171875, -0.065826416015625, -0.05072021484375, -0.035614013671875, -0.0205078125, -0.005401611328125, 0.00970458984375, 0.024810791015625, 0.0399169921875, 0.055023193359375, 0.07012939453125, 0.085235595703125, 0.100341796875, 0.115447998046875, 0.13055419921875, 0.145660400390625, 0.1607666015625, 0.175872802734375, 0.19097900390625, 0.206085205078125, 0.22119140625, 0.236297607421875, 0.25140380859375, 0.266510009765625, 0.2816162109375, 0.296722412109375, 0.31182861328125, 0.326934814453125, 0.342041015625, 0.357147216796875, 0.37225341796875, 0.387359619140625, 0.4024658203125, 0.417572021484375, 0.43267822265625, 0.447784423828125, 0.462890625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 6.0, 16.0, 17.0, 33.0, 31.0, 42.0, 69.0, 97.0, 158.0, 221.0, 370.0, 616.0, 1136.0, 2112.0, 4125.0, 8627.0, 21913.0, 77474.0, 462809.0, 369217.0, 64244.0, 19250.0, 7884.0, 3692.0, 1825.0, 974.0, 562.0, 347.0, 249.0, 128.0, 84.0, 51.0, 51.0, 26.0, 34.0, 16.0, 9.0, 8.0, 3.0, 6.0, 8.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.046844482421875, -0.045330047607421875, -0.04381561279296875, -0.042301177978515625, -0.0407867431640625, -0.039272308349609375, -0.03775787353515625, -0.036243438720703125, -0.03472900390625, -0.033214569091796875, -0.03170013427734375, -0.030185699462890625, -0.0286712646484375, -0.027156829833984375, -0.02564239501953125, -0.024127960205078125, -0.022613525390625, -0.021099090576171875, -0.01958465576171875, -0.018070220947265625, -0.0165557861328125, -0.015041351318359375, -0.01352691650390625, -0.012012481689453125, -0.010498046875, -0.008983612060546875, -0.00746917724609375, -0.005954742431640625, -0.0044403076171875, -0.002925872802734375, -0.00141143798828125, 0.000102996826171875, 0.001617431640625, 0.003131866455078125, 0.00464630126953125, 0.006160736083984375, 0.0076751708984375, 0.009189605712890625, 0.01070404052734375, 0.012218475341796875, 0.01373291015625, 0.015247344970703125, 0.01676177978515625, 0.018276214599609375, 0.0197906494140625, 0.021305084228515625, 0.02281951904296875, 0.024333953857421875, 0.025848388671875, 0.027362823486328125, 0.02887725830078125, 0.030391693115234375, 0.0319061279296875, 0.033420562744140625, 0.03493499755859375, 0.036449432373046875, 0.0379638671875, 0.039478302001953125, 0.04099273681640625, 0.042507171630859375, 0.0440216064453125, 0.045536041259765625, 0.04705047607421875, 0.048564910888671875, 0.050079345703125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 7.0, 9.0, 20.0, 24.0, 38.0, 70.0, 106.0, 157.0, 174.0, 140.0, 82.0, 66.0, 27.0, 14.0, 16.0, 10.0, 6.0, 8.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.029273986816406e-05, -3.904476761817932e-05, -3.779679536819458e-05, -3.654882311820984e-05, -3.53008508682251e-05, -3.4052878618240356e-05, -3.2804906368255615e-05, -3.1556934118270874e-05, -3.0308961868286133e-05, -2.906098961830139e-05, -2.781301736831665e-05, -2.656504511833191e-05, -2.5317072868347168e-05, -2.4069100618362427e-05, -2.2821128368377686e-05, -2.1573156118392944e-05, -2.0325183868408203e-05, -1.9077211618423462e-05, -1.782923936843872e-05, -1.658126711845398e-05, -1.5333294868469238e-05, -1.4085322618484497e-05, -1.2837350368499756e-05, -1.1589378118515015e-05, -1.0341405868530273e-05, -9.093433618545532e-06, -7.845461368560791e-06, -6.59748911857605e-06, -5.349516868591309e-06, -4.101544618606567e-06, -2.853572368621826e-06, -1.605600118637085e-06, -3.5762786865234375e-07, 8.903443813323975e-07, 2.1383166313171387e-06, 3.38628888130188e-06, 4.634261131286621e-06, 5.882233381271362e-06, 7.1302056312561035e-06, 8.378177881240845e-06, 9.626150131225586e-06, 1.0874122381210327e-05, 1.2122094631195068e-05, 1.337006688117981e-05, 1.461803913116455e-05, 1.5866011381149292e-05, 1.7113983631134033e-05, 1.8361955881118774e-05, 1.9609928131103516e-05, 2.0857900381088257e-05, 2.2105872631072998e-05, 2.335384488105774e-05, 2.460181713104248e-05, 2.584978938102722e-05, 2.7097761631011963e-05, 2.8345733880996704e-05, 2.9593706130981445e-05, 3.0841678380966187e-05, 3.208965063095093e-05, 3.333762288093567e-05, 3.458559513092041e-05, 3.583356738090515e-05, 3.708153963088989e-05, 3.8329511880874634e-05, 3.9577484130859375e-05]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 9.0, 7.0, 18.0, 27.0, 60.0, 127.0, 316.0, 1329.0, 8343.0, 139053.0, 865889.0, 29092.0, 3271.0, 610.0, 203.0, 85.0, 40.0, 29.0, 15.0, 11.0, 3.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1500244140625, -0.14577007293701172, -0.14151573181152344, -0.13726139068603516, -0.13300704956054688, -0.1287527084350586, -0.12449836730957031, -0.12024402618408203, -0.11598968505859375, -0.11173534393310547, -0.10748100280761719, -0.1032266616821289, -0.09897232055664062, -0.09471797943115234, -0.09046363830566406, -0.08620929718017578, -0.0819549560546875, -0.07770061492919922, -0.07344627380371094, -0.06919193267822266, -0.06493759155273438, -0.060683250427246094, -0.05642890930175781, -0.05217456817626953, -0.04792022705078125, -0.04366588592529297, -0.03941154479980469, -0.035157203674316406, -0.030902862548828125, -0.026648521423339844, -0.022394180297851562, -0.01813983917236328, -0.013885498046875, -0.009631156921386719, -0.0053768157958984375, -0.0011224746704101562, 0.003131866455078125, 0.007386207580566406, 0.011640548706054688, 0.01589488983154297, 0.02014923095703125, 0.02440357208251953, 0.028657913208007812, 0.032912254333496094, 0.037166595458984375, 0.041420936584472656, 0.04567527770996094, 0.04992961883544922, 0.0541839599609375, 0.05843830108642578, 0.06269264221191406, 0.06694698333740234, 0.07120132446289062, 0.0754556655883789, 0.07971000671386719, 0.08396434783935547, 0.08821868896484375, 0.09247303009033203, 0.09672737121582031, 0.1009817123413086, 0.10523605346679688, 0.10949039459228516, 0.11374473571777344, 0.11799907684326172, 0.12225341796875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 5.0, 1.0, 3.0, 3.0, 5.0, 5.0, 10.0, 9.0, 9.0, 18.0, 15.0, 10.0, 23.0, 40.0, 24.0, 48.0, 46.0, 55.0, 75.0, 70.0, 73.0, 72.0, 69.0, 44.0, 45.0, 40.0, 29.0, 25.0, 30.0, 16.0, 19.0, 18.0, 13.0, 5.0, 8.0, 3.0, 3.0, 5.0, 3.0, 1.0, 4.0, 0.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.01088714599609375, -0.010561227798461914, -0.010235309600830078, -0.009909391403198242, -0.009583473205566406, -0.00925755500793457, -0.008931636810302734, -0.008605718612670898, -0.008279800415039062, -0.007953882217407227, -0.007627964019775391, -0.007302045822143555, -0.006976127624511719, -0.006650209426879883, -0.006324291229248047, -0.005998373031616211, -0.005672454833984375, -0.005346536636352539, -0.005020618438720703, -0.004694700241088867, -0.004368782043457031, -0.004042863845825195, -0.0037169456481933594, -0.0033910274505615234, -0.0030651092529296875, -0.0027391910552978516, -0.0024132728576660156, -0.0020873546600341797, -0.0017614364624023438, -0.0014355182647705078, -0.0011096000671386719, -0.0007836818695068359, -0.000457763671875, -0.00013184547424316406, 0.00019407272338867188, 0.0005199909210205078, 0.0008459091186523438, 0.0011718273162841797, 0.0014977455139160156, 0.0018236637115478516, 0.0021495819091796875, 0.0024755001068115234, 0.0028014183044433594, 0.0031273365020751953, 0.0034532546997070312, 0.003779172897338867, 0.004105091094970703, 0.004431009292602539, 0.004756927490234375, 0.005082845687866211, 0.005408763885498047, 0.005734682083129883, 0.006060600280761719, 0.006386518478393555, 0.006712436676025391, 0.0070383548736572266, 0.0073642730712890625, 0.0076901912689208984, 0.008016109466552734, 0.00834202766418457, 0.008667945861816406, 0.008993864059448242, 0.009319782257080078, 0.009645700454711914, 0.00997161865234375]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 12.0, 11.0, 14.0, 13.0, 21.0, 24.0, 45.0, 55.0, 72.0, 112.0, 113.0, 129.0, 107.0, 64.0, 41.0, 47.0, 31.0, 21.0, 16.0, 9.0, 8.0, 5.0, 8.0, 2.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3130538761615753, -0.30230289697647095, -0.29155194759368896, -0.2808009684085846, -0.2700500190258026, -0.25929903984069824, -0.24854807555675507, -0.2377971112728119, -0.2270461469888687, -0.21629518270492554, -0.20554421842098236, -0.19479325413703918, -0.18404227495193481, -0.17329132556915283, -0.16254034638404846, -0.15178938210010529, -0.1410384178161621, -0.13028745353221893, -0.11953648924827576, -0.10878551751375198, -0.09803455322980881, -0.08728358894586563, -0.07653261721134186, -0.06578165292739868, -0.055030688643455505, -0.04427972435951233, -0.033528756350278854, -0.02277778834104538, -0.012026824057102203, -0.001275859773159027, 0.009475111961364746, 0.020226076245307922, 0.03097701072692871, 0.04172797501087189, 0.05247894302010536, 0.06322991102933884, 0.07398087531328201, 0.08473183959722519, 0.09548281133174896, 0.10623377561569214, 0.11698473989963531, 0.1277357041835785, 0.13848666846752167, 0.14923763275146484, 0.1599886119365692, 0.1707395613193512, 0.18149054050445557, 0.19224150478839874, 0.20299246907234192, 0.2137434333562851, 0.22449439764022827, 0.23524537682533264, 0.24599632620811462, 0.256747305393219, 0.267498254776001, 0.27824923396110535, 0.2890002131462097, 0.2997511923313141, 0.31050214171409607, 0.32125312089920044, 0.3320040702819824, 0.3427550494670868, 0.35350602865219116, 0.36425697803497314, 0.3750079274177551]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 9.0, 11.0, 10.0, 21.0, 10.0, 20.0, 20.0, 35.0, 21.0, 39.0, 52.0, 51.0, 61.0, 52.0, 47.0, 70.0, 65.0, 67.0, 47.0, 48.0, 46.0, 43.0, 31.0, 29.0, 23.0, 24.0, 9.0, 13.0, 8.0, 8.0, 4.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23378704488277435, -0.2255488783121109, -0.21731069684028625, -0.2090725302696228, -0.20083436369895935, -0.1925961971282959, -0.18435801565647125, -0.1761198490858078, -0.16788166761398315, -0.1596435010433197, -0.15140531957149506, -0.1431671530008316, -0.13492898643016815, -0.1266908049583435, -0.11845263838768005, -0.1102144718170166, -0.10197630524635315, -0.0937381312251091, -0.08549996465444565, -0.0772617906332016, -0.06902362406253815, -0.0607854500412941, -0.05254727602005005, -0.0443091057240963, -0.03607093542814255, -0.027832765132188797, -0.019594592973589897, -0.011356420814990997, -0.0031182505190372467, 0.005119919776916504, 0.013358093798160553, 0.021596264094114304, 0.029834449291229248, 0.038072619587183, 0.04631078988313675, 0.0545489639043808, 0.06278713047504425, 0.0710253044962883, 0.07926347851753235, 0.0875016450881958, 0.09573981910943985, 0.1039779931306839, 0.11221615970134735, 0.1204543337225914, 0.12869250774383545, 0.1369306743144989, 0.14516884088516235, 0.153407022356987, 0.16164518892765045, 0.1698833554983139, 0.17812153697013855, 0.186359703540802, 0.19459787011146545, 0.2028360366821289, 0.21107421815395355, 0.219312384724617, 0.22755056619644165, 0.2357887327671051, 0.24402691423892975, 0.2522650957107544, 0.26050326228141785, 0.2687414288520813, 0.27697959542274475, 0.2852177619934082, 0.29345592856407166]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 2.0, 9.0, 6.0, 13.0, 22.0, 36.0, 37.0, 58.0, 94.0, 140.0, 195.0, 277.0, 422.0, 728.0, 1172.0, 1996.0, 3694.0, 7413.0, 16022.0, 39532.0, 115221.0, 402043.0, 311053.0, 88605.0, 32041.0, 13562.0, 6249.0, 3267.0, 1805.0, 1009.0, 592.0, 428.0, 257.0, 167.0, 103.0, 73.0, 63.0, 43.0, 40.0, 23.0, 9.0, 11.0, 6.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10504150390625, -0.10164070129394531, -0.09823989868164062, -0.09483909606933594, -0.09143829345703125, -0.08803749084472656, -0.08463668823242188, -0.08123588562011719, -0.0778350830078125, -0.07443428039550781, -0.07103347778320312, -0.06763267517089844, -0.06423187255859375, -0.06083106994628906, -0.057430267333984375, -0.05402946472167969, -0.050628662109375, -0.04722785949707031, -0.043827056884765625, -0.04042625427246094, -0.03702545166015625, -0.03362464904785156, -0.030223846435546875, -0.026823043823242188, -0.0234222412109375, -0.020021438598632812, -0.016620635986328125, -0.013219833374023438, -0.00981903076171875, -0.0064182281494140625, -0.003017425537109375, 0.0003833770751953125, 0.0037841796875, 0.0071849822998046875, 0.010585784912109375, 0.013986587524414062, 0.01738739013671875, 0.020788192749023438, 0.024188995361328125, 0.027589797973632812, 0.0309906005859375, 0.03439140319824219, 0.037792205810546875, 0.04119300842285156, 0.04459381103515625, 0.04799461364746094, 0.051395416259765625, 0.05479621887207031, 0.058197021484375, 0.06159782409667969, 0.06499862670898438, 0.06839942932128906, 0.07180023193359375, 0.07520103454589844, 0.07860183715820312, 0.08200263977050781, 0.0854034423828125, 0.08880424499511719, 0.09220504760742188, 0.09560585021972656, 0.09900665283203125, 0.10240745544433594, 0.10580825805664062, 0.10920906066894531, 0.11260986328125]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 6.0, 2.0, 6.0, 7.0, 5.0, 11.0, 17.0, 18.0, 27.0, 14.0, 29.0, 31.0, 36.0, 37.0, 47.0, 47.0, 49.0, 36.0, 50.0, 63.0, 63.0, 61.0, 53.0, 52.0, 27.0, 37.0, 27.0, 27.0, 21.0, 16.0, 14.0, 14.0, 13.0, 7.0, 8.0, 10.0, 2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.62158203125, -0.603240966796875, -0.58489990234375, -0.566558837890625, -0.5482177734375, -0.529876708984375, -0.51153564453125, -0.493194580078125, -0.474853515625, -0.456512451171875, -0.43817138671875, -0.419830322265625, -0.4014892578125, -0.383148193359375, -0.36480712890625, -0.346466064453125, -0.328125, -0.309783935546875, -0.29144287109375, -0.273101806640625, -0.2547607421875, -0.236419677734375, -0.21807861328125, -0.199737548828125, -0.181396484375, -0.163055419921875, -0.14471435546875, -0.126373291015625, -0.1080322265625, -0.089691162109375, -0.07135009765625, -0.053009033203125, -0.03466796875, -0.016326904296875, 0.00201416015625, 0.020355224609375, 0.0386962890625, 0.057037353515625, 0.07537841796875, 0.093719482421875, 0.112060546875, 0.130401611328125, 0.14874267578125, 0.167083740234375, 0.1854248046875, 0.203765869140625, 0.22210693359375, 0.240447998046875, 0.2587890625, 0.277130126953125, 0.29547119140625, 0.313812255859375, 0.3321533203125, 0.350494384765625, 0.36883544921875, 0.387176513671875, 0.405517578125, 0.423858642578125, 0.44219970703125, 0.460540771484375, 0.4788818359375, 0.497222900390625, 0.51556396484375, 0.533905029296875, 0.55224609375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 2.0, 9.0, 10.0, 10.0, 6.0, 20.0, 21.0, 25.0, 31.0, 23.0, 29.0, 37.0, 26.0, 37.0, 43.0, 48.0, 67.0, 374.0, 1043886.0, 3353.0, 78.0, 45.0, 35.0, 42.0, 45.0, 35.0, 29.0, 30.0, 23.0, 16.0, 20.0, 19.0, 15.0, 7.0, 9.0, 7.0, 9.0, 8.0, 5.0, 7.0, 3.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0], "bins": [-2.23828125, -2.171844482421875, -2.10540771484375, -2.038970947265625, -1.9725341796875, -1.906097412109375, -1.83966064453125, -1.773223876953125, -1.706787109375, -1.640350341796875, -1.57391357421875, -1.507476806640625, -1.4410400390625, -1.374603271484375, -1.30816650390625, -1.241729736328125, -1.17529296875, -1.108856201171875, -1.04241943359375, -0.975982666015625, -0.9095458984375, -0.843109130859375, -0.77667236328125, -0.710235595703125, -0.643798828125, -0.577362060546875, -0.51092529296875, -0.444488525390625, -0.3780517578125, -0.311614990234375, -0.24517822265625, -0.178741455078125, -0.1123046875, -0.045867919921875, 0.02056884765625, 0.087005615234375, 0.1534423828125, 0.219879150390625, 0.28631591796875, 0.352752685546875, 0.419189453125, 0.485626220703125, 0.55206298828125, 0.618499755859375, 0.6849365234375, 0.751373291015625, 0.81781005859375, 0.884246826171875, 0.95068359375, 1.017120361328125, 1.08355712890625, 1.149993896484375, 1.2164306640625, 1.282867431640625, 1.34930419921875, 1.415740966796875, 1.482177734375, 1.548614501953125, 1.61505126953125, 1.681488037109375, 1.7479248046875, 1.814361572265625, 1.88079833984375, 1.947235107421875, 2.013671875]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 3.0, 10.0, 11.0, 9.0, 10.0, 21.0, 23.0, 30.0, 28.0, 28.0, 42.0, 28.0, 34.0, 37.0, 51.0, 43.0, 41.0, 56.0, 50.0, 32.0, 42.0, 30.0, 38.0, 42.0, 36.0, 44.0, 22.0, 21.0, 17.0, 14.0, 21.0, 10.0, 11.0, 13.0, 11.0, 4.0, 4.0, 7.0, 8.0, 4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0], "bins": [-0.54345703125, -0.5277862548828125, -0.512115478515625, -0.4964447021484375, -0.48077392578125, -0.4651031494140625, -0.449432373046875, -0.4337615966796875, -0.4180908203125, -0.4024200439453125, -0.386749267578125, -0.3710784912109375, -0.35540771484375, -0.3397369384765625, -0.324066162109375, -0.3083953857421875, -0.292724609375, -0.2770538330078125, -0.261383056640625, -0.2457122802734375, -0.23004150390625, -0.2143707275390625, -0.198699951171875, -0.1830291748046875, -0.1673583984375, -0.1516876220703125, -0.136016845703125, -0.1203460693359375, -0.10467529296875, -0.0890045166015625, -0.073333740234375, -0.0576629638671875, -0.0419921875, -0.0263214111328125, -0.010650634765625, 0.0050201416015625, 0.02069091796875, 0.0363616943359375, 0.052032470703125, 0.0677032470703125, 0.0833740234375, 0.0990447998046875, 0.114715576171875, 0.1303863525390625, 0.14605712890625, 0.1617279052734375, 0.177398681640625, 0.1930694580078125, 0.208740234375, 0.2244110107421875, 0.240081787109375, 0.2557525634765625, 0.27142333984375, 0.2870941162109375, 0.302764892578125, 0.3184356689453125, 0.3341064453125, 0.3497772216796875, 0.365447998046875, 0.3811187744140625, 0.39678955078125, 0.4124603271484375, 0.428131103515625, 0.4438018798828125, 0.45947265625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 7.0, 4.0, 3.0, 8.0, 5.0, 17.0, 16.0, 37.0, 52.0, 149.0, 320.0, 1250.0, 11520.0, 952338.0, 78973.0, 2863.0, 557.0, 179.0, 102.0, 46.0, 37.0, 20.0, 13.0, 8.0, 6.0, 5.0, 6.0, 5.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1253662109375, -0.11932182312011719, -0.11327743530273438, -0.10723304748535156, -0.10118865966796875, -0.09514427185058594, -0.08909988403320312, -0.08305549621582031, -0.0770111083984375, -0.07096672058105469, -0.06492233276367188, -0.05887794494628906, -0.05283355712890625, -0.04678916931152344, -0.040744781494140625, -0.03470039367675781, -0.028656005859375, -0.022611618041992188, -0.016567230224609375, -0.010522842407226562, -0.00447845458984375, 0.0015659332275390625, 0.007610321044921875, 0.013654708862304688, 0.0196990966796875, 0.025743484497070312, 0.031787872314453125, 0.03783226013183594, 0.04387664794921875, 0.04992103576660156, 0.055965423583984375, 0.06200981140136719, 0.06805419921875, 0.07409858703613281, 0.08014297485351562, 0.08618736267089844, 0.09223175048828125, 0.09827613830566406, 0.10432052612304688, 0.11036491394042969, 0.1164093017578125, 0.12245368957519531, 0.12849807739257812, 0.13454246520996094, 0.14058685302734375, 0.14663124084472656, 0.15267562866210938, 0.1587200164794922, 0.164764404296875, 0.1708087921142578, 0.17685317993164062, 0.18289756774902344, 0.18894195556640625, 0.19498634338378906, 0.20103073120117188, 0.2070751190185547, 0.2131195068359375, 0.2191638946533203, 0.22520828247070312, 0.23125267028808594, 0.23729705810546875, 0.24334144592285156, 0.24938583374023438, 0.2554302215576172, 0.261474609375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 9.0, 5.0, 3.0, 3.0, 7.0, 10.0, 7.0, 11.0, 26.0, 31.0, 30.0, 49.0, 66.0, 111.0, 129.0, 137.0, 104.0, 81.0, 48.0, 35.0, 30.0, 18.0, 10.0, 7.0, 8.0, 3.0, 7.0, 4.0, 1.0, 3.0, 4.0, 5.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.0311603546142578e-05, -1.0007061064243317e-05, -9.702518582344055e-06, -9.397976100444794e-06, -9.093433618545532e-06, -8.78889113664627e-06, -8.48434865474701e-06, -8.179806172847748e-06, -7.875263690948486e-06, -7.570721209049225e-06, -7.266178727149963e-06, -6.961636245250702e-06, -6.6570937633514404e-06, -6.352551281452179e-06, -6.0480087995529175e-06, -5.743466317653656e-06, -5.4389238357543945e-06, -5.134381353855133e-06, -4.829838871955872e-06, -4.52529639005661e-06, -4.220753908157349e-06, -3.916211426258087e-06, -3.6116689443588257e-06, -3.307126462459564e-06, -3.0025839805603027e-06, -2.6980414986610413e-06, -2.3934990167617798e-06, -2.0889565348625183e-06, -1.7844140529632568e-06, -1.4798715710639954e-06, -1.1753290891647339e-06, -8.707866072654724e-07, -5.662441253662109e-07, -2.6170164346694946e-07, 4.284083843231201e-08, 3.473833203315735e-07, 6.51925802230835e-07, 9.564682841300964e-07, 1.261010766029358e-06, 1.5655532479286194e-06, 1.8700957298278809e-06, 2.1746382117271423e-06, 2.479180693626404e-06, 2.7837231755256653e-06, 3.0882656574249268e-06, 3.3928081393241882e-06, 3.6973506212234497e-06, 4.001893103122711e-06, 4.306435585021973e-06, 4.610978066921234e-06, 4.915520548820496e-06, 5.220063030719757e-06, 5.5246055126190186e-06, 5.82914799451828e-06, 6.1336904764175415e-06, 6.438232958316803e-06, 6.7427754402160645e-06, 7.047317922115326e-06, 7.351860404014587e-06, 7.656402885913849e-06, 7.96094536781311e-06, 8.265487849712372e-06, 8.570030331611633e-06, 8.874572813510895e-06, 9.179115295410156e-06]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 7.0, 7.0, 6.0, 18.0, 10.0, 24.0, 45.0, 67.0, 107.0, 203.0, 442.0, 921.0, 2390.0, 7765.0, 40146.0, 751812.0, 215915.0, 20373.0, 4933.0, 1802.0, 714.0, 370.0, 207.0, 107.0, 58.0, 36.0, 23.0, 12.0, 10.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.1103515625, -0.10735416412353516, -0.10435676574707031, -0.10135936737060547, -0.09836196899414062, -0.09536457061767578, -0.09236717224121094, -0.0893697738647461, -0.08637237548828125, -0.0833749771118164, -0.08037757873535156, -0.07738018035888672, -0.07438278198242188, -0.07138538360595703, -0.06838798522949219, -0.06539058685302734, -0.0623931884765625, -0.059395790100097656, -0.05639839172363281, -0.05340099334716797, -0.050403594970703125, -0.04740619659423828, -0.04440879821777344, -0.041411399841308594, -0.03841400146484375, -0.035416603088378906, -0.03241920471191406, -0.02942180633544922, -0.026424407958984375, -0.02342700958251953, -0.020429611206054688, -0.017432212829589844, -0.014434814453125, -0.011437416076660156, -0.008440017700195312, -0.005442619323730469, -0.002445220947265625, 0.0005521774291992188, 0.0035495758056640625, 0.006546974182128906, 0.00954437255859375, 0.012541770935058594, 0.015539169311523438, 0.01853656768798828, 0.021533966064453125, 0.02453136444091797, 0.027528762817382812, 0.030526161193847656, 0.0335235595703125, 0.036520957946777344, 0.03951835632324219, 0.04251575469970703, 0.045513153076171875, 0.04851055145263672, 0.05150794982910156, 0.054505348205566406, 0.05750274658203125, 0.060500144958496094, 0.06349754333496094, 0.06649494171142578, 0.06949234008789062, 0.07248973846435547, 0.07548713684082031, 0.07848453521728516, 0.08148193359375]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 7.0, 4.0, 7.0, 5.0, 4.0, 13.0, 19.0, 24.0, 18.0, 32.0, 64.0, 99.0, 104.0, 209.0, 114.0, 92.0, 58.0, 34.0, 27.0, 23.0, 14.0, 5.0, 10.0, 6.0, 5.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.021820068359375, -0.020803451538085938, -0.019786834716796875, -0.018770217895507812, -0.01775360107421875, -0.016736984252929688, -0.015720367431640625, -0.014703750610351562, -0.0136871337890625, -0.012670516967773438, -0.011653900146484375, -0.010637283325195312, -0.00962066650390625, -0.008604049682617188, -0.007587432861328125, -0.0065708160400390625, -0.00555419921875, -0.0045375823974609375, -0.003520965576171875, -0.0025043487548828125, -0.00148773193359375, -0.0004711151123046875, 0.000545501708984375, 0.0015621185302734375, 0.0025787353515625, 0.0035953521728515625, 0.004611968994140625, 0.0056285858154296875, 0.00664520263671875, 0.0076618194580078125, 0.008678436279296875, 0.009695053100585938, 0.010711669921875, 0.011728286743164062, 0.012744903564453125, 0.013761520385742188, 0.01477813720703125, 0.015794754028320312, 0.016811370849609375, 0.017827987670898438, 0.0188446044921875, 0.019861221313476562, 0.020877838134765625, 0.021894454956054688, 0.02291107177734375, 0.023927688598632812, 0.024944305419921875, 0.025960922241210938, 0.0269775390625, 0.027994155883789062, 0.029010772705078125, 0.030027389526367188, 0.03104400634765625, 0.03206062316894531, 0.033077239990234375, 0.03409385681152344, 0.0351104736328125, 0.03612709045410156, 0.037143707275390625, 0.03816032409667969, 0.03917694091796875, 0.04019355773925781, 0.041210174560546875, 0.04222679138183594, 0.043243408203125]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 9.0, 30.0, 63.0, 198.0, 349.0, 213.0, 82.0, 30.0, 18.0, 4.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.687655448913574, -2.624556064605713, -2.5614569187164307, -2.4983575344085693, -2.435258150100708, -2.372159004211426, -2.3090596199035645, -2.245960235595703, -2.182861089706421, -2.1197617053985596, -2.0566625595092773, -1.993563175201416, -1.9304639101028442, -1.8673646450042725, -1.8042652606964111, -1.7411659955978394, -1.678066611289978, -1.6149673461914062, -1.551867961883545, -1.4887686967849731, -1.4256694316864014, -1.36257004737854, -1.2994707822799683, -1.2363715171813965, -1.1732721328735352, -1.1101728677749634, -1.047073483467102, -0.9839742183685303, -0.9208749532699585, -0.8577756285667419, -0.7946763038635254, -0.7315770387649536, -0.6684778928756714, -0.6053785681724548, -0.5422793030738831, -0.4791799783706665, -0.41608068346977234, -0.3529813885688782, -0.2898820638656616, -0.22678276896476746, -0.1636834740638733, -0.10058417171239853, -0.03748486936092377, 0.025614440441131592, 0.08871373534202576, 0.15181303024291992, 0.21491235494613647, 0.27801164984703064, 0.3411109447479248, 0.40421023964881897, 0.46730953454971313, 0.5304088592529297, 0.5935081243515015, 0.656607449054718, 0.7197067737579346, 0.7828060388565063, 0.8459053635597229, 0.9090046882629395, 0.9721039533615112, 1.035203218460083, 1.0983026027679443, 1.1614018678665161, 1.224501132965088, 1.2876005172729492, 1.350699782371521]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 6.0, 4.0, 5.0, 11.0, 11.0, 12.0, 9.0, 20.0, 23.0, 27.0, 24.0, 26.0, 40.0, 38.0, 37.0, 37.0, 35.0, 53.0, 42.0, 48.0, 43.0, 48.0, 43.0, 48.0, 37.0, 32.0, 37.0, 26.0, 35.0, 20.0, 32.0, 24.0, 15.0, 16.0, 15.0, 8.0, 3.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8283340334892273, -0.8035085797309875, -0.7786831855773926, -0.7538577318191528, -0.7290323376655579, -0.7042068839073181, -0.6793814897537231, -0.6545560359954834, -0.6297305822372437, -0.6049051284790039, -0.5800797343254089, -0.5552542805671692, -0.5304288864135742, -0.5056034326553345, -0.4807780086994171, -0.45595258474349976, -0.4311271905899048, -0.4063017666339874, -0.38147634267807007, -0.3566508889198303, -0.33182549476623535, -0.3070000410079956, -0.28217461705207825, -0.2573491930961609, -0.23252376914024353, -0.20769834518432617, -0.1828729212284088, -0.15804748237133026, -0.1332220584154129, -0.10839663445949554, -0.08357119560241699, -0.058745771646499634, -0.033920347690582275, -0.009094920009374619, 0.01573050767183304, 0.040555939078330994, 0.06538136303424835, 0.09020678699016571, 0.11503222584724426, 0.13985764980316162, 0.16468307375907898, 0.18950849771499634, 0.2143339216709137, 0.23915936052799225, 0.2639847993850708, 0.28881019353866577, 0.3136356472969055, 0.3384610712528229, 0.36328649520874023, 0.3881119191646576, 0.41293734312057495, 0.4377627968788147, 0.46258819103240967, 0.4874136447906494, 0.5122390985488892, 0.5370644927024841, 0.5618898868560791, 0.5867153406143188, 0.6115407347679138, 0.6363661885261536, 0.6611915826797485, 0.6860170364379883, 0.710842490196228, 0.735667884349823, 0.7604933381080627]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 5.0, 5.0, 4.0, 9.0, 10.0, 15.0, 20.0, 21.0, 38.0, 38.0, 65.0, 106.0, 173.0, 271.0, 447.0, 826.0, 1448.0, 3037.0, 6493.0, 19750.0, 170285.0, 3270290.0, 668688.0, 34601.0, 9210.0, 3880.0, 1998.0, 1010.0, 605.0, 323.0, 226.0, 140.0, 82.0, 64.0, 35.0, 25.0, 14.0, 9.0, 6.0, 8.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7021484375, -0.67999267578125, -0.6578369140625, -0.63568115234375, -0.613525390625, -0.59136962890625, -0.5692138671875, -0.54705810546875, -0.52490234375, -0.50274658203125, -0.4805908203125, -0.45843505859375, -0.436279296875, -0.41412353515625, -0.3919677734375, -0.36981201171875, -0.34765625, -0.32550048828125, -0.3033447265625, -0.28118896484375, -0.259033203125, -0.23687744140625, -0.2147216796875, -0.19256591796875, -0.17041015625, -0.14825439453125, -0.1260986328125, -0.10394287109375, -0.081787109375, -0.05963134765625, -0.0374755859375, -0.01531982421875, 0.0068359375, 0.02899169921875, 0.0511474609375, 0.07330322265625, 0.095458984375, 0.11761474609375, 0.1397705078125, 0.16192626953125, 0.18408203125, 0.20623779296875, 0.2283935546875, 0.25054931640625, 0.272705078125, 0.29486083984375, 0.3170166015625, 0.33917236328125, 0.361328125, 0.38348388671875, 0.4056396484375, 0.42779541015625, 0.449951171875, 0.47210693359375, 0.4942626953125, 0.51641845703125, 0.53857421875, 0.56072998046875, 0.5828857421875, 0.60504150390625, 0.627197265625, 0.64935302734375, 0.6715087890625, 0.69366455078125, 0.7158203125]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 5.0, 5.0, 11.0, 6.0, 8.0, 13.0, 12.0, 14.0, 19.0, 17.0, 26.0, 31.0, 43.0, 42.0, 62.0, 56.0, 57.0, 65.0, 47.0, 67.0, 52.0, 51.0, 39.0, 33.0, 44.0, 42.0, 25.0, 27.0, 27.0, 14.0, 12.0, 7.0, 7.0, 6.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.302978515625, -0.2938880920410156, -0.28479766845703125, -0.2757072448730469, -0.2666168212890625, -0.2575263977050781, -0.24843597412109375, -0.23934555053710938, -0.230255126953125, -0.22116470336914062, -0.21207427978515625, -0.20298385620117188, -0.1938934326171875, -0.18480300903320312, -0.17571258544921875, -0.16662216186523438, -0.15753173828125, -0.14844131469726562, -0.13935089111328125, -0.13026046752929688, -0.1211700439453125, -0.11207962036132812, -0.10298919677734375, -0.09389877319335938, -0.084808349609375, -0.07571792602539062, -0.06662750244140625, -0.057537078857421875, -0.0484466552734375, -0.039356231689453125, -0.03026580810546875, -0.021175384521484375, -0.0120849609375, -0.002994537353515625, 0.00609588623046875, 0.015186309814453125, 0.0242767333984375, 0.033367156982421875, 0.04245758056640625, 0.051548004150390625, 0.060638427734375, 0.06972885131835938, 0.07881927490234375, 0.08790969848632812, 0.0970001220703125, 0.10609054565429688, 0.11518096923828125, 0.12427139282226562, 0.13336181640625, 0.14245223999023438, 0.15154266357421875, 0.16063308715820312, 0.1697235107421875, 0.17881393432617188, 0.18790435791015625, 0.19699478149414062, 0.206085205078125, 0.21517562866210938, 0.22426605224609375, 0.23335647583007812, 0.2424468994140625, 0.2515373229980469, 0.26062774658203125, 0.2697181701660156, 0.27880859375]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 4.0, 11.0, 9.0, 8.0, 6.0, 11.0, 19.0, 25.0, 29.0, 56.0, 101.0, 187.0, 657.0, 3553.0, 69914.0, 4088250.0, 28278.0, 2256.0, 488.0, 167.0, 75.0, 49.0, 39.0, 29.0, 11.0, 5.0, 9.0, 10.0, 5.0, 2.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4072265625, -1.3576507568359375, -1.308074951171875, -1.2584991455078125, -1.20892333984375, -1.1593475341796875, -1.109771728515625, -1.0601959228515625, -1.0106201171875, -0.9610443115234375, -0.911468505859375, -0.8618927001953125, -0.81231689453125, -0.7627410888671875, -0.713165283203125, -0.6635894775390625, -0.614013671875, -0.5644378662109375, -0.514862060546875, -0.4652862548828125, -0.41571044921875, -0.3661346435546875, -0.316558837890625, -0.2669830322265625, -0.2174072265625, -0.1678314208984375, -0.118255615234375, -0.0686798095703125, -0.01910400390625, 0.0304718017578125, 0.080047607421875, 0.1296234130859375, 0.17919921875, 0.2287750244140625, 0.278350830078125, 0.3279266357421875, 0.37750244140625, 0.4270782470703125, 0.476654052734375, 0.5262298583984375, 0.5758056640625, 0.6253814697265625, 0.674957275390625, 0.7245330810546875, 0.77410888671875, 0.8236846923828125, 0.873260498046875, 0.9228363037109375, 0.972412109375, 1.0219879150390625, 1.071563720703125, 1.1211395263671875, 1.17071533203125, 1.2202911376953125, 1.269866943359375, 1.3194427490234375, 1.3690185546875, 1.4185943603515625, 1.468170166015625, 1.5177459716796875, 1.56732177734375, 1.6168975830078125, 1.666473388671875, 1.7160491943359375, 1.765625]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 3.0, 6.0, 9.0, 7.0, 8.0, 14.0, 22.0, 31.0, 52.0, 49.0, 89.0, 165.0, 328.0, 624.0, 1000.0, 753.0, 386.0, 207.0, 92.0, 54.0, 49.0, 24.0, 16.0, 15.0, 12.0, 8.0, 5.0, 8.0, 10.0, 8.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.1834716796875, -0.17847251892089844, -0.17347335815429688, -0.1684741973876953, -0.16347503662109375, -0.1584758758544922, -0.15347671508789062, -0.14847755432128906, -0.1434783935546875, -0.13847923278808594, -0.13348007202148438, -0.1284809112548828, -0.12348175048828125, -0.11848258972167969, -0.11348342895507812, -0.10848426818847656, -0.103485107421875, -0.09848594665527344, -0.09348678588867188, -0.08848762512207031, -0.08348846435546875, -0.07848930358886719, -0.07349014282226562, -0.06849098205566406, -0.0634918212890625, -0.05849266052246094, -0.053493499755859375, -0.04849433898925781, -0.04349517822265625, -0.03849601745605469, -0.033496856689453125, -0.028497695922851562, -0.02349853515625, -0.018499374389648438, -0.013500213623046875, -0.008501052856445312, -0.00350189208984375, 0.0014972686767578125, 0.006496429443359375, 0.011495590209960938, 0.0164947509765625, 0.021493911743164062, 0.026493072509765625, 0.03149223327636719, 0.03649139404296875, 0.04149055480957031, 0.046489715576171875, 0.05148887634277344, 0.056488037109375, 0.06148719787597656, 0.06648635864257812, 0.07148551940917969, 0.07648468017578125, 0.08148384094238281, 0.08648300170898438, 0.09148216247558594, 0.0964813232421875, 0.10148048400878906, 0.10647964477539062, 0.11147880554199219, 0.11647796630859375, 0.12147712707519531, 0.12647628784179688, 0.13147544860839844, 0.136474609375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 5.0, 8.0, 7.0, 6.0, 17.0, 15.0, 32.0, 51.0, 67.0, 78.0, 109.0, 156.0, 116.0, 102.0, 67.0, 58.0, 42.0, 22.0, 21.0, 9.0, 6.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37770017981529236, -0.3595159947872162, -0.3413317799568176, -0.32314759492874146, -0.3049634099006653, -0.2867791950702667, -0.26859501004219055, -0.250410795211792, -0.23222661018371582, -0.21404241025447845, -0.1958582103252411, -0.17767402529716492, -0.15948982536792755, -0.14130562543869019, -0.12312143296003342, -0.10493724048137665, -0.08675304055213928, -0.06856884062290192, -0.05038464814424515, -0.03220045194029808, -0.014016255736351013, 0.0041679441928863525, 0.02235213667154312, 0.04053632915019989, 0.058720529079437256, 0.07690472900867462, 0.09508892148733139, 0.11327311396598816, 0.13145731389522552, 0.1496415138244629, 0.16782569885253906, 0.18600989878177643, 0.20419412851333618, 0.22237832844257355, 0.2405625283718109, 0.2587467133998871, 0.27693092823028564, 0.2951151132583618, 0.313299298286438, 0.33148348331451416, 0.3496676981449127, 0.3678518831729889, 0.38603609800338745, 0.4042202830314636, 0.4224044680595398, 0.44058868288993835, 0.4587728679180145, 0.4769570827484131, 0.49514126777648926, 0.5133254528045654, 0.5315096378326416, 0.5496938824653625, 0.5678780674934387, 0.5860622525215149, 0.6042464375495911, 0.6224306225776672, 0.6406148672103882, 0.6587990522384644, 0.6769832372665405, 0.6951674818992615, 0.7133516669273376, 0.7315358519554138, 0.74972003698349, 0.7679042220115662, 0.7860884070396423]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 8.0, 4.0, 4.0, 11.0, 13.0, 11.0, 9.0, 20.0, 21.0, 22.0, 38.0, 37.0, 43.0, 35.0, 32.0, 37.0, 50.0, 46.0, 44.0, 37.0, 44.0, 39.0, 34.0, 45.0, 42.0, 53.0, 30.0, 32.0, 27.0, 28.0, 20.0, 20.0, 9.0, 12.0, 14.0, 11.0, 7.0, 2.0, 3.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2518153488636017, -0.24294771254062653, -0.23408006131649017, -0.22521242499351501, -0.21634477376937866, -0.2074771374464035, -0.19860950112342834, -0.189741849899292, -0.18087421357631683, -0.17200657725334167, -0.16313892602920532, -0.15427128970623016, -0.145403653383255, -0.13653600215911865, -0.1276683658361435, -0.11880072206258774, -0.10993307828903198, -0.10106543451547623, -0.09219779074192047, -0.08333015441894531, -0.07446251064538956, -0.0655948668718338, -0.056727226823568344, -0.04785958677530289, -0.03899194300174713, -0.030124301090836525, -0.02125665917992592, -0.012389017269015312, -0.003521375358104706, 0.00534626841545105, 0.014213908463716507, 0.023081548511981964, 0.03194919228553772, 0.040816836059093475, 0.04968447610735893, 0.05855211615562439, 0.06741975992918015, 0.0762874037027359, 0.08515504002571106, 0.09402268379926682, 0.10289032757282257, 0.11175797134637833, 0.12062561511993408, 0.12949325144290924, 0.1383608877658844, 0.14722853899002075, 0.1560961753129959, 0.16496381163597107, 0.17383146286010742, 0.18269909918308258, 0.19156675040721893, 0.2004343867301941, 0.20930203795433044, 0.2181696742773056, 0.22703731060028076, 0.23590496182441711, 0.24477259814739227, 0.25364023447036743, 0.2625078856945038, 0.27137553691864014, 0.2802431583404541, 0.28911080956459045, 0.2979784607887268, 0.30684608221054077, 0.3157137334346771]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 11.0, 6.0, 17.0, 15.0, 37.0, 59.0, 109.0, 189.0, 389.0, 869.0, 2096.0, 6622.0, 27468.0, 383015.0, 583091.0, 32642.0, 7634.0, 2438.0, 976.0, 390.0, 180.0, 113.0, 71.0, 43.0, 27.0, 12.0, 12.0, 8.0, 11.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2381591796875, -0.22684669494628906, -0.21553421020507812, -0.2042217254638672, -0.19290924072265625, -0.1815967559814453, -0.17028427124023438, -0.15897178649902344, -0.1476593017578125, -0.13634681701660156, -0.12503433227539062, -0.11372184753417969, -0.10240936279296875, -0.09109687805175781, -0.07978439331054688, -0.06847190856933594, -0.057159423828125, -0.04584693908691406, -0.034534454345703125, -0.023221969604492188, -0.01190948486328125, -0.0005970001220703125, 0.010715484619140625, 0.022027969360351562, 0.0333404541015625, 0.04465293884277344, 0.055965423583984375, 0.06727790832519531, 0.07859039306640625, 0.08990287780761719, 0.10121536254882812, 0.11252784729003906, 0.12384033203125, 0.13515281677246094, 0.14646530151367188, 0.1577777862548828, 0.16909027099609375, 0.1804027557373047, 0.19171524047851562, 0.20302772521972656, 0.2143402099609375, 0.22565269470214844, 0.23696517944335938, 0.2482776641845703, 0.25959014892578125, 0.2709026336669922, 0.2822151184082031, 0.29352760314941406, 0.304840087890625, 0.31615257263183594, 0.3274650573730469, 0.3387775421142578, 0.35009002685546875, 0.3614025115966797, 0.3727149963378906, 0.38402748107910156, 0.3953399658203125, 0.40665245056152344, 0.4179649353027344, 0.4292774200439453, 0.44058990478515625, 0.4519023895263672, 0.4632148742675781, 0.47452735900878906, 0.48583984375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 2.0, 7.0, 5.0, 16.0, 14.0, 13.0, 39.0, 47.0, 61.0, 54.0, 71.0, 75.0, 78.0, 82.0, 69.0, 79.0, 78.0, 54.0, 39.0, 36.0, 32.0, 18.0, 16.0, 8.0, 6.0, 6.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1494140625, -0.14076614379882812, -0.13211822509765625, -0.12347030639648438, -0.1148223876953125, -0.10617446899414062, -0.09752655029296875, -0.08887863159179688, -0.080230712890625, -0.07158279418945312, -0.06293487548828125, -0.054286956787109375, -0.0456390380859375, -0.036991119384765625, -0.02834320068359375, -0.019695281982421875, -0.01104736328125, -0.002399444580078125, 0.00624847412109375, 0.014896392822265625, 0.0235443115234375, 0.032192230224609375, 0.04084014892578125, 0.049488067626953125, 0.058135986328125, 0.06678390502929688, 0.07543182373046875, 0.08407974243164062, 0.0927276611328125, 0.10137557983398438, 0.11002349853515625, 0.11867141723632812, 0.1273193359375, 0.13596725463867188, 0.14461517333984375, 0.15326309204101562, 0.1619110107421875, 0.17055892944335938, 0.17920684814453125, 0.18785476684570312, 0.196502685546875, 0.20515060424804688, 0.21379852294921875, 0.22244644165039062, 0.2310943603515625, 0.23974227905273438, 0.24839019775390625, 0.2570381164550781, 0.26568603515625, 0.2743339538574219, 0.28298187255859375, 0.2916297912597656, 0.3002777099609375, 0.3089256286621094, 0.31757354736328125, 0.3262214660644531, 0.334869384765625, 0.3435173034667969, 0.35216522216796875, 0.3608131408691406, 0.3694610595703125, 0.3781089782714844, 0.38675689697265625, 0.3954048156738281, 0.404052734375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 3.0, 7.0, 4.0, 4.0, 7.0, 15.0, 15.0, 17.0, 25.0, 53.0, 90.0, 140.0, 305.0, 643.0, 1651.0, 4650.0, 15976.0, 79999.0, 630864.0, 263139.0, 36709.0, 9221.0, 2919.0, 1129.0, 395.0, 230.0, 122.0, 61.0, 51.0, 30.0, 11.0, 11.0, 9.0, 8.0, 6.0, 6.0, 8.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1776123046875, -0.17235374450683594, -0.16709518432617188, -0.1618366241455078, -0.15657806396484375, -0.1513195037841797, -0.14606094360351562, -0.14080238342285156, -0.1355438232421875, -0.13028526306152344, -0.12502670288085938, -0.11976814270019531, -0.11450958251953125, -0.10925102233886719, -0.10399246215820312, -0.09873390197753906, -0.093475341796875, -0.08821678161621094, -0.08295822143554688, -0.07769966125488281, -0.07244110107421875, -0.06718254089355469, -0.061923980712890625, -0.05666542053222656, -0.0514068603515625, -0.04614830017089844, -0.040889739990234375, -0.03563117980957031, -0.03037261962890625, -0.025114059448242188, -0.019855499267578125, -0.014596939086914062, -0.00933837890625, -0.0040798187255859375, 0.001178741455078125, 0.0064373016357421875, 0.01169586181640625, 0.016954421997070312, 0.022212982177734375, 0.027471542358398438, 0.0327301025390625, 0.03798866271972656, 0.043247222900390625, 0.04850578308105469, 0.05376434326171875, 0.05902290344238281, 0.06428146362304688, 0.06954002380371094, 0.074798583984375, 0.08005714416503906, 0.08531570434570312, 0.09057426452636719, 0.09583282470703125, 0.10109138488769531, 0.10634994506835938, 0.11160850524902344, 0.1168670654296875, 0.12212562561035156, 0.12738418579101562, 0.1326427459716797, 0.13790130615234375, 0.1431598663330078, 0.14841842651367188, 0.15367698669433594, 0.158935546875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 5.0, 11.0, 6.0, 6.0, 6.0, 20.0, 16.0, 7.0, 19.0, 14.0, 28.0, 28.0, 36.0, 40.0, 40.0, 28.0, 47.0, 38.0, 43.0, 42.0, 48.0, 48.0, 57.0, 27.0, 48.0, 35.0, 38.0, 42.0, 37.0, 18.0, 25.0, 19.0, 17.0, 15.0, 13.0, 5.0, 8.0, 3.0, 5.0, 5.0, 3.0, 5.0, 4.0, 4.0, 0.0, 1.0, 2.0, 4.0], "bins": [-0.331787109375, -0.322662353515625, -0.31353759765625, -0.304412841796875, -0.2952880859375, -0.286163330078125, -0.27703857421875, -0.267913818359375, -0.2587890625, -0.249664306640625, -0.24053955078125, -0.231414794921875, -0.2222900390625, -0.213165283203125, -0.20404052734375, -0.194915771484375, -0.185791015625, -0.176666259765625, -0.16754150390625, -0.158416748046875, -0.1492919921875, -0.140167236328125, -0.13104248046875, -0.121917724609375, -0.11279296875, -0.103668212890625, -0.09454345703125, -0.085418701171875, -0.0762939453125, -0.067169189453125, -0.05804443359375, -0.048919677734375, -0.039794921875, -0.030670166015625, -0.02154541015625, -0.012420654296875, -0.0032958984375, 0.005828857421875, 0.01495361328125, 0.024078369140625, 0.033203125, 0.042327880859375, 0.05145263671875, 0.060577392578125, 0.0697021484375, 0.078826904296875, 0.08795166015625, 0.097076416015625, 0.106201171875, 0.115325927734375, 0.12445068359375, 0.133575439453125, 0.1427001953125, 0.151824951171875, 0.16094970703125, 0.170074462890625, 0.17919921875, 0.188323974609375, 0.19744873046875, 0.206573486328125, 0.2156982421875, 0.224822998046875, 0.23394775390625, 0.243072509765625, 0.252197265625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 8.0, 10.0, 12.0, 13.0, 37.0, 40.0, 49.0, 103.0, 141.0, 219.0, 388.0, 616.0, 1215.0, 2223.0, 4602.0, 10938.0, 34632.0, 172833.0, 633183.0, 139494.0, 29456.0, 9636.0, 4001.0, 1979.0, 1151.0, 582.0, 364.0, 191.0, 141.0, 91.0, 63.0, 55.0, 30.0, 14.0, 9.0, 11.0, 8.0, 4.0, 5.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0294036865234375, -0.02843785285949707, -0.02747201919555664, -0.02650618553161621, -0.02554035186767578, -0.02457451820373535, -0.023608684539794922, -0.022642850875854492, -0.021677017211914062, -0.020711183547973633, -0.019745349884033203, -0.018779516220092773, -0.017813682556152344, -0.016847848892211914, -0.015882015228271484, -0.014916181564331055, -0.013950347900390625, -0.012984514236450195, -0.012018680572509766, -0.011052846908569336, -0.010087013244628906, -0.009121179580688477, -0.008155345916748047, -0.007189512252807617, -0.0062236785888671875, -0.005257844924926758, -0.004292011260986328, -0.0033261775970458984, -0.0023603439331054688, -0.001394510269165039, -0.0004286766052246094, 0.0005371570587158203, 0.00150299072265625, 0.0024688243865966797, 0.0034346580505371094, 0.004400491714477539, 0.005366325378417969, 0.0063321590423583984, 0.007297992706298828, 0.008263826370239258, 0.009229660034179688, 0.010195493698120117, 0.011161327362060547, 0.012127161026000977, 0.013092994689941406, 0.014058828353881836, 0.015024662017822266, 0.015990495681762695, 0.016956329345703125, 0.017922163009643555, 0.018887996673583984, 0.019853830337524414, 0.020819664001464844, 0.021785497665405273, 0.022751331329345703, 0.023717164993286133, 0.024682998657226562, 0.025648832321166992, 0.026614665985107422, 0.02758049964904785, 0.02854633331298828, 0.02951216697692871, 0.03047800064086914, 0.03144383430480957, 0.03240966796875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 0.0, 4.0, 6.0, 5.0, 4.0, 8.0, 5.0, 10.0, 19.0, 24.0, 36.0, 50.0, 80.0, 96.0, 122.0, 138.0, 119.0, 75.0, 49.0, 47.0, 31.0, 18.0, 11.0, 14.0, 4.0, 7.0, 3.0, 5.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.0265579223632812e-05, -1.968909054994583e-05, -1.911260187625885e-05, -1.853611320257187e-05, -1.7959624528884888e-05, -1.7383135855197906e-05, -1.6806647181510925e-05, -1.6230158507823944e-05, -1.5653669834136963e-05, -1.5077181160449982e-05, -1.4500692486763e-05, -1.392420381307602e-05, -1.3347715139389038e-05, -1.2771226465702057e-05, -1.2194737792015076e-05, -1.1618249118328094e-05, -1.1041760444641113e-05, -1.0465271770954132e-05, -9.888783097267151e-06, -9.31229442358017e-06, -8.735805749893188e-06, -8.159317076206207e-06, -7.582828402519226e-06, -7.006339728832245e-06, -6.429851055145264e-06, -5.8533623814582825e-06, -5.276873707771301e-06, -4.70038503408432e-06, -4.123896360397339e-06, -3.5474076867103577e-06, -2.9709190130233765e-06, -2.3944303393363953e-06, -1.817941665649414e-06, -1.2414529919624329e-06, -6.649643182754517e-07, -8.847564458847046e-08, 4.880130290985107e-07, 1.064501702785492e-06, 1.6409903764724731e-06, 2.2174790501594543e-06, 2.7939677238464355e-06, 3.3704563975334167e-06, 3.946945071220398e-06, 4.523433744907379e-06, 5.09992241859436e-06, 5.6764110922813416e-06, 6.252899765968323e-06, 6.829388439655304e-06, 7.405877113342285e-06, 7.982365787029266e-06, 8.558854460716248e-06, 9.135343134403229e-06, 9.71183180809021e-06, 1.0288320481777191e-05, 1.0864809155464172e-05, 1.1441297829151154e-05, 1.2017786502838135e-05, 1.2594275176525116e-05, 1.3170763850212097e-05, 1.3747252523899078e-05, 1.432374119758606e-05, 1.490022987127304e-05, 1.5476718544960022e-05, 1.6053207218647003e-05, 1.6629695892333984e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 9.0, 13.0, 10.0, 14.0, 24.0, 32.0, 52.0, 100.0, 181.0, 458.0, 1176.0, 4146.0, 19579.0, 153131.0, 746594.0, 103078.0, 14776.0, 3433.0, 1021.0, 370.0, 148.0, 75.0, 36.0, 34.0, 18.0, 15.0, 9.0, 4.0, 8.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042816162109375, -0.041408538818359375, -0.04000091552734375, -0.038593292236328125, -0.0371856689453125, -0.035778045654296875, -0.03437042236328125, -0.032962799072265625, -0.03155517578125, -0.030147552490234375, -0.02873992919921875, -0.027332305908203125, -0.0259246826171875, -0.024517059326171875, -0.02310943603515625, -0.021701812744140625, -0.020294189453125, -0.018886566162109375, -0.01747894287109375, -0.016071319580078125, -0.0146636962890625, -0.013256072998046875, -0.01184844970703125, -0.010440826416015625, -0.009033203125, -0.007625579833984375, -0.00621795654296875, -0.004810333251953125, -0.0034027099609375, -0.001995086669921875, -0.00058746337890625, 0.000820159912109375, 0.002227783203125, 0.003635406494140625, 0.00504302978515625, 0.006450653076171875, 0.0078582763671875, 0.009265899658203125, 0.01067352294921875, 0.012081146240234375, 0.01348876953125, 0.014896392822265625, 0.01630401611328125, 0.017711639404296875, 0.0191192626953125, 0.020526885986328125, 0.02193450927734375, 0.023342132568359375, 0.024749755859375, 0.026157379150390625, 0.02756500244140625, 0.028972625732421875, 0.0303802490234375, 0.031787872314453125, 0.03319549560546875, 0.034603118896484375, 0.0360107421875, 0.037418365478515625, 0.03882598876953125, 0.040233612060546875, 0.0416412353515625, 0.043048858642578125, 0.04445648193359375, 0.045864105224609375, 0.047271728515625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 3.0, 5.0, 9.0, 10.0, 14.0, 14.0, 17.0, 27.0, 36.0, 41.0, 45.0, 48.0, 63.0, 74.0, 94.0, 118.0, 67.0, 60.0, 36.0, 35.0, 39.0, 31.0, 20.0, 28.0, 17.0, 12.0, 5.0, 6.0, 9.0, 7.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006473541259765625, -0.006262838840484619, -0.006052136421203613, -0.005841434001922607, -0.0056307315826416016, -0.005420029163360596, -0.00520932674407959, -0.004998624324798584, -0.004787921905517578, -0.004577219486236572, -0.004366517066955566, -0.0041558146476745605, -0.003945112228393555, -0.003734409809112549, -0.003523707389831543, -0.003313004970550537, -0.0031023025512695312, -0.0028916001319885254, -0.0026808977127075195, -0.0024701952934265137, -0.002259492874145508, -0.002048790454864502, -0.001838088035583496, -0.0016273856163024902, -0.0014166831970214844, -0.0012059807777404785, -0.0009952783584594727, -0.0007845759391784668, -0.0005738735198974609, -0.0003631711006164551, -0.00015246868133544922, 5.823373794555664e-05, 0.0002689361572265625, 0.00047963857650756836, 0.0006903409957885742, 0.0009010434150695801, 0.001111745834350586, 0.0013224482536315918, 0.0015331506729125977, 0.0017438530921936035, 0.0019545555114746094, 0.0021652579307556152, 0.002375960350036621, 0.002586662769317627, 0.002797365188598633, 0.0030080676078796387, 0.0032187700271606445, 0.0034294724464416504, 0.0036401748657226562, 0.003850877285003662, 0.004061579704284668, 0.004272282123565674, 0.00448298454284668, 0.0046936869621276855, 0.004904389381408691, 0.005115091800689697, 0.005325794219970703, 0.005536496639251709, 0.005747199058532715, 0.005957901477813721, 0.0061686038970947266, 0.006379306316375732, 0.006590008735656738, 0.006800711154937744, 0.00701141357421875]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 11.0, 10.0, 32.0, 34.0, 52.0, 62.0, 90.0, 101.0, 148.0, 119.0, 94.0, 71.0, 55.0, 34.0, 23.0, 19.0, 7.0, 10.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28356653451919556, -0.2743428945541382, -0.2651192545890808, -0.25589561462402344, -0.24667198956012726, -0.23744834959506989, -0.2282247245311737, -0.21900108456611633, -0.20977744460105896, -0.2005538046360016, -0.1913301646709442, -0.18210653960704803, -0.17288289964199066, -0.1636592596769333, -0.1544356346130371, -0.14521199464797974, -0.13598835468292236, -0.126764714717865, -0.11754108220338821, -0.10831744968891144, -0.09909380972385406, -0.08987016975879669, -0.08064653724431992, -0.07142290472984314, -0.06219926476478577, -0.05297562852501869, -0.04375199228525162, -0.03452835604548454, -0.025304719805717468, -0.016081083565950394, -0.006857447326183319, 0.002366185188293457, 0.011589854955673218, 0.020813491195440292, 0.030037127435207367, 0.03926076367497444, 0.048484399914741516, 0.05770803615450859, 0.06693167239427567, 0.07615530490875244, 0.08537894487380981, 0.09460258483886719, 0.10382621735334396, 0.11304984986782074, 0.12227348983287811, 0.13149712979793549, 0.14072075486183167, 0.14994439482688904, 0.1591680347919464, 0.16839167475700378, 0.17761531472206116, 0.18683893978595734, 0.1960625797510147, 0.20528621971607208, 0.21450984477996826, 0.22373348474502563, 0.232957124710083, 0.24218076467514038, 0.25140440464019775, 0.2606280446052551, 0.2698516845703125, 0.2790752947330475, 0.28829893469810486, 0.29752257466316223, 0.3067462146282196]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 4.0, 10.0, 13.0, 18.0, 22.0, 30.0, 45.0, 69.0, 76.0, 68.0, 81.0, 80.0, 77.0, 71.0, 85.0, 74.0, 59.0, 35.0, 32.0, 23.0, 14.0, 11.0, 8.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13032345473766327, -0.12155041843652725, -0.11277738213539124, -0.10400435328483582, -0.0952313095331192, -0.08645828068256378, -0.07768524438142776, -0.06891220808029175, -0.06013917177915573, -0.051366135478019714, -0.0425930991768837, -0.03382006660103798, -0.025047030299901962, -0.016273993998765945, -0.007500961422920227, 0.0012720748782157898, 0.010045111179351807, 0.018818147480487823, 0.02759118191897869, 0.03636421635746956, 0.045137252658605576, 0.05391028895974159, 0.06268332153558731, 0.07145635783672333, 0.08022939413785934, 0.08900243043899536, 0.09777546674013138, 0.1065485030412674, 0.11532153189182281, 0.12409457564353943, 0.13286760449409485, 0.14164063334465027, 0.1504136621952057, 0.1591866910457611, 0.16795973479747772, 0.17673276364803314, 0.18550580739974976, 0.19427883625030518, 0.2030518651008606, 0.2118249088525772, 0.22059795260429382, 0.22937098145484924, 0.23814402520656586, 0.24691705405712128, 0.2556900978088379, 0.2644631266593933, 0.27323615550994873, 0.28200918436050415, 0.29078221321105957, 0.299555242061615, 0.3083282709121704, 0.3171013295650482, 0.32587435841560364, 0.33464738726615906, 0.3434204161167145, 0.3521934747695923, 0.3609665036201477, 0.3697395324707031, 0.37851256132125854, 0.38728561997413635, 0.3960586488246918, 0.4048316776752472, 0.4136047065258026, 0.4223777651786804, 0.43115079402923584]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 10.0, 19.0, 25.0, 47.0, 57.0, 102.0, 190.0, 284.0, 506.0, 929.0, 1525.0, 3015.0, 5802.0, 12667.0, 32302.0, 122543.0, 657589.0, 147304.0, 36200.0, 13835.0, 6325.0, 3309.0, 1687.0, 927.0, 541.0, 308.0, 200.0, 116.0, 60.0, 52.0, 24.0, 20.0, 5.0, 7.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.335205078125, -0.3252143859863281, -0.31522369384765625, -0.3052330017089844, -0.2952423095703125, -0.2852516174316406, -0.27526092529296875, -0.2652702331542969, -0.255279541015625, -0.24528884887695312, -0.23529815673828125, -0.22530746459960938, -0.2153167724609375, -0.20532608032226562, -0.19533538818359375, -0.18534469604492188, -0.17535400390625, -0.16536331176757812, -0.15537261962890625, -0.14538192749023438, -0.1353912353515625, -0.12540054321289062, -0.11540985107421875, -0.10541915893554688, -0.095428466796875, -0.08543777465820312, -0.07544708251953125, -0.06545639038085938, -0.0554656982421875, -0.045475006103515625, -0.03548431396484375, -0.025493621826171875, -0.0155029296875, -0.005512237548828125, 0.00447845458984375, 0.014469146728515625, 0.0244598388671875, 0.034450531005859375, 0.04444122314453125, 0.054431915283203125, 0.064422607421875, 0.07441329956054688, 0.08440399169921875, 0.09439468383789062, 0.1043853759765625, 0.11437606811523438, 0.12436676025390625, 0.13435745239257812, 0.14434814453125, 0.15433883666992188, 0.16432952880859375, 0.17432022094726562, 0.1843109130859375, 0.19430160522460938, 0.20429229736328125, 0.21428298950195312, 0.224273681640625, 0.23426437377929688, 0.24425506591796875, 0.2542457580566406, 0.2642364501953125, 0.2742271423339844, 0.28421783447265625, 0.2942085266113281, 0.30419921875]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 8.0, 9.0, 20.0, 11.0, 31.0, 36.0, 55.0, 64.0, 62.0, 77.0, 93.0, 74.0, 76.0, 84.0, 63.0, 73.0, 52.0, 35.0, 26.0, 20.0, 9.0, 9.0, 7.0, 6.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28125, -0.2651519775390625, -0.249053955078125, -0.2329559326171875, -0.21685791015625, -0.2007598876953125, -0.184661865234375, -0.1685638427734375, -0.1524658203125, -0.1363677978515625, -0.120269775390625, -0.1041717529296875, -0.08807373046875, -0.0719757080078125, -0.055877685546875, -0.0397796630859375, -0.023681640625, -0.0075836181640625, 0.008514404296875, 0.0246124267578125, 0.04071044921875, 0.0568084716796875, 0.072906494140625, 0.0890045166015625, 0.1051025390625, 0.1212005615234375, 0.137298583984375, 0.1533966064453125, 0.16949462890625, 0.1855926513671875, 0.201690673828125, 0.2177886962890625, 0.23388671875, 0.2499847412109375, 0.266082763671875, 0.2821807861328125, 0.29827880859375, 0.3143768310546875, 0.330474853515625, 0.3465728759765625, 0.3626708984375, 0.3787689208984375, 0.394866943359375, 0.4109649658203125, 0.42706298828125, 0.4431610107421875, 0.459259033203125, 0.4753570556640625, 0.491455078125, 0.5075531005859375, 0.523651123046875, 0.5397491455078125, 0.55584716796875, 0.5719451904296875, 0.588043212890625, 0.6041412353515625, 0.6202392578125, 0.6363372802734375, 0.652435302734375, 0.6685333251953125, 0.68463134765625, 0.7007293701171875, 0.716827392578125, 0.7329254150390625, 0.7490234375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 6.0, 3.0, 5.0, 8.0, 14.0, 11.0, 14.0, 13.0, 25.0, 26.0, 42.0, 40.0, 58.0, 75.0, 74.0, 188.0, 409.0, 1666.0, 20922.0, 948494.0, 71593.0, 3587.0, 546.0, 220.0, 140.0, 79.0, 71.0, 51.0, 35.0, 27.0, 26.0, 23.0, 21.0, 10.0, 9.0, 10.0, 5.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.0751953125, -1.044189453125, -1.01318359375, -0.982177734375, -0.951171875, -0.920166015625, -0.88916015625, -0.858154296875, -0.8271484375, -0.796142578125, -0.76513671875, -0.734130859375, -0.703125, -0.672119140625, -0.64111328125, -0.610107421875, -0.5791015625, -0.548095703125, -0.51708984375, -0.486083984375, -0.455078125, -0.424072265625, -0.39306640625, -0.362060546875, -0.3310546875, -0.300048828125, -0.26904296875, -0.238037109375, -0.20703125, -0.176025390625, -0.14501953125, -0.114013671875, -0.0830078125, -0.052001953125, -0.02099609375, 0.010009765625, 0.041015625, 0.072021484375, 0.10302734375, 0.134033203125, 0.1650390625, 0.196044921875, 0.22705078125, 0.258056640625, 0.2890625, 0.320068359375, 0.35107421875, 0.382080078125, 0.4130859375, 0.444091796875, 0.47509765625, 0.506103515625, 0.537109375, 0.568115234375, 0.59912109375, 0.630126953125, 0.6611328125, 0.692138671875, 0.72314453125, 0.754150390625, 0.78515625, 0.816162109375, 0.84716796875, 0.878173828125, 0.9091796875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 8.0, 11.0, 6.0, 6.0, 7.0, 14.0, 14.0, 20.0, 17.0, 27.0, 33.0, 38.0, 44.0, 37.0, 50.0, 45.0, 56.0, 46.0, 59.0, 44.0, 47.0, 49.0, 49.0, 41.0, 47.0, 30.0, 34.0, 23.0, 20.0, 23.0, 11.0, 12.0, 10.0, 9.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33447265625, -0.3241767883300781, -0.31388092041015625, -0.3035850524902344, -0.2932891845703125, -0.2829933166503906, -0.27269744873046875, -0.2624015808105469, -0.252105712890625, -0.24180984497070312, -0.23151397705078125, -0.22121810913085938, -0.2109222412109375, -0.20062637329101562, -0.19033050537109375, -0.18003463745117188, -0.16973876953125, -0.15944290161132812, -0.14914703369140625, -0.13885116577148438, -0.1285552978515625, -0.11825942993164062, -0.10796356201171875, -0.09766769409179688, -0.087371826171875, -0.07707595825195312, -0.06678009033203125, -0.056484222412109375, -0.0461883544921875, -0.035892486572265625, -0.02559661865234375, -0.015300750732421875, -0.0050048828125, 0.005290985107421875, 0.01558685302734375, 0.025882720947265625, 0.0361785888671875, 0.046474456787109375, 0.05677032470703125, 0.06706619262695312, 0.077362060546875, 0.08765792846679688, 0.09795379638671875, 0.10824966430664062, 0.1185455322265625, 0.12884140014648438, 0.13913726806640625, 0.14943313598632812, 0.15972900390625, 0.17002487182617188, 0.18032073974609375, 0.19061660766601562, 0.2009124755859375, 0.21120834350585938, 0.22150421142578125, 0.23180007934570312, 0.242095947265625, 0.2523918151855469, 0.26268768310546875, 0.2729835510253906, 0.2832794189453125, 0.2935752868652344, 0.30387115478515625, 0.3141670227050781, 0.324462890625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 5.0, 6.0, 6.0, 2.0, 7.0, 9.0, 9.0, 7.0, 18.0, 19.0, 52.0, 97.0, 250.0, 886.0, 3959.0, 39459.0, 954423.0, 43568.0, 4198.0, 995.0, 292.0, 117.0, 55.0, 43.0, 22.0, 14.0, 10.0, 8.0, 8.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.18310546875, -0.17729568481445312, -0.17148590087890625, -0.16567611694335938, -0.1598663330078125, -0.15405654907226562, -0.14824676513671875, -0.14243698120117188, -0.136627197265625, -0.13081741333007812, -0.12500762939453125, -0.11919784545898438, -0.1133880615234375, -0.10757827758789062, -0.10176849365234375, -0.09595870971679688, -0.09014892578125, -0.08433914184570312, -0.07852935791015625, -0.07271957397460938, -0.0669097900390625, -0.061100006103515625, -0.05529022216796875, -0.049480438232421875, -0.043670654296875, -0.037860870361328125, -0.03205108642578125, -0.026241302490234375, -0.0204315185546875, -0.014621734619140625, -0.00881195068359375, -0.003002166748046875, 0.0028076171875, 0.008617401123046875, 0.01442718505859375, 0.020236968994140625, 0.0260467529296875, 0.031856536865234375, 0.03766632080078125, 0.043476104736328125, 0.049285888671875, 0.055095672607421875, 0.06090545654296875, 0.06671524047851562, 0.0725250244140625, 0.07833480834960938, 0.08414459228515625, 0.08995437622070312, 0.09576416015625, 0.10157394409179688, 0.10738372802734375, 0.11319351196289062, 0.1190032958984375, 0.12481307983398438, 0.13062286376953125, 0.13643264770507812, 0.142242431640625, 0.14805221557617188, 0.15386199951171875, 0.15967178344726562, 0.1654815673828125, 0.17129135131835938, 0.17710113525390625, 0.18291091918945312, 0.188720703125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 2.0, 4.0, 4.0, 4.0, 14.0, 10.0, 16.0, 33.0, 36.0, 83.0, 153.0, 212.0, 160.0, 83.0, 53.0, 39.0, 25.0, 15.0, 8.0, 11.0, 8.0, 2.0, 7.0, 3.0, 8.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7940998077392578e-05, -1.7449259757995605e-05, -1.6957521438598633e-05, -1.646578311920166e-05, -1.5974044799804688e-05, -1.5482306480407715e-05, -1.4990568161010742e-05, -1.449882984161377e-05, -1.4007091522216797e-05, -1.3515353202819824e-05, -1.3023614883422852e-05, -1.2531876564025879e-05, -1.2040138244628906e-05, -1.1548399925231934e-05, -1.1056661605834961e-05, -1.0564923286437988e-05, -1.0073184967041016e-05, -9.581446647644043e-06, -9.08970832824707e-06, -8.597970008850098e-06, -8.106231689453125e-06, -7.614493370056152e-06, -7.12275505065918e-06, -6.631016731262207e-06, -6.139278411865234e-06, -5.647540092468262e-06, -5.155801773071289e-06, -4.664063453674316e-06, -4.172325134277344e-06, -3.680586814880371e-06, -3.1888484954833984e-06, -2.6971101760864258e-06, -2.205371856689453e-06, -1.7136335372924805e-06, -1.2218952178955078e-06, -7.301568984985352e-07, -2.384185791015625e-07, 2.5331974029541016e-07, 7.450580596923828e-07, 1.2367963790893555e-06, 1.7285346984863281e-06, 2.2202730178833008e-06, 2.7120113372802734e-06, 3.203749656677246e-06, 3.6954879760742188e-06, 4.187226295471191e-06, 4.678964614868164e-06, 5.170702934265137e-06, 5.662441253662109e-06, 6.154179573059082e-06, 6.645917892456055e-06, 7.137656211853027e-06, 7.62939453125e-06, 8.121132850646973e-06, 8.612871170043945e-06, 9.104609489440918e-06, 9.59634780883789e-06, 1.0088086128234863e-05, 1.0579824447631836e-05, 1.1071562767028809e-05, 1.1563301086425781e-05, 1.2055039405822754e-05, 1.2546777725219727e-05, 1.30385160446167e-05, 1.3530254364013672e-05]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 10.0, 10.0, 14.0, 15.0, 24.0, 37.0, 62.0, 100.0, 211.0, 465.0, 1269.0, 3856.0, 17912.0, 304661.0, 686248.0, 26189.0, 4837.0, 1509.0, 557.0, 234.0, 109.0, 67.0, 52.0, 31.0, 21.0, 10.0, 8.0, 5.0, 6.0, 0.0, 4.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.150390625, -0.1461048126220703, -0.14181900024414062, -0.13753318786621094, -0.13324737548828125, -0.12896156311035156, -0.12467575073242188, -0.12038993835449219, -0.1161041259765625, -0.11181831359863281, -0.10753250122070312, -0.10324668884277344, -0.09896087646484375, -0.09467506408691406, -0.09038925170898438, -0.08610343933105469, -0.081817626953125, -0.07753181457519531, -0.07324600219726562, -0.06896018981933594, -0.06467437744140625, -0.06038856506347656, -0.056102752685546875, -0.05181694030761719, -0.0475311279296875, -0.04324531555175781, -0.038959503173828125, -0.03467369079589844, -0.03038787841796875, -0.026102066040039062, -0.021816253662109375, -0.017530441284179688, -0.01324462890625, -0.008958816528320312, -0.004673004150390625, -0.0003871917724609375, 0.00389862060546875, 0.008184432983398438, 0.012470245361328125, 0.016756057739257812, 0.0210418701171875, 0.025327682495117188, 0.029613494873046875, 0.03389930725097656, 0.03818511962890625, 0.04247093200683594, 0.046756744384765625, 0.05104255676269531, 0.055328369140625, 0.05961418151855469, 0.06389999389648438, 0.06818580627441406, 0.07247161865234375, 0.07675743103027344, 0.08104324340820312, 0.08532905578613281, 0.0896148681640625, 0.09390068054199219, 0.09818649291992188, 0.10247230529785156, 0.10675811767578125, 0.11104393005371094, 0.11532974243164062, 0.11961555480957031, 0.1239013671875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 4.0, 8.0, 12.0, 14.0, 13.0, 18.0, 32.0, 39.0, 54.0, 79.0, 117.0, 153.0, 127.0, 76.0, 80.0, 48.0, 37.0, 29.0, 18.0, 12.0, 6.0, 3.0, 5.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.03936767578125, -0.038074493408203125, -0.03678131103515625, -0.035488128662109375, -0.0341949462890625, -0.032901763916015625, -0.03160858154296875, -0.030315399169921875, -0.029022216796875, -0.027729034423828125, -0.02643585205078125, -0.025142669677734375, -0.0238494873046875, -0.022556304931640625, -0.02126312255859375, -0.019969940185546875, -0.0186767578125, -0.017383575439453125, -0.01609039306640625, -0.014797210693359375, -0.0135040283203125, -0.012210845947265625, -0.01091766357421875, -0.009624481201171875, -0.008331298828125, -0.007038116455078125, -0.00574493408203125, -0.004451751708984375, -0.0031585693359375, -0.001865386962890625, -0.00057220458984375, 0.000720977783203125, 0.00201416015625, 0.003307342529296875, 0.00460052490234375, 0.005893707275390625, 0.0071868896484375, 0.008480072021484375, 0.00977325439453125, 0.011066436767578125, 0.012359619140625, 0.013652801513671875, 0.01494598388671875, 0.016239166259765625, 0.0175323486328125, 0.018825531005859375, 0.02011871337890625, 0.021411895751953125, 0.022705078125, 0.023998260498046875, 0.02529144287109375, 0.026584625244140625, 0.0278778076171875, 0.029170989990234375, 0.03046417236328125, 0.031757354736328125, 0.033050537109375, 0.034343719482421875, 0.03563690185546875, 0.036930084228515625, 0.0382232666015625, 0.039516448974609375, 0.04080963134765625, 0.042102813720703125, 0.04339599609375]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 8.0, 9.0, 23.0, 37.0, 47.0, 140.0, 180.0, 204.0, 153.0, 91.0, 51.0, 22.0, 18.0, 7.0, 9.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5272629857063293, -0.4985676407814026, -0.46987229585647583, -0.44117698073387146, -0.4124816358089447, -0.38378629088401794, -0.3550909757614136, -0.3263956308364868, -0.29770028591156006, -0.2690049409866333, -0.24030961096286774, -0.21161428093910217, -0.18291893601417542, -0.15422359108924866, -0.1255282610654831, -0.09683293104171753, -0.06813758611679077, -0.03944224864244461, -0.01074691116809845, 0.01794842630624771, 0.04664376378059387, 0.07533910870552063, 0.1040344387292862, 0.13272976875305176, 0.16142511367797852, 0.19012045860290527, 0.21881578862667084, 0.2475111186504364, 0.27620646357536316, 0.3049018085002899, 0.3335971236228943, 0.36229246854782104, 0.390987753868103, 0.4196830987930298, 0.44837844371795654, 0.4770737588405609, 0.5057691335678101, 0.5344644784927368, 0.5631597638130188, 0.5918551087379456, 0.6205504536628723, 0.6492457985877991, 0.6779411435127258, 0.7066364884376526, 0.7353317737579346, 0.7640271186828613, 0.7927224636077881, 0.8214178085327148, 0.8501131534576416, 0.8788084983825684, 0.9075038433074951, 0.9361991882324219, 0.9648945331573486, 0.9935898780822754, 1.0222852230072021, 1.050980567932129, 1.0796759128570557, 1.1083712577819824, 1.1370666027069092, 1.165761947631836, 1.1944572925567627, 1.2231526374816895, 1.2518479824066162, 1.280543327331543, 1.3092385530471802]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 7.0, 7.0, 7.0, 9.0, 18.0, 12.0, 22.0, 12.0, 24.0, 30.0, 24.0, 33.0, 35.0, 22.0, 40.0, 38.0, 51.0, 42.0, 53.0, 44.0, 42.0, 54.0, 43.0, 41.0, 37.0, 36.0, 35.0, 32.0, 25.0, 26.0, 16.0, 22.0, 12.0, 13.0, 9.0, 7.0, 10.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37177786231040955, -0.35603827238082886, -0.3402986526489258, -0.3245590627193451, -0.3088194727897644, -0.29307985305786133, -0.27734026312828064, -0.26160067319869995, -0.24586106836795807, -0.2301214635372162, -0.2143818736076355, -0.19864226877689362, -0.18290266394615173, -0.16716307401657104, -0.15142346918582916, -0.13568386435508728, -0.11994427442550659, -0.1042046770453453, -0.08846507966518402, -0.07272547483444214, -0.05698587745428085, -0.04124628007411957, -0.025506675243377686, -0.0097670778632164, 0.005972519516944885, 0.02171211875975132, 0.037451718002557755, 0.05319131910800934, 0.06893091648817062, 0.08467051386833191, 0.10041011869907379, 0.11614971607923508, 0.13188934326171875, 0.14762894809246063, 0.16336853802204132, 0.1791081428527832, 0.1948477327823639, 0.21058733761310577, 0.22632694244384766, 0.24206653237342834, 0.25780612230300903, 0.2735457122325897, 0.2892853319644928, 0.3050249218940735, 0.3207645118236542, 0.33650410175323486, 0.35224372148513794, 0.36798331141471863, 0.3837229311466217, 0.3994625210762024, 0.41520214080810547, 0.43094173073768616, 0.44668132066726685, 0.4624209403991699, 0.4781605303287506, 0.4939001202583313, 0.5096397399902344, 0.5253793597221375, 0.5411189198493958, 0.5568585395812988, 0.5725981593132019, 0.5883377194404602, 0.6040773391723633, 0.6198169589042664, 0.6355565190315247]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 5.0, 5.0, 10.0, 8.0, 8.0, 17.0, 23.0, 31.0, 29.0, 42.0, 69.0, 72.0, 118.0, 177.0, 283.0, 408.0, 656.0, 1187.0, 2088.0, 4385.0, 10444.0, 42519.0, 825234.0, 3049629.0, 222437.0, 20239.0, 7002.0, 3046.0, 1606.0, 884.0, 554.0, 309.0, 223.0, 160.0, 96.0, 57.0, 68.0, 42.0, 29.0, 22.0, 11.0, 15.0, 7.0, 4.0, 5.0, 10.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.423583984375, -0.40959930419921875, -0.3956146240234375, -0.38162994384765625, -0.367645263671875, -0.35366058349609375, -0.3396759033203125, -0.32569122314453125, -0.31170654296875, -0.29772186279296875, -0.2837371826171875, -0.26975250244140625, -0.255767822265625, -0.24178314208984375, -0.2277984619140625, -0.21381378173828125, -0.1998291015625, -0.18584442138671875, -0.1718597412109375, -0.15787506103515625, -0.143890380859375, -0.12990570068359375, -0.1159210205078125, -0.10193634033203125, -0.08795166015625, -0.07396697998046875, -0.0599822998046875, -0.04599761962890625, -0.032012939453125, -0.01802825927734375, -0.0040435791015625, 0.00994110107421875, 0.02392578125, 0.03791046142578125, 0.0518951416015625, 0.06587982177734375, 0.079864501953125, 0.09384918212890625, 0.1078338623046875, 0.12181854248046875, 0.13580322265625, 0.14978790283203125, 0.1637725830078125, 0.17775726318359375, 0.191741943359375, 0.20572662353515625, 0.2197113037109375, 0.23369598388671875, 0.2476806640625, 0.26166534423828125, 0.2756500244140625, 0.28963470458984375, 0.303619384765625, 0.31760406494140625, 0.3315887451171875, 0.34557342529296875, 0.35955810546875, 0.37354278564453125, 0.3875274658203125, 0.40151214599609375, 0.415496826171875, 0.42948150634765625, 0.4434661865234375, 0.45745086669921875, 0.471435546875]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 6.0, 5.0, 10.0, 1.0, 8.0, 6.0, 7.0, 13.0, 8.0, 13.0, 17.0, 16.0, 21.0, 14.0, 32.0, 27.0, 33.0, 30.0, 28.0, 34.0, 38.0, 30.0, 46.0, 33.0, 47.0, 43.0, 43.0, 46.0, 35.0, 32.0, 25.0, 29.0, 28.0, 34.0, 22.0, 15.0, 15.0, 25.0, 20.0, 15.0, 10.0, 7.0, 10.0, 5.0, 2.0, 5.0, 6.0, 2.0, 8.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.184814453125, -0.17955780029296875, -0.1743011474609375, -0.16904449462890625, -0.163787841796875, -0.15853118896484375, -0.1532745361328125, -0.14801788330078125, -0.14276123046875, -0.13750457763671875, -0.1322479248046875, -0.12699127197265625, -0.121734619140625, -0.11647796630859375, -0.1112213134765625, -0.10596466064453125, -0.1007080078125, -0.09545135498046875, -0.0901947021484375, -0.08493804931640625, -0.079681396484375, -0.07442474365234375, -0.0691680908203125, -0.06391143798828125, -0.05865478515625, -0.05339813232421875, -0.0481414794921875, -0.04288482666015625, -0.037628173828125, -0.03237152099609375, -0.0271148681640625, -0.02185821533203125, -0.0166015625, -0.01134490966796875, -0.0060882568359375, -0.00083160400390625, 0.004425048828125, 0.00968170166015625, 0.0149383544921875, 0.02019500732421875, 0.02545166015625, 0.03070831298828125, 0.0359649658203125, 0.04122161865234375, 0.046478271484375, 0.05173492431640625, 0.0569915771484375, 0.06224822998046875, 0.0675048828125, 0.07276153564453125, 0.0780181884765625, 0.08327484130859375, 0.088531494140625, 0.09378814697265625, 0.0990447998046875, 0.10430145263671875, 0.10955810546875, 0.11481475830078125, 0.1200714111328125, 0.12532806396484375, 0.130584716796875, 0.13584136962890625, 0.1410980224609375, 0.14635467529296875, 0.151611328125]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 3.0, 3.0, 6.0, 5.0, 10.0, 7.0, 11.0, 11.0, 15.0, 15.0, 37.0, 39.0, 46.0, 77.0, 122.0, 206.0, 748.0, 5431.0, 1522983.0, 2657565.0, 5659.0, 726.0, 191.0, 91.0, 65.0, 68.0, 31.0, 29.0, 13.0, 15.0, 18.0, 5.0, 9.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.62890625, -1.58489990234375, -1.5408935546875, -1.49688720703125, -1.452880859375, -1.40887451171875, -1.3648681640625, -1.32086181640625, -1.27685546875, -1.23284912109375, -1.1888427734375, -1.14483642578125, -1.100830078125, -1.05682373046875, -1.0128173828125, -0.96881103515625, -0.9248046875, -0.88079833984375, -0.8367919921875, -0.79278564453125, -0.748779296875, -0.70477294921875, -0.6607666015625, -0.61676025390625, -0.57275390625, -0.52874755859375, -0.4847412109375, -0.44073486328125, -0.396728515625, -0.35272216796875, -0.3087158203125, -0.26470947265625, -0.220703125, -0.17669677734375, -0.1326904296875, -0.08868408203125, -0.044677734375, -0.00067138671875, 0.0433349609375, 0.08734130859375, 0.13134765625, 0.17535400390625, 0.2193603515625, 0.26336669921875, 0.307373046875, 0.35137939453125, 0.3953857421875, 0.43939208984375, 0.4833984375, 0.52740478515625, 0.5714111328125, 0.61541748046875, 0.659423828125, 0.70343017578125, 0.7474365234375, 0.79144287109375, 0.83544921875, 0.87945556640625, 0.9234619140625, 0.96746826171875, 1.011474609375, 1.05548095703125, 1.0994873046875, 1.14349365234375, 1.1875]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 2.0, 4.0, 5.0, 11.0, 22.0, 27.0, 31.0, 40.0, 64.0, 126.0, 296.0, 724.0, 1213.0, 808.0, 332.0, 137.0, 70.0, 45.0, 31.0, 23.0, 10.0, 9.0, 16.0, 10.0, 6.0, 4.0, 2.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10369873046875, -0.0993051528930664, -0.09491157531738281, -0.09051799774169922, -0.08612442016601562, -0.08173084259033203, -0.07733726501464844, -0.07294368743896484, -0.06855010986328125, -0.06415653228759766, -0.05976295471191406, -0.05536937713623047, -0.050975799560546875, -0.04658222198486328, -0.04218864440917969, -0.037795066833496094, -0.0334014892578125, -0.029007911682128906, -0.024614334106445312, -0.02022075653076172, -0.015827178955078125, -0.011433601379394531, -0.0070400238037109375, -0.0026464462280273438, 0.00174713134765625, 0.006140708923339844, 0.010534286499023438, 0.014927864074707031, 0.019321441650390625, 0.02371501922607422, 0.028108596801757812, 0.032502174377441406, 0.036895751953125, 0.041289329528808594, 0.04568290710449219, 0.05007648468017578, 0.054470062255859375, 0.05886363983154297, 0.06325721740722656, 0.06765079498291016, 0.07204437255859375, 0.07643795013427734, 0.08083152770996094, 0.08522510528564453, 0.08961868286132812, 0.09401226043701172, 0.09840583801269531, 0.1027994155883789, 0.1071929931640625, 0.1115865707397461, 0.11598014831542969, 0.12037372589111328, 0.12476730346679688, 0.12916088104248047, 0.13355445861816406, 0.13794803619384766, 0.14234161376953125, 0.14673519134521484, 0.15112876892089844, 0.15552234649658203, 0.15991592407226562, 0.16430950164794922, 0.1687030792236328, 0.1730966567993164, 0.177490234375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 9.0, 6.0, 10.0, 12.0, 31.0, 39.0, 52.0, 82.0, 104.0, 139.0, 110.0, 116.0, 70.0, 59.0, 37.0, 32.0, 27.0, 23.0, 12.0, 9.0, 7.0, 4.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2836915850639343, -0.2709067463874817, -0.25812193751335144, -0.24533711373806, -0.23255228996276855, -0.21976745128631592, -0.20698264241218567, -0.19419780373573303, -0.18141299486160278, -0.16862817108631134, -0.1558433473110199, -0.14305852353572845, -0.130273699760437, -0.11748886853456497, -0.10470404475927353, -0.09191922098398209, -0.07913438975811005, -0.0663495659828186, -0.05356474220752716, -0.04077991470694542, -0.027995090931653976, -0.015210263431072235, -0.0024254396557807922, 0.01035938411951065, 0.023144207894802094, 0.035929031670093536, 0.04871385544538498, 0.06149868294596672, 0.07428351044654846, 0.0870683342218399, 0.09985315799713135, 0.11263798177242279, 0.12542280554771423, 0.13820762932300568, 0.15099245309829712, 0.16377727687358856, 0.17656210064888, 0.18934693932533264, 0.2021317481994629, 0.21491658687591553, 0.22770139575004578, 0.24048621952533722, 0.25327104330062866, 0.2660558819770813, 0.27884069085121155, 0.2916255295276642, 0.30441033840179443, 0.31719517707824707, 0.3299800157546997, 0.34276485443115234, 0.3555496633052826, 0.36833450198173523, 0.3811193108558655, 0.3939041495323181, 0.40668895840644836, 0.419473797082901, 0.43225860595703125, 0.4450434446334839, 0.45782825350761414, 0.4706130921840668, 0.483397901058197, 0.49618273973464966, 0.5089675784111023, 0.5217523574829102, 0.5345371961593628]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 5.0, 10.0, 3.0, 5.0, 13.0, 6.0, 13.0, 18.0, 24.0, 15.0, 29.0, 31.0, 34.0, 33.0, 30.0, 36.0, 44.0, 44.0, 41.0, 48.0, 42.0, 53.0, 41.0, 39.0, 39.0, 42.0, 43.0, 36.0, 36.0, 27.0, 22.0, 18.0, 16.0, 16.0, 7.0, 9.0, 8.0, 8.0, 3.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2305736392736435, -0.22390788793563843, -0.21724213659763336, -0.2105763852596283, -0.20391061902046204, -0.19724488258361816, -0.1905791163444519, -0.18391336500644684, -0.17724761366844177, -0.1705818623304367, -0.16391611099243164, -0.15725035965442657, -0.1505846083164215, -0.14391884207725525, -0.13725309073925018, -0.13058733940124512, -0.12392158806324005, -0.11725583672523499, -0.11059008538722992, -0.10392432659864426, -0.09725857526063919, -0.09059282392263412, -0.08392706513404846, -0.0772613137960434, -0.07059556245803833, -0.06392981112003326, -0.0572640560567379, -0.050598300993442535, -0.04393254965543747, -0.037266798317432404, -0.03060104325413704, -0.023935288190841675, -0.017269551753997803, -0.010603798553347588, -0.0039380453526973724, 0.0027277078479528427, 0.009393461048603058, 0.016059212386608124, 0.022724967449903488, 0.029390722513198853, 0.03605647385120392, 0.042722225189208984, 0.04938798025250435, 0.05605373531579971, 0.06271948665380478, 0.06938523799180984, 0.07605099678039551, 0.08271674811840057, 0.08938249945640564, 0.0960482507944107, 0.10271400213241577, 0.10937976092100143, 0.1160455122590065, 0.12271126359701157, 0.12937702238559723, 0.1360427737236023, 0.14270852506160736, 0.14937427639961243, 0.1560400277376175, 0.16270577907562256, 0.16937154531478882, 0.1760372817516327, 0.18270304799079895, 0.18936879932880402, 0.19603455066680908]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 7.0, 5.0, 12.0, 19.0, 25.0, 36.0, 59.0, 69.0, 133.0, 181.0, 259.0, 441.0, 831.0, 1404.0, 2723.0, 5952.0, 14071.0, 41521.0, 170920.0, 560404.0, 179648.0, 42631.0, 14581.0, 6222.0, 2941.0, 1449.0, 789.0, 484.0, 252.0, 183.0, 84.0, 70.0, 40.0, 36.0, 20.0, 14.0, 13.0, 9.0, 2.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.091552734375, -0.0891122817993164, -0.08667182922363281, -0.08423137664794922, -0.08179092407226562, -0.07935047149658203, -0.07691001892089844, -0.07446956634521484, -0.07202911376953125, -0.06958866119384766, -0.06714820861816406, -0.06470775604248047, -0.062267303466796875, -0.05982685089111328, -0.05738639831542969, -0.054945945739746094, -0.0525054931640625, -0.050065040588378906, -0.04762458801269531, -0.04518413543701172, -0.042743682861328125, -0.04030323028564453, -0.03786277770996094, -0.035422325134277344, -0.03298187255859375, -0.030541419982910156, -0.028100967407226562, -0.02566051483154297, -0.023220062255859375, -0.02077960968017578, -0.018339157104492188, -0.015898704528808594, -0.013458251953125, -0.011017799377441406, -0.008577346801757812, -0.006136894226074219, -0.003696441650390625, -0.0012559890747070312, 0.0011844635009765625, 0.0036249160766601562, 0.00606536865234375, 0.008505821228027344, 0.010946273803710938, 0.013386726379394531, 0.015827178955078125, 0.01826763153076172, 0.020708084106445312, 0.023148536682128906, 0.0255889892578125, 0.028029441833496094, 0.030469894409179688, 0.03291034698486328, 0.035350799560546875, 0.03779125213623047, 0.04023170471191406, 0.042672157287597656, 0.04511260986328125, 0.047553062438964844, 0.04999351501464844, 0.05243396759033203, 0.054874420166015625, 0.05731487274169922, 0.05975532531738281, 0.062195777893066406, 0.06463623046875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 3.0, 5.0, 7.0, 13.0, 14.0, 16.0, 18.0, 37.0, 35.0, 36.0, 37.0, 56.0, 42.0, 69.0, 57.0, 64.0, 66.0, 76.0, 50.0, 38.0, 60.0, 50.0, 32.0, 25.0, 31.0, 19.0, 11.0, 4.0, 6.0, 8.0, 4.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.184814453125, -0.178985595703125, -0.17315673828125, -0.167327880859375, -0.1614990234375, -0.155670166015625, -0.14984130859375, -0.144012451171875, -0.13818359375, -0.132354736328125, -0.12652587890625, -0.120697021484375, -0.1148681640625, -0.109039306640625, -0.10321044921875, -0.097381591796875, -0.091552734375, -0.085723876953125, -0.07989501953125, -0.074066162109375, -0.0682373046875, -0.062408447265625, -0.05657958984375, -0.050750732421875, -0.044921875, -0.039093017578125, -0.03326416015625, -0.027435302734375, -0.0216064453125, -0.015777587890625, -0.00994873046875, -0.004119873046875, 0.001708984375, 0.007537841796875, 0.01336669921875, 0.019195556640625, 0.0250244140625, 0.030853271484375, 0.03668212890625, 0.042510986328125, 0.04833984375, 0.054168701171875, 0.05999755859375, 0.065826416015625, 0.0716552734375, 0.077484130859375, 0.08331298828125, 0.089141845703125, 0.094970703125, 0.100799560546875, 0.10662841796875, 0.112457275390625, 0.1182861328125, 0.124114990234375, 0.12994384765625, 0.135772705078125, 0.1416015625, 0.147430419921875, 0.15325927734375, 0.159088134765625, 0.1649169921875, 0.170745849609375, 0.17657470703125, 0.182403564453125, 0.188232421875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 3.0, 5.0, 4.0, 4.0, 5.0, 14.0, 20.0, 29.0, 54.0, 79.0, 163.0, 381.0, 1024.0, 3487.0, 15701.0, 115726.0, 735406.0, 151688.0, 18646.0, 4093.0, 1178.0, 443.0, 170.0, 71.0, 50.0, 36.0, 24.0, 13.0, 7.0, 5.0, 6.0, 7.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12310791015625, -0.11943912506103516, -0.11577033996582031, -0.11210155487060547, -0.10843276977539062, -0.10476398468017578, -0.10109519958496094, -0.0974264144897461, -0.09375762939453125, -0.0900888442993164, -0.08642005920410156, -0.08275127410888672, -0.07908248901367188, -0.07541370391845703, -0.07174491882324219, -0.06807613372802734, -0.0644073486328125, -0.060738563537597656, -0.05706977844238281, -0.05340099334716797, -0.049732208251953125, -0.04606342315673828, -0.04239463806152344, -0.038725852966308594, -0.03505706787109375, -0.031388282775878906, -0.027719497680664062, -0.02405071258544922, -0.020381927490234375, -0.01671314239501953, -0.013044357299804688, -0.009375572204589844, -0.005706787109375, -0.0020380020141601562, 0.0016307830810546875, 0.005299568176269531, 0.008968353271484375, 0.012637138366699219, 0.016305923461914062, 0.019974708557128906, 0.02364349365234375, 0.027312278747558594, 0.030981063842773438, 0.03464984893798828, 0.038318634033203125, 0.04198741912841797, 0.04565620422363281, 0.049324989318847656, 0.0529937744140625, 0.056662559509277344, 0.06033134460449219, 0.06400012969970703, 0.06766891479492188, 0.07133769989013672, 0.07500648498535156, 0.0786752700805664, 0.08234405517578125, 0.0860128402709961, 0.08968162536621094, 0.09335041046142578, 0.09701919555664062, 0.10068798065185547, 0.10435676574707031, 0.10802555084228516, 0.1116943359375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 9.0, 8.0, 11.0, 8.0, 13.0, 14.0, 24.0, 17.0, 27.0, 26.0, 35.0, 35.0, 42.0, 38.0, 45.0, 36.0, 49.0, 52.0, 49.0, 41.0, 44.0, 47.0, 36.0, 42.0, 35.0, 30.0, 35.0, 21.0, 20.0, 16.0, 14.0, 18.0, 11.0, 12.0, 6.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.269775390625, -0.2617378234863281, -0.25370025634765625, -0.24566268920898438, -0.2376251220703125, -0.22958755493164062, -0.22154998779296875, -0.21351242065429688, -0.205474853515625, -0.19743728637695312, -0.18939971923828125, -0.18136215209960938, -0.1733245849609375, -0.16528701782226562, -0.15724945068359375, -0.14921188354492188, -0.14117431640625, -0.13313674926757812, -0.12509918212890625, -0.11706161499023438, -0.1090240478515625, -0.10098648071289062, -0.09294891357421875, -0.08491134643554688, -0.076873779296875, -0.06883621215820312, -0.06079864501953125, -0.052761077880859375, -0.0447235107421875, -0.036685943603515625, -0.02864837646484375, -0.020610809326171875, -0.0125732421875, -0.004535675048828125, 0.00350189208984375, 0.011539459228515625, 0.0195770263671875, 0.027614593505859375, 0.03565216064453125, 0.043689727783203125, 0.051727294921875, 0.059764862060546875, 0.06780242919921875, 0.07583999633789062, 0.0838775634765625, 0.09191513061523438, 0.09995269775390625, 0.10799026489257812, 0.11602783203125, 0.12406539916992188, 0.13210296630859375, 0.14014053344726562, 0.1481781005859375, 0.15621566772460938, 0.16425323486328125, 0.17229080200195312, 0.180328369140625, 0.18836593627929688, 0.19640350341796875, 0.20444107055664062, 0.2124786376953125, 0.22051620483398438, 0.22855377197265625, 0.23659133911132812, 0.24462890625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 0.0, 6.0, 4.0, 4.0, 7.0, 5.0, 19.0, 11.0, 25.0, 23.0, 53.0, 100.0, 190.0, 387.0, 924.0, 2851.0, 10806.0, 67567.0, 760950.0, 178755.0, 19040.0, 4429.0, 1358.0, 530.0, 227.0, 124.0, 74.0, 30.0, 27.0, 11.0, 3.0, 9.0, 5.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0287628173828125, -0.02749466896057129, -0.026226520538330078, -0.024958372116088867, -0.023690223693847656, -0.022422075271606445, -0.021153926849365234, -0.019885778427124023, -0.018617630004882812, -0.0173494815826416, -0.01608133316040039, -0.01481318473815918, -0.013545036315917969, -0.012276887893676758, -0.011008739471435547, -0.009740591049194336, -0.008472442626953125, -0.007204294204711914, -0.005936145782470703, -0.004667997360229492, -0.0033998489379882812, -0.0021317005157470703, -0.0008635520935058594, 0.00040459632873535156, 0.0016727447509765625, 0.0029408931732177734, 0.004209041595458984, 0.005477190017700195, 0.006745338439941406, 0.008013486862182617, 0.009281635284423828, 0.010549783706665039, 0.01181793212890625, 0.013086080551147461, 0.014354228973388672, 0.015622377395629883, 0.016890525817871094, 0.018158674240112305, 0.019426822662353516, 0.020694971084594727, 0.021963119506835938, 0.02323126792907715, 0.02449941635131836, 0.02576756477355957, 0.02703571319580078, 0.028303861618041992, 0.029572010040283203, 0.030840158462524414, 0.032108306884765625, 0.033376455307006836, 0.03464460372924805, 0.03591275215148926, 0.03718090057373047, 0.03844904899597168, 0.03971719741821289, 0.0409853458404541, 0.04225349426269531, 0.04352164268493652, 0.044789791107177734, 0.046057939529418945, 0.047326087951660156, 0.04859423637390137, 0.04986238479614258, 0.05113053321838379, 0.052398681640625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 7.0, 12.0, 9.0, 15.0, 16.0, 27.0, 37.0, 69.0, 74.0, 101.0, 112.0, 151.0, 101.0, 77.0, 55.0, 28.0, 23.0, 22.0, 18.0, 16.0, 9.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3232231140136719e-05, -1.2774020433425903e-05, -1.2315809726715088e-05, -1.1857599020004272e-05, -1.1399388313293457e-05, -1.0941177606582642e-05, -1.0482966899871826e-05, -1.002475619316101e-05, -9.566545486450195e-06, -9.10833477973938e-06, -8.650124073028564e-06, -8.191913366317749e-06, -7.733702659606934e-06, -7.275491952896118e-06, -6.817281246185303e-06, -6.359070539474487e-06, -5.900859832763672e-06, -5.4426491260528564e-06, -4.984438419342041e-06, -4.526227712631226e-06, -4.06801700592041e-06, -3.6098062992095947e-06, -3.1515955924987793e-06, -2.693384885787964e-06, -2.2351741790771484e-06, -1.776963472366333e-06, -1.3187527656555176e-06, -8.605420589447021e-07, -4.023313522338867e-07, 5.587935447692871e-08, 5.140900611877441e-07, 9.723007678985596e-07, 1.430511474609375e-06, 1.8887221813201904e-06, 2.346932888031006e-06, 2.8051435947418213e-06, 3.2633543014526367e-06, 3.721565008163452e-06, 4.179775714874268e-06, 4.637986421585083e-06, 5.0961971282958984e-06, 5.554407835006714e-06, 6.012618541717529e-06, 6.470829248428345e-06, 6.92903995513916e-06, 7.387250661849976e-06, 7.845461368560791e-06, 8.303672075271606e-06, 8.761882781982422e-06, 9.220093488693237e-06, 9.678304195404053e-06, 1.0136514902114868e-05, 1.0594725608825684e-05, 1.1052936315536499e-05, 1.1511147022247314e-05, 1.196935772895813e-05, 1.2427568435668945e-05, 1.288577914237976e-05, 1.3343989849090576e-05, 1.3802200555801392e-05, 1.4260411262512207e-05, 1.4718621969223022e-05, 1.5176832675933838e-05, 1.5635043382644653e-05, 1.609325408935547e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 2.0, 5.0, 4.0, 3.0, 6.0, 8.0, 18.0, 15.0, 21.0, 30.0, 25.0, 45.0, 87.0, 161.0, 279.0, 549.0, 1352.0, 3207.0, 8798.0, 31547.0, 218522.0, 659542.0, 95574.0, 18530.0, 5979.0, 2251.0, 931.0, 426.0, 251.0, 131.0, 80.0, 53.0, 30.0, 23.0, 12.0, 11.0, 6.0, 9.0, 8.0, 8.0, 5.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03094482421875, -0.029987096786499023, -0.029029369354248047, -0.02807164192199707, -0.027113914489746094, -0.026156187057495117, -0.02519845962524414, -0.024240732192993164, -0.023283004760742188, -0.02232527732849121, -0.021367549896240234, -0.020409822463989258, -0.01945209503173828, -0.018494367599487305, -0.017536640167236328, -0.01657891273498535, -0.015621185302734375, -0.014663457870483398, -0.013705730438232422, -0.012748003005981445, -0.011790275573730469, -0.010832548141479492, -0.009874820709228516, -0.008917093276977539, -0.007959365844726562, -0.007001638412475586, -0.006043910980224609, -0.005086183547973633, -0.004128456115722656, -0.0031707286834716797, -0.002213001251220703, -0.0012552738189697266, -0.00029754638671875, 0.0006601810455322266, 0.0016179084777832031, 0.0025756359100341797, 0.0035333633422851562, 0.004491090774536133, 0.005448818206787109, 0.006406545639038086, 0.0073642730712890625, 0.008322000503540039, 0.009279727935791016, 0.010237455368041992, 0.011195182800292969, 0.012152910232543945, 0.013110637664794922, 0.014068365097045898, 0.015026092529296875, 0.01598381996154785, 0.016941547393798828, 0.017899274826049805, 0.01885700225830078, 0.019814729690551758, 0.020772457122802734, 0.02173018455505371, 0.022687911987304688, 0.023645639419555664, 0.02460336685180664, 0.025561094284057617, 0.026518821716308594, 0.02747654914855957, 0.028434276580810547, 0.029392004013061523, 0.0303497314453125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 7.0, 6.0, 8.0, 7.0, 15.0, 16.0, 17.0, 30.0, 39.0, 49.0, 43.0, 58.0, 95.0, 64.0, 93.0, 65.0, 89.0, 60.0, 54.0, 41.0, 24.0, 27.0, 22.0, 14.0, 10.0, 2.0, 5.0, 7.0, 4.0, 4.0, 7.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004848480224609375, -0.0046749114990234375, -0.0045013427734375, -0.0043277740478515625, -0.004154205322265625, -0.0039806365966796875, -0.00380706787109375, -0.0036334991455078125, -0.003459930419921875, -0.0032863616943359375, -0.00311279296875, -0.0029392242431640625, -0.002765655517578125, -0.0025920867919921875, -0.00241851806640625, -0.0022449493408203125, -0.002071380615234375, -0.0018978118896484375, -0.0017242431640625, -0.0015506744384765625, -0.001377105712890625, -0.0012035369873046875, -0.00102996826171875, -0.0008563995361328125, -0.000682830810546875, -0.0005092620849609375, -0.000335693359375, -0.0001621246337890625, 1.1444091796875e-05, 0.0001850128173828125, 0.00035858154296875, 0.0005321502685546875, 0.000705718994140625, 0.0008792877197265625, 0.0010528564453125, 0.0012264251708984375, 0.001399993896484375, 0.0015735626220703125, 0.00174713134765625, 0.0019207000732421875, 0.002094268798828125, 0.0022678375244140625, 0.00244140625, 0.0026149749755859375, 0.002788543701171875, 0.0029621124267578125, 0.00313568115234375, 0.0033092498779296875, 0.003482818603515625, 0.0036563873291015625, 0.0038299560546875, 0.0040035247802734375, 0.004177093505859375, 0.0043506622314453125, 0.00452423095703125, 0.0046977996826171875, 0.004871368408203125, 0.0050449371337890625, 0.005218505859375, 0.0053920745849609375, 0.005565643310546875, 0.0057392120361328125, 0.00591278076171875, 0.0060863494873046875, 0.006259918212890625]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 7.0, 11.0, 16.0, 45.0, 58.0, 144.0, 171.0, 209.0, 129.0, 73.0, 55.0, 35.0, 18.0, 8.0, 8.0, 4.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42667779326438904, -0.4148869514465332, -0.40309613943099976, -0.3913052976131439, -0.3795144557952881, -0.36772364377975464, -0.3559328019618988, -0.34414196014404297, -0.3323511481285095, -0.3205603063106537, -0.30876949429512024, -0.2969786524772644, -0.28518784046173096, -0.2733969986438751, -0.2616061568260193, -0.24981532990932465, -0.23802450299263, -0.22623367607593536, -0.21444284915924072, -0.2026520073413849, -0.19086118042469025, -0.1790703535079956, -0.16727951169013977, -0.15548868477344513, -0.1436978578567505, -0.13190703094005585, -0.12011619657278061, -0.10832536220550537, -0.09653453528881073, -0.08474370837211609, -0.07295287400484085, -0.06116203963756561, -0.04937121272087097, -0.03758038207888603, -0.025789551436901093, -0.013998720794916153, -0.0022078901529312134, 0.009582940489053726, 0.021373771131038666, 0.033164605498313904, 0.044955432415008545, 0.056746263056993484, 0.06853709369897842, 0.08032792806625366, 0.0921187549829483, 0.10390958189964294, 0.11570041626691818, 0.12749125063419342, 0.13928207755088806, 0.1510729044675827, 0.16286373138427734, 0.17465457320213318, 0.18644540011882782, 0.19823622703552246, 0.2100270688533783, 0.22181789577007294, 0.23360872268676758, 0.24539954960346222, 0.25719037652015686, 0.2689812183380127, 0.28077203035354614, 0.292562872171402, 0.3043537139892578, 0.31614452600479126, 0.3279353678226471]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 4.0, 9.0, 2.0, 5.0, 8.0, 14.0, 11.0, 20.0, 19.0, 30.0, 34.0, 51.0, 42.0, 47.0, 55.0, 53.0, 55.0, 71.0, 59.0, 52.0, 60.0, 56.0, 46.0, 51.0, 35.0, 27.0, 26.0, 15.0, 14.0, 4.0, 7.0, 7.0, 7.0, 8.0, 4.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15987694263458252, -0.15445472300052643, -0.14903250336647034, -0.14361026883125305, -0.13818804919719696, -0.13276582956314087, -0.12734359502792358, -0.12192137539386749, -0.1164991557598114, -0.11107693612575531, -0.10565470904111862, -0.10023248195648193, -0.09481026232242584, -0.08938804268836975, -0.08396581560373306, -0.07854358851909637, -0.07312136888504028, -0.06769914925098419, -0.062276922166347504, -0.056854698807001114, -0.051432475447654724, -0.046010252088308334, -0.040588028728961945, -0.035165805369615555, -0.029743582010269165, -0.024321358650922775, -0.018899135291576385, -0.013476911932229996, -0.008054688572883606, -0.002632465213537216, 0.0027897581458091736, 0.008211981505155563, 0.01363418996334076, 0.01905641332268715, 0.02447863668203354, 0.02990086004137993, 0.03532308340072632, 0.04074530676007271, 0.0461675301194191, 0.05158975347876549, 0.05701197683811188, 0.06243420019745827, 0.06785642355680466, 0.07327865064144135, 0.07870087027549744, 0.08412308990955353, 0.08954531699419022, 0.0949675440788269, 0.100389763712883, 0.10581198334693909, 0.11123421043157578, 0.11665643751621246, 0.12207865715026855, 0.12750087678432465, 0.13292309641838074, 0.13834533095359802, 0.1437675505876541, 0.1491897702217102, 0.1546120047569275, 0.16003422439098358, 0.16545644402503967, 0.17087866365909576, 0.17630088329315186, 0.18172311782836914, 0.18714533746242523]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 7.0, 2.0, 8.0, 3.0, 9.0, 16.0, 19.0, 47.0, 56.0, 98.0, 120.0, 180.0, 252.0, 368.0, 561.0, 863.0, 1337.0, 2078.0, 3264.0, 5380.0, 9599.0, 18808.0, 43497.0, 138106.0, 501233.0, 212344.0, 58422.0, 23396.0, 11487.0, 6459.0, 3699.0, 2334.0, 1545.0, 970.0, 631.0, 425.0, 300.0, 194.0, 131.0, 101.0, 56.0, 53.0, 28.0, 26.0, 20.0, 9.0, 2.0, 7.0, 3.0, 6.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.1549072265625, -0.15030288696289062, -0.14569854736328125, -0.14109420776367188, -0.1364898681640625, -0.13188552856445312, -0.12728118896484375, -0.12267684936523438, -0.118072509765625, -0.11346817016601562, -0.10886383056640625, -0.10425949096679688, -0.0996551513671875, -0.09505081176757812, -0.09044647216796875, -0.08584213256835938, -0.08123779296875, -0.07663345336914062, -0.07202911376953125, -0.06742477416992188, -0.0628204345703125, -0.058216094970703125, -0.05361175537109375, -0.049007415771484375, -0.044403076171875, -0.039798736572265625, -0.03519439697265625, -0.030590057373046875, -0.0259857177734375, -0.021381378173828125, -0.01677703857421875, -0.012172698974609375, -0.007568359375, -0.002964019775390625, 0.00164031982421875, 0.006244659423828125, 0.0108489990234375, 0.015453338623046875, 0.02005767822265625, 0.024662017822265625, 0.029266357421875, 0.033870697021484375, 0.03847503662109375, 0.043079376220703125, 0.0476837158203125, 0.052288055419921875, 0.05689239501953125, 0.061496734619140625, 0.06610107421875, 0.07070541381835938, 0.07530975341796875, 0.07991409301757812, 0.0845184326171875, 0.08912277221679688, 0.09372711181640625, 0.09833145141601562, 0.102935791015625, 0.10754013061523438, 0.11214447021484375, 0.11674880981445312, 0.1213531494140625, 0.12595748901367188, 0.13056182861328125, 0.13516616821289062, 0.1397705078125]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 8.0, 13.0, 30.0, 40.0, 55.0, 67.0, 85.0, 103.0, 117.0, 115.0, 94.0, 86.0, 78.0, 40.0, 42.0, 12.0, 13.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.381591796875, -0.3613548278808594, -0.34111785888671875, -0.3208808898925781, -0.3006439208984375, -0.2804069519042969, -0.26016998291015625, -0.23993301391601562, -0.219696044921875, -0.19945907592773438, -0.17922210693359375, -0.15898513793945312, -0.1387481689453125, -0.11851119995117188, -0.09827423095703125, -0.07803726196289062, -0.05780029296875, -0.037563323974609375, -0.01732635498046875, 0.002910614013671875, 0.0231475830078125, 0.043384552001953125, 0.06362152099609375, 0.08385848999023438, 0.104095458984375, 0.12433242797851562, 0.14456939697265625, 0.16480636596679688, 0.1850433349609375, 0.20528030395507812, 0.22551727294921875, 0.24575424194335938, 0.2659912109375, 0.2862281799316406, 0.30646514892578125, 0.3267021179199219, 0.3469390869140625, 0.3671760559082031, 0.38741302490234375, 0.4076499938964844, 0.427886962890625, 0.4481239318847656, 0.46836090087890625, 0.4885978698730469, 0.5088348388671875, 0.5290718078613281, 0.5493087768554688, 0.5695457458496094, 0.58978271484375, 0.6100196838378906, 0.6302566528320312, 0.6504936218261719, 0.6707305908203125, 0.6909675598144531, 0.7112045288085938, 0.7314414978027344, 0.751678466796875, 0.7719154357910156, 0.7921524047851562, 0.8123893737792969, 0.8326263427734375, 0.8528633117675781, 0.8731002807617188, 0.8933372497558594, 0.91357421875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 7.0, 7.0, 17.0, 11.0, 19.0, 18.0, 26.0, 38.0, 46.0, 64.0, 85.0, 95.0, 131.0, 207.0, 379.0, 973.0, 4717.0, 42419.0, 906391.0, 83161.0, 7188.0, 1283.0, 423.0, 236.0, 129.0, 109.0, 85.0, 63.0, 40.0, 44.0, 28.0, 27.0, 19.0, 11.0, 14.0, 8.0, 12.0, 5.0, 4.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.458251953125, -0.4441986083984375, -0.430145263671875, -0.4160919189453125, -0.40203857421875, -0.3879852294921875, -0.373931884765625, -0.3598785400390625, -0.3458251953125, -0.3317718505859375, -0.317718505859375, -0.3036651611328125, -0.28961181640625, -0.2755584716796875, -0.261505126953125, -0.2474517822265625, -0.2333984375, -0.2193450927734375, -0.205291748046875, -0.1912384033203125, -0.17718505859375, -0.1631317138671875, -0.149078369140625, -0.1350250244140625, -0.1209716796875, -0.1069183349609375, -0.092864990234375, -0.0788116455078125, -0.06475830078125, -0.0507049560546875, -0.036651611328125, -0.0225982666015625, -0.008544921875, 0.0055084228515625, 0.019561767578125, 0.0336151123046875, 0.04766845703125, 0.0617218017578125, 0.075775146484375, 0.0898284912109375, 0.1038818359375, 0.1179351806640625, 0.131988525390625, 0.1460418701171875, 0.16009521484375, 0.1741485595703125, 0.188201904296875, 0.2022552490234375, 0.21630859375, 0.2303619384765625, 0.244415283203125, 0.2584686279296875, 0.27252197265625, 0.2865753173828125, 0.300628662109375, 0.3146820068359375, 0.3287353515625, 0.3427886962890625, 0.356842041015625, 0.3708953857421875, 0.38494873046875, 0.3990020751953125, 0.413055419921875, 0.4271087646484375, 0.441162109375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 4.0, 5.0, 10.0, 5.0, 12.0, 14.0, 16.0, 17.0, 26.0, 27.0, 33.0, 24.0, 42.0, 32.0, 43.0, 51.0, 48.0, 45.0, 51.0, 59.0, 51.0, 41.0, 50.0, 32.0, 41.0, 35.0, 29.0, 31.0, 18.0, 19.0, 18.0, 18.0, 13.0, 6.0, 10.0, 5.0, 6.0, 4.0, 5.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.27978515625, -0.2710380554199219, -0.26229095458984375, -0.2535438537597656, -0.2447967529296875, -0.23604965209960938, -0.22730255126953125, -0.21855545043945312, -0.209808349609375, -0.20106124877929688, -0.19231414794921875, -0.18356704711914062, -0.1748199462890625, -0.16607284545898438, -0.15732574462890625, -0.14857864379882812, -0.13983154296875, -0.13108444213867188, -0.12233734130859375, -0.11359024047851562, -0.1048431396484375, -0.09609603881835938, -0.08734893798828125, -0.07860183715820312, -0.069854736328125, -0.061107635498046875, -0.05236053466796875, -0.043613433837890625, -0.0348663330078125, -0.026119232177734375, -0.01737213134765625, -0.008625030517578125, 0.0001220703125, 0.008869171142578125, 0.01761627197265625, 0.026363372802734375, 0.0351104736328125, 0.043857574462890625, 0.05260467529296875, 0.061351776123046875, 0.070098876953125, 0.07884597778320312, 0.08759307861328125, 0.09634017944335938, 0.1050872802734375, 0.11383438110351562, 0.12258148193359375, 0.13132858276367188, 0.14007568359375, 0.14882278442382812, 0.15756988525390625, 0.16631698608398438, 0.1750640869140625, 0.18381118774414062, 0.19255828857421875, 0.20130538940429688, 0.210052490234375, 0.21879959106445312, 0.22754669189453125, 0.23629379272460938, 0.2450408935546875, 0.2537879943847656, 0.26253509521484375, 0.2712821960449219, 0.280029296875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 6.0, 15.0, 13.0, 16.0, 19.0, 42.0, 56.0, 110.0, 229.0, 523.0, 1566.0, 5718.0, 40438.0, 872883.0, 112799.0, 10338.0, 2406.0, 743.0, 265.0, 155.0, 85.0, 39.0, 33.0, 18.0, 9.0, 4.0, 5.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.1707763671875, -0.16598892211914062, -0.16120147705078125, -0.15641403198242188, -0.1516265869140625, -0.14683914184570312, -0.14205169677734375, -0.13726425170898438, -0.132476806640625, -0.12768936157226562, -0.12290191650390625, -0.11811447143554688, -0.1133270263671875, -0.10853958129882812, -0.10375213623046875, -0.09896469116210938, -0.09417724609375, -0.08938980102539062, -0.08460235595703125, -0.07981491088867188, -0.0750274658203125, -0.07024002075195312, -0.06545257568359375, -0.060665130615234375, -0.055877685546875, -0.051090240478515625, -0.04630279541015625, -0.041515350341796875, -0.0367279052734375, -0.031940460205078125, -0.02715301513671875, -0.022365570068359375, -0.017578125, -0.012790679931640625, -0.00800323486328125, -0.003215789794921875, 0.0015716552734375, 0.006359100341796875, 0.01114654541015625, 0.015933990478515625, 0.020721435546875, 0.025508880615234375, 0.03029632568359375, 0.035083770751953125, 0.0398712158203125, 0.044658660888671875, 0.04944610595703125, 0.054233551025390625, 0.05902099609375, 0.06380844116210938, 0.06859588623046875, 0.07338333129882812, 0.0781707763671875, 0.08295822143554688, 0.08774566650390625, 0.09253311157226562, 0.097320556640625, 0.10210800170898438, 0.10689544677734375, 0.11168289184570312, 0.1164703369140625, 0.12125778198242188, 0.12604522705078125, 0.13083267211914062, 0.1356201171875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 2.0, 3.0, 14.0, 10.0, 19.0, 31.0, 28.0, 48.0, 74.0, 88.0, 167.0, 170.0, 97.0, 64.0, 59.0, 25.0, 23.0, 25.0, 11.0, 10.0, 5.0, 7.0, 5.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5616416931152344e-05, -1.5128403902053833e-05, -1.4640390872955322e-05, -1.4152377843856812e-05, -1.36643648147583e-05, -1.317635178565979e-05, -1.268833875656128e-05, -1.2200325727462769e-05, -1.1712312698364258e-05, -1.1224299669265747e-05, -1.0736286640167236e-05, -1.0248273611068726e-05, -9.760260581970215e-06, -9.272247552871704e-06, -8.784234523773193e-06, -8.296221494674683e-06, -7.808208465576172e-06, -7.320195436477661e-06, -6.83218240737915e-06, -6.34416937828064e-06, -5.856156349182129e-06, -5.368143320083618e-06, -4.880130290985107e-06, -4.392117261886597e-06, -3.904104232788086e-06, -3.416091203689575e-06, -2.9280781745910645e-06, -2.4400651454925537e-06, -1.952052116394043e-06, -1.4640390872955322e-06, -9.760260581970215e-07, -4.880130290985107e-07, 0.0, 4.880130290985107e-07, 9.760260581970215e-07, 1.4640390872955322e-06, 1.952052116394043e-06, 2.4400651454925537e-06, 2.9280781745910645e-06, 3.416091203689575e-06, 3.904104232788086e-06, 4.392117261886597e-06, 4.880130290985107e-06, 5.368143320083618e-06, 5.856156349182129e-06, 6.34416937828064e-06, 6.83218240737915e-06, 7.320195436477661e-06, 7.808208465576172e-06, 8.296221494674683e-06, 8.784234523773193e-06, 9.272247552871704e-06, 9.760260581970215e-06, 1.0248273611068726e-05, 1.0736286640167236e-05, 1.1224299669265747e-05, 1.1712312698364258e-05, 1.2200325727462769e-05, 1.268833875656128e-05, 1.317635178565979e-05, 1.36643648147583e-05, 1.4152377843856812e-05, 1.4640390872955322e-05, 1.5128403902053833e-05, 1.5616416931152344e-05]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 6.0, 2.0, 8.0, 4.0, 7.0, 10.0, 17.0, 23.0, 30.0, 25.0, 54.0, 90.0, 150.0, 351.0, 1019.0, 3974.0, 26115.0, 905590.0, 100095.0, 8219.0, 1714.0, 549.0, 203.0, 88.0, 60.0, 38.0, 27.0, 17.0, 14.0, 14.0, 8.0, 5.0, 8.0, 8.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1922607421875, -0.18556594848632812, -0.17887115478515625, -0.17217636108398438, -0.1654815673828125, -0.15878677368164062, -0.15209197998046875, -0.14539718627929688, -0.138702392578125, -0.13200759887695312, -0.12531280517578125, -0.11861801147460938, -0.1119232177734375, -0.10522842407226562, -0.09853363037109375, -0.09183883666992188, -0.08514404296875, -0.07844924926757812, -0.07175445556640625, -0.06505966186523438, -0.0583648681640625, -0.051670074462890625, -0.04497528076171875, -0.038280487060546875, -0.031585693359375, -0.024890899658203125, -0.01819610595703125, -0.011501312255859375, -0.0048065185546875, 0.001888275146484375, 0.00858306884765625, 0.015277862548828125, 0.02197265625, 0.028667449951171875, 0.03536224365234375, 0.042057037353515625, 0.0487518310546875, 0.055446624755859375, 0.06214141845703125, 0.06883621215820312, 0.075531005859375, 0.08222579956054688, 0.08892059326171875, 0.09561538696289062, 0.1023101806640625, 0.10900497436523438, 0.11569976806640625, 0.12239456176757812, 0.12908935546875, 0.13578414916992188, 0.14247894287109375, 0.14917373657226562, 0.1558685302734375, 0.16256332397460938, 0.16925811767578125, 0.17595291137695312, 0.182647705078125, 0.18934249877929688, 0.19603729248046875, 0.20273208618164062, 0.2094268798828125, 0.21612167358398438, 0.22281646728515625, 0.22951126098632812, 0.2362060546875]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 2.0, 2.0, 4.0, 3.0, 5.0, 7.0, 6.0, 9.0, 9.0, 14.0, 12.0, 34.0, 48.0, 80.0, 123.0, 166.0, 156.0, 98.0, 60.0, 38.0, 28.0, 21.0, 17.0, 14.0, 7.0, 8.0, 7.0, 4.0, 6.0, 4.0, 0.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048309326171875, -0.046781063079833984, -0.04525279998779297, -0.04372453689575195, -0.04219627380371094, -0.04066801071166992, -0.039139747619628906, -0.03761148452758789, -0.036083221435546875, -0.03455495834350586, -0.033026695251464844, -0.03149843215942383, -0.029970169067382812, -0.028441905975341797, -0.02691364288330078, -0.025385379791259766, -0.02385711669921875, -0.022328853607177734, -0.02080059051513672, -0.019272327423095703, -0.017744064331054688, -0.016215801239013672, -0.014687538146972656, -0.01315927505493164, -0.011631011962890625, -0.01010274887084961, -0.008574485778808594, -0.007046222686767578, -0.0055179595947265625, -0.003989696502685547, -0.0024614334106445312, -0.0009331703186035156, 0.0005950927734375, 0.0021233558654785156, 0.0036516189575195312, 0.005179882049560547, 0.0067081451416015625, 0.008236408233642578, 0.009764671325683594, 0.01129293441772461, 0.012821197509765625, 0.01434946060180664, 0.015877723693847656, 0.017405986785888672, 0.018934249877929688, 0.020462512969970703, 0.02199077606201172, 0.023519039154052734, 0.02504730224609375, 0.026575565338134766, 0.02810382843017578, 0.029632091522216797, 0.031160354614257812, 0.03268861770629883, 0.034216880798339844, 0.03574514389038086, 0.037273406982421875, 0.03880167007446289, 0.040329933166503906, 0.04185819625854492, 0.04338645935058594, 0.04491472244262695, 0.04644298553466797, 0.047971248626708984, 0.04949951171875]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 6.0, 8.0, 18.0, 53.0, 95.0, 233.0, 290.0, 167.0, 77.0, 31.0, 15.0, 9.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5648092031478882, -1.530989170074463, -1.497169017791748, -1.4633489847183228, -1.429528832435608, -1.3957087993621826, -1.3618886470794678, -1.3280686140060425, -1.2942485809326172, -1.260428547859192, -1.226608395576477, -1.1927883625030518, -1.158968210220337, -1.1251481771469116, -1.0913281440734863, -1.0575079917907715, -1.0236878395080566, -0.9898677468299866, -0.9560476541519165, -0.9222276210784912, -0.8884075284004211, -0.8545874357223511, -0.820767343044281, -0.7869472503662109, -0.7531272172927856, -0.7193071246147156, -0.6854870319366455, -0.6516669988632202, -0.6178469061851501, -0.5840268135070801, -0.55020672082901, -0.5163866281509399, -0.48256659507751465, -0.4487465023994446, -0.4149264395236969, -0.38110634684562683, -0.34728628396987915, -0.3134661912918091, -0.279646098613739, -0.24582602083683014, -0.21200594305992126, -0.1781858652830124, -0.14436578750610352, -0.11054569482803345, -0.07672561705112457, -0.0429055392742157, -0.00908544659614563, 0.024734631180763245, 0.05855470895767212, 0.092374786734581, 0.12619486451148987, 0.16001495718955994, 0.1938350349664688, 0.22765511274337769, 0.26147520542144775, 0.2952952980995178, 0.3291153609752655, 0.36293545365333557, 0.39675551652908325, 0.4305756092071533, 0.4643957018852234, 0.49821576476097107, 0.5320358276367188, 0.5658559203147888, 0.5996760129928589]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 6.0, 8.0, 13.0, 24.0, 22.0, 43.0, 54.0, 44.0, 44.0, 74.0, 67.0, 67.0, 70.0, 63.0, 74.0, 58.0, 55.0, 51.0, 37.0, 29.0, 25.0, 18.0, 22.0, 11.0, 8.0, 6.0, 6.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.49517568945884705, -0.47226420044898987, -0.4493526816368103, -0.4264411926269531, -0.40352967381477356, -0.3806181848049164, -0.3577066659927368, -0.33479517698287964, -0.31188368797302246, -0.2889721989631653, -0.2660606801509857, -0.24314919114112854, -0.22023767232894897, -0.1973261833190918, -0.17441467940807343, -0.15150317549705505, -0.1285916566848755, -0.10568015277385712, -0.08276864886283875, -0.05985715240240097, -0.0369456484913826, -0.014034144580364227, 0.008877351880073547, 0.03178885579109192, 0.05470035970211029, 0.07761186361312866, 0.10052336752414703, 0.12343486398458481, 0.14634636044502258, 0.16925787925720215, 0.19216936826705933, 0.2150808721780777, 0.23799240589141846, 0.26090389490127563, 0.2838154137134552, 0.3067269027233124, 0.32963842153549194, 0.3525499105453491, 0.3754613995552063, 0.39837291836738586, 0.42128443717956543, 0.4441959261894226, 0.4671074450016022, 0.49001893401145935, 0.5129304528236389, 0.5358419418334961, 0.5587534308433533, 0.5816649198532104, 0.6045764684677124, 0.6274879574775696, 0.6503994464874268, 0.6733109951019287, 0.6962224841117859, 0.7191339731216431, 0.7420454621315002, 0.7649569511413574, 0.7878684401512146, 0.8107799291610718, 0.833691418170929, 0.8566029667854309, 0.8795144557952881, 0.9024259448051453, 0.9253374338150024, 0.9482489824295044, 0.9711604714393616]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 11.0, 7.0, 10.0, 14.0, 23.0, 25.0, 37.0, 45.0, 88.0, 129.0, 172.0, 248.0, 367.0, 560.0, 911.0, 1515.0, 2492.0, 4735.0, 9707.0, 30600.0, 250841.0, 2427804.0, 1311144.0, 115765.0, 20135.0, 7778.0, 3837.0, 1991.0, 1164.0, 712.0, 478.0, 314.0, 185.0, 128.0, 91.0, 59.0, 45.0, 27.0, 25.0, 16.0, 7.0, 10.0, 6.0, 11.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.2822265625, -0.2736320495605469, -0.26503753662109375, -0.2564430236816406, -0.2478485107421875, -0.23925399780273438, -0.23065948486328125, -0.22206497192382812, -0.213470458984375, -0.20487594604492188, -0.19628143310546875, -0.18768692016601562, -0.1790924072265625, -0.17049789428710938, -0.16190338134765625, -0.15330886840820312, -0.14471435546875, -0.13611984252929688, -0.12752532958984375, -0.11893081665039062, -0.1103363037109375, -0.10174179077148438, -0.09314727783203125, -0.08455276489257812, -0.075958251953125, -0.06736373901367188, -0.05876922607421875, -0.050174713134765625, -0.0415802001953125, -0.032985687255859375, -0.02439117431640625, -0.015796661376953125, -0.0072021484375, 0.001392364501953125, 0.00998687744140625, 0.018581390380859375, 0.0271759033203125, 0.035770416259765625, 0.04436492919921875, 0.052959442138671875, 0.061553955078125, 0.07014846801757812, 0.07874298095703125, 0.08733749389648438, 0.0959320068359375, 0.10452651977539062, 0.11312103271484375, 0.12171554565429688, 0.13031005859375, 0.13890457153320312, 0.14749908447265625, 0.15609359741210938, 0.1646881103515625, 0.17328262329101562, 0.18187713623046875, 0.19047164916992188, 0.199066162109375, 0.20766067504882812, 0.21625518798828125, 0.22484970092773438, 0.2334442138671875, 0.24203872680664062, 0.25063323974609375, 0.2592277526855469, 0.267822265625]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 6.0, 4.0, 5.0, 15.0, 8.0, 22.0, 14.0, 18.0, 36.0, 44.0, 49.0, 45.0, 44.0, 53.0, 56.0, 47.0, 62.0, 65.0, 47.0, 49.0, 51.0, 35.0, 39.0, 40.0, 26.0, 26.0, 23.0, 18.0, 15.0, 11.0, 10.0, 6.0, 9.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.2568359375, -0.2503662109375, -0.243896484375, -0.2374267578125, -0.23095703125, -0.2244873046875, -0.218017578125, -0.2115478515625, -0.205078125, -0.1986083984375, -0.192138671875, -0.1856689453125, -0.17919921875, -0.1727294921875, -0.166259765625, -0.1597900390625, -0.1533203125, -0.1468505859375, -0.140380859375, -0.1339111328125, -0.12744140625, -0.1209716796875, -0.114501953125, -0.1080322265625, -0.1015625, -0.0950927734375, -0.088623046875, -0.0821533203125, -0.07568359375, -0.0692138671875, -0.062744140625, -0.0562744140625, -0.0498046875, -0.0433349609375, -0.036865234375, -0.0303955078125, -0.02392578125, -0.0174560546875, -0.010986328125, -0.0045166015625, 0.001953125, 0.0084228515625, 0.014892578125, 0.0213623046875, 0.02783203125, 0.0343017578125, 0.040771484375, 0.0472412109375, 0.0537109375, 0.0601806640625, 0.066650390625, 0.0731201171875, 0.07958984375, 0.0860595703125, 0.092529296875, 0.0989990234375, 0.10546875, 0.1119384765625, 0.118408203125, 0.1248779296875, 0.13134765625, 0.1378173828125, 0.144287109375, 0.1507568359375, 0.1572265625]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 5.0, 3.0, 12.0, 13.0, 13.0, 16.0, 23.0, 28.0, 46.0, 62.0, 127.0, 305.0, 961.0, 5287.0, 94076.0, 4050887.0, 37992.0, 3259.0, 674.0, 225.0, 85.0, 62.0, 35.0, 20.0, 15.0, 7.0, 11.0, 9.0, 7.0, 6.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74169921875, -0.7187957763671875, -0.695892333984375, -0.6729888916015625, -0.65008544921875, -0.6271820068359375, -0.604278564453125, -0.5813751220703125, -0.5584716796875, -0.5355682373046875, -0.512664794921875, -0.4897613525390625, -0.46685791015625, -0.4439544677734375, -0.421051025390625, -0.3981475830078125, -0.375244140625, -0.3523406982421875, -0.329437255859375, -0.3065338134765625, -0.28363037109375, -0.2607269287109375, -0.237823486328125, -0.2149200439453125, -0.1920166015625, -0.1691131591796875, -0.146209716796875, -0.1233062744140625, -0.10040283203125, -0.0774993896484375, -0.054595947265625, -0.0316925048828125, -0.0087890625, 0.0141143798828125, 0.037017822265625, 0.0599212646484375, 0.08282470703125, 0.1057281494140625, 0.128631591796875, 0.1515350341796875, 0.1744384765625, 0.1973419189453125, 0.220245361328125, 0.2431488037109375, 0.26605224609375, 0.2889556884765625, 0.311859130859375, 0.3347625732421875, 0.357666015625, 0.3805694580078125, 0.403472900390625, 0.4263763427734375, 0.44927978515625, 0.4721832275390625, 0.495086669921875, 0.5179901123046875, 0.5408935546875, 0.5637969970703125, 0.586700439453125, 0.6096038818359375, 0.63250732421875, 0.6554107666015625, 0.678314208984375, 0.7012176513671875, 0.72412109375]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 5.0, 6.0, 8.0, 7.0, 14.0, 11.0, 17.0, 25.0, 47.0, 61.0, 99.0, 186.0, 338.0, 566.0, 898.0, 687.0, 468.0, 209.0, 142.0, 70.0, 42.0, 32.0, 33.0, 20.0, 12.0, 19.0, 11.0, 12.0, 5.0, 1.0, 9.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08184814453125, -0.07934188842773438, -0.07683563232421875, -0.07432937622070312, -0.0718231201171875, -0.06931686401367188, -0.06681060791015625, -0.06430435180664062, -0.061798095703125, -0.059291839599609375, -0.05678558349609375, -0.054279327392578125, -0.0517730712890625, -0.049266815185546875, -0.04676055908203125, -0.044254302978515625, -0.041748046875, -0.039241790771484375, -0.03673553466796875, -0.034229278564453125, -0.0317230224609375, -0.029216766357421875, -0.02671051025390625, -0.024204254150390625, -0.021697998046875, -0.019191741943359375, -0.01668548583984375, -0.014179229736328125, -0.0116729736328125, -0.009166717529296875, -0.00666046142578125, -0.004154205322265625, -0.00164794921875, 0.000858306884765625, 0.00336456298828125, 0.005870819091796875, 0.0083770751953125, 0.010883331298828125, 0.01338958740234375, 0.015895843505859375, 0.018402099609375, 0.020908355712890625, 0.02341461181640625, 0.025920867919921875, 0.0284271240234375, 0.030933380126953125, 0.03343963623046875, 0.035945892333984375, 0.0384521484375, 0.040958404541015625, 0.04346466064453125, 0.045970916748046875, 0.0484771728515625, 0.050983428955078125, 0.05348968505859375, 0.055995941162109375, 0.058502197265625, 0.061008453369140625, 0.06351470947265625, 0.06602096557617188, 0.0685272216796875, 0.07103347778320312, 0.07353973388671875, 0.07604598999023438, 0.07855224609375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 8.0, 5.0, 8.0, 16.0, 16.0, 15.0, 28.0, 50.0, 93.0, 134.0, 174.0, 158.0, 97.0, 75.0, 49.0, 28.0, 18.0, 9.0, 9.0, 9.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45745858550071716, -0.4438287913799286, -0.43019899725914, -0.41656923294067383, -0.40293943881988525, -0.3893096446990967, -0.3756798505783081, -0.36205005645751953, -0.34842029213905334, -0.33479049801826477, -0.3211607038974762, -0.30753093957901, -0.29390114545822144, -0.28027135133743286, -0.2666415572166443, -0.2530117630958557, -0.23938198387622833, -0.22575218975543976, -0.21212241053581238, -0.1984926164150238, -0.18486283719539642, -0.17123304307460785, -0.15760326385498047, -0.1439734697341919, -0.13034367561340332, -0.11671388894319534, -0.10308410227298737, -0.08945430815219879, -0.07582452893257141, -0.06219473481178284, -0.04856494814157486, -0.03493516147136688, -0.021305382251739502, -0.00767559465020895, 0.005954192951321602, 0.01958398148417473, 0.033213768154382706, 0.04684355854988098, 0.06047334522008896, 0.07410313189029694, 0.08773291856050491, 0.10136270523071289, 0.11499249190092087, 0.12862227857112885, 0.14225207269191742, 0.1558818519115448, 0.16951164603233337, 0.18314144015312195, 0.19677121937274933, 0.2104010134935379, 0.22403079271316528, 0.23766058683395386, 0.25129038095474243, 0.264920175075531, 0.2785499393939972, 0.29217973351478577, 0.30580952763557434, 0.3194393217563629, 0.3330691158771515, 0.3466988801956177, 0.36032867431640625, 0.3739584684371948, 0.3875882625579834, 0.401218056678772, 0.41484782099723816]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 9.0, 13.0, 9.0, 20.0, 16.0, 20.0, 18.0, 23.0, 33.0, 46.0, 35.0, 46.0, 59.0, 57.0, 39.0, 37.0, 47.0, 40.0, 44.0, 49.0, 54.0, 42.0, 35.0, 36.0, 29.0, 32.0, 26.0, 18.0, 18.0, 16.0, 9.0, 10.0, 4.0, 5.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.21785898506641388, -0.21156637370586395, -0.20527376234531403, -0.1989811509847641, -0.19268853962421417, -0.18639592826366425, -0.18010330200195312, -0.1738106906414032, -0.16751807928085327, -0.16122546792030334, -0.15493285655975342, -0.1486402451992035, -0.14234763383865356, -0.13605502247810364, -0.1297624111175537, -0.12346979230642319, -0.11717718839645386, -0.11088457703590393, -0.104591965675354, -0.09829935431480408, -0.09200674295425415, -0.08571413159370422, -0.0794215127825737, -0.07312890142202377, -0.06683629006147385, -0.06054367870092392, -0.05425106734037399, -0.04795845225453377, -0.04166584089398384, -0.035373229533433914, -0.02908061444759369, -0.022788003087043762, -0.01649537682533264, -0.01020276453346014, -0.003910152241587639, 0.002382460981607437, 0.008675072342157364, 0.01496768370270729, 0.021260298788547516, 0.027552910149097443, 0.03384552150964737, 0.040138132870197296, 0.04643074423074722, 0.05272335931658745, 0.059015970677137375, 0.0653085857629776, 0.07160119712352753, 0.07789380848407745, 0.08418641984462738, 0.09047903120517731, 0.09677164256572723, 0.10306425392627716, 0.10935686528682709, 0.11564947664737701, 0.12194209545850754, 0.12823471426963806, 0.134527325630188, 0.14081993699073792, 0.14711254835128784, 0.15340515971183777, 0.1596977710723877, 0.16599038243293762, 0.17228299379348755, 0.17857560515403748, 0.1848682165145874]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 6.0, 1.0, 3.0, 4.0, 4.0, 4.0, 5.0, 3.0, 7.0, 9.0, 28.0, 21.0, 38.0, 57.0, 64.0, 111.0, 196.0, 266.0, 501.0, 868.0, 1529.0, 2752.0, 5301.0, 12075.0, 41414.0, 328998.0, 560613.0, 64244.0, 15599.0, 6316.0, 3206.0, 1718.0, 1012.0, 612.0, 328.0, 211.0, 139.0, 92.0, 74.0, 35.0, 25.0, 19.0, 7.0, 8.0, 5.0, 4.0, 8.0, 7.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.08587646484375, -0.08328437805175781, -0.08069229125976562, -0.07810020446777344, -0.07550811767578125, -0.07291603088378906, -0.07032394409179688, -0.06773185729980469, -0.0651397705078125, -0.06254768371582031, -0.059955596923828125, -0.05736351013183594, -0.05477142333984375, -0.05217933654785156, -0.049587249755859375, -0.04699516296386719, -0.044403076171875, -0.04181098937988281, -0.039218902587890625, -0.03662681579589844, -0.03403472900390625, -0.03144264221191406, -0.028850555419921875, -0.026258468627929688, -0.0236663818359375, -0.021074295043945312, -0.018482208251953125, -0.015890121459960938, -0.01329803466796875, -0.010705947875976562, -0.008113861083984375, -0.0055217742919921875, -0.0029296875, -0.0003376007080078125, 0.002254486083984375, 0.0048465728759765625, 0.00743865966796875, 0.010030746459960938, 0.012622833251953125, 0.015214920043945312, 0.0178070068359375, 0.020399093627929688, 0.022991180419921875, 0.025583267211914062, 0.02817535400390625, 0.030767440795898438, 0.033359527587890625, 0.03595161437988281, 0.038543701171875, 0.04113578796386719, 0.043727874755859375, 0.04631996154785156, 0.04891204833984375, 0.05150413513183594, 0.054096221923828125, 0.05668830871582031, 0.0592803955078125, 0.06187248229980469, 0.06446456909179688, 0.06705665588378906, 0.06964874267578125, 0.07224082946777344, 0.07483291625976562, 0.07742500305175781, 0.08001708984375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 6.0, 4.0, 8.0, 11.0, 21.0, 17.0, 24.0, 30.0, 37.0, 44.0, 54.0, 58.0, 69.0, 62.0, 64.0, 66.0, 61.0, 64.0, 60.0, 62.0, 42.0, 38.0, 25.0, 28.0, 19.0, 12.0, 9.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1717529296875, -0.16596031188964844, -0.16016769409179688, -0.1543750762939453, -0.14858245849609375, -0.1427898406982422, -0.13699722290039062, -0.13120460510253906, -0.1254119873046875, -0.11961936950683594, -0.11382675170898438, -0.10803413391113281, -0.10224151611328125, -0.09644889831542969, -0.09065628051757812, -0.08486366271972656, -0.079071044921875, -0.07327842712402344, -0.06748580932617188, -0.06169319152832031, -0.05590057373046875, -0.05010795593261719, -0.044315338134765625, -0.03852272033691406, -0.0327301025390625, -0.026937484741210938, -0.021144866943359375, -0.015352249145507812, -0.00955963134765625, -0.0037670135498046875, 0.002025604248046875, 0.007818222045898438, 0.01361083984375, 0.019403457641601562, 0.025196075439453125, 0.030988693237304688, 0.03678131103515625, 0.04257392883300781, 0.048366546630859375, 0.05415916442871094, 0.0599517822265625, 0.06574440002441406, 0.07153701782226562, 0.07732963562011719, 0.08312225341796875, 0.08891487121582031, 0.09470748901367188, 0.10050010681152344, 0.106292724609375, 0.11208534240722656, 0.11787796020507812, 0.12367057800292969, 0.12946319580078125, 0.1352558135986328, 0.14104843139648438, 0.14684104919433594, 0.1526336669921875, 0.15842628479003906, 0.16421890258789062, 0.1700115203857422, 0.17580413818359375, 0.1815967559814453, 0.18738937377929688, 0.19318199157714844, 0.198974609375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 2.0, 5.0, 7.0, 15.0, 10.0, 26.0, 40.0, 56.0, 107.0, 233.0, 532.0, 1370.0, 4996.0, 25992.0, 579441.0, 408577.0, 20509.0, 4315.0, 1354.0, 478.0, 219.0, 94.0, 44.0, 32.0, 29.0, 16.0, 13.0, 4.0, 4.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.127685546875, -0.123809814453125, -0.11993408203125, -0.116058349609375, -0.1121826171875, -0.108306884765625, -0.10443115234375, -0.100555419921875, -0.0966796875, -0.092803955078125, -0.08892822265625, -0.085052490234375, -0.0811767578125, -0.077301025390625, -0.07342529296875, -0.069549560546875, -0.065673828125, -0.061798095703125, -0.05792236328125, -0.054046630859375, -0.0501708984375, -0.046295166015625, -0.04241943359375, -0.038543701171875, -0.03466796875, -0.030792236328125, -0.02691650390625, -0.023040771484375, -0.0191650390625, -0.015289306640625, -0.01141357421875, -0.007537841796875, -0.003662109375, 0.000213623046875, 0.00408935546875, 0.007965087890625, 0.0118408203125, 0.015716552734375, 0.01959228515625, 0.023468017578125, 0.02734375, 0.031219482421875, 0.03509521484375, 0.038970947265625, 0.0428466796875, 0.046722412109375, 0.05059814453125, 0.054473876953125, 0.058349609375, 0.062225341796875, 0.06610107421875, 0.069976806640625, 0.0738525390625, 0.077728271484375, 0.08160400390625, 0.085479736328125, 0.08935546875, 0.093231201171875, 0.09710693359375, 0.100982666015625, 0.1048583984375, 0.108734130859375, 0.11260986328125, 0.116485595703125, 0.120361328125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 3.0, 9.0, 5.0, 10.0, 14.0, 11.0, 17.0, 17.0, 20.0, 25.0, 31.0, 24.0, 32.0, 34.0, 30.0, 45.0, 40.0, 54.0, 43.0, 52.0, 36.0, 41.0, 40.0, 38.0, 40.0, 34.0, 32.0, 32.0, 29.0, 20.0, 24.0, 21.0, 18.0, 17.0, 11.0, 16.0, 8.0, 8.0, 4.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.274658203125, -0.26700592041015625, -0.2593536376953125, -0.25170135498046875, -0.244049072265625, -0.23639678955078125, -0.2287445068359375, -0.22109222412109375, -0.21343994140625, -0.20578765869140625, -0.1981353759765625, -0.19048309326171875, -0.182830810546875, -0.17517852783203125, -0.1675262451171875, -0.15987396240234375, -0.1522216796875, -0.14456939697265625, -0.1369171142578125, -0.12926483154296875, -0.121612548828125, -0.11396026611328125, -0.1063079833984375, -0.09865570068359375, -0.09100341796875, -0.08335113525390625, -0.0756988525390625, -0.06804656982421875, -0.060394287109375, -0.05274200439453125, -0.0450897216796875, -0.03743743896484375, -0.02978515625, -0.02213287353515625, -0.0144805908203125, -0.00682830810546875, 0.000823974609375, 0.00847625732421875, 0.0161285400390625, 0.02378082275390625, 0.03143310546875, 0.03908538818359375, 0.0467376708984375, 0.05438995361328125, 0.062042236328125, 0.06969451904296875, 0.0773468017578125, 0.08499908447265625, 0.0926513671875, 0.10030364990234375, 0.1079559326171875, 0.11560821533203125, 0.123260498046875, 0.13091278076171875, 0.1385650634765625, 0.14621734619140625, 0.15386962890625, 0.16152191162109375, 0.1691741943359375, 0.17682647705078125, 0.184478759765625, 0.19213104248046875, 0.1997833251953125, 0.20743560791015625, 0.215087890625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 6.0, 12.0, 15.0, 16.0, 26.0, 36.0, 54.0, 128.0, 256.0, 606.0, 1897.0, 8058.0, 63085.0, 756528.0, 195760.0, 17067.0, 3280.0, 983.0, 327.0, 178.0, 76.0, 61.0, 34.0, 22.0, 6.0, 15.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0298309326171875, -0.028826475143432617, -0.027822017669677734, -0.02681756019592285, -0.02581310272216797, -0.024808645248413086, -0.023804187774658203, -0.02279973030090332, -0.021795272827148438, -0.020790815353393555, -0.019786357879638672, -0.01878190040588379, -0.017777442932128906, -0.016772985458374023, -0.01576852798461914, -0.014764070510864258, -0.013759613037109375, -0.012755155563354492, -0.01175069808959961, -0.010746240615844727, -0.009741783142089844, -0.008737325668334961, -0.007732868194580078, -0.006728410720825195, -0.0057239532470703125, -0.00471949577331543, -0.003715038299560547, -0.002710580825805664, -0.0017061233520507812, -0.0007016658782958984, 0.0003027915954589844, 0.0013072490692138672, 0.00231170654296875, 0.003316164016723633, 0.004320621490478516, 0.0053250789642333984, 0.006329536437988281, 0.007333993911743164, 0.008338451385498047, 0.00934290885925293, 0.010347366333007812, 0.011351823806762695, 0.012356281280517578, 0.013360738754272461, 0.014365196228027344, 0.015369653701782227, 0.01637411117553711, 0.017378568649291992, 0.018383026123046875, 0.019387483596801758, 0.02039194107055664, 0.021396398544311523, 0.022400856018066406, 0.02340531349182129, 0.024409770965576172, 0.025414228439331055, 0.026418685913085938, 0.02742314338684082, 0.028427600860595703, 0.029432058334350586, 0.03043651580810547, 0.03144097328186035, 0.032445430755615234, 0.03344988822937012, 0.034454345703125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 6.0, 6.0, 11.0, 13.0, 34.0, 48.0, 68.0, 96.0, 154.0, 133.0, 117.0, 87.0, 87.0, 58.0, 29.0, 21.0, 14.0, 10.0, 9.0, 2.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8835067749023438e-05, -1.840386539697647e-05, -1.7972663044929504e-05, -1.7541460692882538e-05, -1.711025834083557e-05, -1.6679055988788605e-05, -1.6247853636741638e-05, -1.581665128469467e-05, -1.5385448932647705e-05, -1.4954246580600739e-05, -1.4523044228553772e-05, -1.4091841876506805e-05, -1.3660639524459839e-05, -1.3229437172412872e-05, -1.2798234820365906e-05, -1.236703246831894e-05, -1.1935830116271973e-05, -1.1504627764225006e-05, -1.107342541217804e-05, -1.0642223060131073e-05, -1.0211020708084106e-05, -9.77981835603714e-06, -9.348616003990173e-06, -8.917413651943207e-06, -8.48621129989624e-06, -8.055008947849274e-06, -7.623806595802307e-06, -7.1926042437553406e-06, -6.761401891708374e-06, -6.3301995396614075e-06, -5.898997187614441e-06, -5.467794835567474e-06, -5.036592483520508e-06, -4.605390131473541e-06, -4.174187779426575e-06, -3.742985427379608e-06, -3.3117830753326416e-06, -2.880580723285675e-06, -2.4493783712387085e-06, -2.018176019191742e-06, -1.5869736671447754e-06, -1.1557713150978088e-06, -7.245689630508423e-07, -2.9336661100387573e-07, 1.3783574104309082e-07, 5.690380930900574e-07, 1.000240445137024e-06, 1.4314427971839905e-06, 1.862645149230957e-06, 2.2938475012779236e-06, 2.72504985332489e-06, 3.1562522053718567e-06, 3.5874545574188232e-06, 4.01865690946579e-06, 4.449859261512756e-06, 4.881061613559723e-06, 5.3122639656066895e-06, 5.743466317653656e-06, 6.1746686697006226e-06, 6.605871021747589e-06, 7.037073373794556e-06, 7.468275725841522e-06, 7.899478077888489e-06, 8.330680429935455e-06, 8.761882781982422e-06]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 5.0, 6.0, 20.0, 25.0, 43.0, 77.0, 130.0, 265.0, 830.0, 3275.0, 22470.0, 565842.0, 433139.0, 18371.0, 2686.0, 713.0, 285.0, 142.0, 90.0, 55.0, 29.0, 23.0, 16.0, 8.0, 5.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.05169677734375, -0.050464630126953125, -0.04923248291015625, -0.048000335693359375, -0.0467681884765625, -0.045536041259765625, -0.04430389404296875, -0.043071746826171875, -0.041839599609375, -0.040607452392578125, -0.03937530517578125, -0.038143157958984375, -0.0369110107421875, -0.035678863525390625, -0.03444671630859375, -0.033214569091796875, -0.031982421875, -0.030750274658203125, -0.02951812744140625, -0.028285980224609375, -0.0270538330078125, -0.025821685791015625, -0.02458953857421875, -0.023357391357421875, -0.022125244140625, -0.020893096923828125, -0.01966094970703125, -0.018428802490234375, -0.0171966552734375, -0.015964508056640625, -0.01473236083984375, -0.013500213623046875, -0.01226806640625, -0.011035919189453125, -0.00980377197265625, -0.008571624755859375, -0.0073394775390625, -0.006107330322265625, -0.00487518310546875, -0.003643035888671875, -0.002410888671875, -0.001178741455078125, 5.340576171875e-05, 0.001285552978515625, 0.0025177001953125, 0.003749847412109375, 0.00498199462890625, 0.006214141845703125, 0.0074462890625, 0.008678436279296875, 0.00991058349609375, 0.011142730712890625, 0.0123748779296875, 0.013607025146484375, 0.01483917236328125, 0.016071319580078125, 0.017303466796875, 0.018535614013671875, 0.01976776123046875, 0.020999908447265625, 0.0222320556640625, 0.023464202880859375, 0.02469635009765625, 0.025928497314453125, 0.02716064453125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 4.0, 15.0, 12.0, 23.0, 30.0, 46.0, 63.0, 109.0, 151.0, 143.0, 122.0, 97.0, 66.0, 36.0, 27.0, 26.0, 16.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.005329132080078125, -0.005089461803436279, -0.004849791526794434, -0.004610121250152588, -0.004370450973510742, -0.0041307806968688965, -0.0038911104202270508, -0.003651440143585205, -0.0034117698669433594, -0.0031720995903015137, -0.002932429313659668, -0.0026927590370178223, -0.0024530887603759766, -0.002213418483734131, -0.001973748207092285, -0.0017340779304504395, -0.0014944076538085938, -0.001254737377166748, -0.0010150671005249023, -0.0007753968238830566, -0.0005357265472412109, -0.00029605627059936523, -5.638599395751953e-05, 0.00018328428268432617, 0.0004229545593261719, 0.0006626248359680176, 0.0009022951126098633, 0.001141965389251709, 0.0013816356658935547, 0.0016213059425354004, 0.001860976219177246, 0.002100646495819092, 0.0023403167724609375, 0.002579987049102783, 0.002819657325744629, 0.0030593276023864746, 0.0032989978790283203, 0.003538668155670166, 0.0037783384323120117, 0.004018008708953857, 0.004257678985595703, 0.004497349262237549, 0.0047370195388793945, 0.00497668981552124, 0.005216360092163086, 0.005456030368804932, 0.005695700645446777, 0.005935370922088623, 0.006175041198730469, 0.0064147114753723145, 0.00665438175201416, 0.006894052028656006, 0.0071337223052978516, 0.007373392581939697, 0.007613062858581543, 0.007852733135223389, 0.008092403411865234, 0.00833207368850708, 0.008571743965148926, 0.008811414241790771, 0.009051084518432617, 0.009290754795074463, 0.009530425071716309, 0.009770095348358154, 0.010009765625]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 6.0, 11.0, 18.0, 27.0, 58.0, 147.0, 282.0, 248.0, 123.0, 40.0, 29.0, 9.0, 8.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61208176612854, -0.5970747470855713, -0.5820677280426025, -0.5670607686042786, -0.5520537495613098, -0.5370467305183411, -0.5220397114753723, -0.5070327520370483, -0.4920257329940796, -0.47701871395111084, -0.4620117247104645, -0.4470047056674957, -0.43199771642684937, -0.4169906973838806, -0.40198370814323425, -0.3869766891002655, -0.37196969985961914, -0.3569626808166504, -0.34195569157600403, -0.3269486725330353, -0.3119416832923889, -0.29693466424942017, -0.2819276750087738, -0.26692065596580505, -0.2519136369228363, -0.23690663278102875, -0.2218996286392212, -0.20689262449741364, -0.19188562035560608, -0.17687860131263733, -0.16187161207199097, -0.14686459302902222, -0.13185760378837585, -0.1168505996465683, -0.10184359550476074, -0.08683659136295319, -0.07182958722114563, -0.05682257562875748, -0.04181557148694992, -0.026808567345142365, -0.011801563203334808, 0.0032054418697953224, 0.018212446942925453, 0.03321945294737816, 0.048226457089185715, 0.06323346495628357, 0.07824046909809113, 0.09324747323989868, 0.10825447738170624, 0.1232614815235138, 0.13826848566532135, 0.1532754898071289, 0.16828249394893646, 0.18328949809074402, 0.19829651713371277, 0.21330350637435913, 0.22831052541732788, 0.24331752955913544, 0.258324533700943, 0.27333155274391174, 0.2883385419845581, 0.30334556102752686, 0.3183525502681732, 0.33335956931114197, 0.34836655855178833]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 5.0, 6.0, 11.0, 11.0, 18.0, 18.0, 14.0, 29.0, 24.0, 43.0, 40.0, 43.0, 59.0, 63.0, 39.0, 58.0, 44.0, 45.0, 67.0, 52.0, 41.0, 43.0, 35.0, 38.0, 38.0, 29.0, 22.0, 15.0, 13.0, 16.0, 8.0, 1.0, 4.0, 7.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.16176283359527588, -0.15728718042373657, -0.15281152725219727, -0.14833585917949677, -0.14386020600795746, -0.13938455283641815, -0.13490888476371765, -0.13043323159217834, -0.12595757842063904, -0.12148192524909973, -0.11700626462697983, -0.11253060400485992, -0.10805495083332062, -0.10357929766178131, -0.09910363703966141, -0.0946279764175415, -0.0901523232460022, -0.08567667007446289, -0.08120100945234299, -0.07672534883022308, -0.07224969565868378, -0.06777404248714447, -0.06329838186502457, -0.05882272496819496, -0.054347068071365356, -0.04987141117453575, -0.045395754277706146, -0.04092009738087654, -0.036444440484046936, -0.03196878358721733, -0.027493126690387726, -0.02301746979355812, -0.018541812896728516, -0.01406615599989891, -0.009590499103069305, -0.0051148422062397, -0.0006391853094100952, 0.00383647158741951, 0.008312128484249115, 0.01278778538107872, 0.017263442277908325, 0.02173909917473793, 0.026214756071567535, 0.03069041296839714, 0.035166069865226746, 0.03964172676205635, 0.044117383658885956, 0.04859304055571556, 0.053068697452545166, 0.05754435434937477, 0.062020011246204376, 0.06649567186832428, 0.07097132503986359, 0.0754469782114029, 0.0799226388335228, 0.0843982994556427, 0.088873952627182, 0.09334960579872131, 0.09782526642084122, 0.10230092704296112, 0.10677658021450043, 0.11125223338603973, 0.11572789400815964, 0.12020355463027954, 0.12467920780181885]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 5.0, 12.0, 20.0, 49.0, 133.0, 355.0, 1129.0, 4424.0, 28807.0, 852978.0, 147007.0, 10483.0, 2203.0, 629.0, 178.0, 63.0, 28.0, 11.0, 5.0, 6.0, 5.0, 1.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34619140625, -0.33371734619140625, -0.3212432861328125, -0.30876922607421875, -0.296295166015625, -0.28382110595703125, -0.2713470458984375, -0.25887298583984375, -0.24639892578125, -0.23392486572265625, -0.2214508056640625, -0.20897674560546875, -0.196502685546875, -0.18402862548828125, -0.1715545654296875, -0.15908050537109375, -0.1466064453125, -0.13413238525390625, -0.1216583251953125, -0.10918426513671875, -0.096710205078125, -0.08423614501953125, -0.0717620849609375, -0.05928802490234375, -0.04681396484375, -0.03433990478515625, -0.0218658447265625, -0.00939178466796875, 0.003082275390625, 0.01555633544921875, 0.0280303955078125, 0.04050445556640625, 0.052978515625, 0.06545257568359375, 0.0779266357421875, 0.09040069580078125, 0.102874755859375, 0.11534881591796875, 0.1278228759765625, 0.14029693603515625, 0.15277099609375, 0.16524505615234375, 0.1777191162109375, 0.19019317626953125, 0.202667236328125, 0.21514129638671875, 0.2276153564453125, 0.24008941650390625, 0.2525634765625, 0.26503753662109375, 0.2775115966796875, 0.28998565673828125, 0.302459716796875, 0.31493377685546875, 0.3274078369140625, 0.33988189697265625, 0.35235595703125, 0.36483001708984375, 0.3773040771484375, 0.38977813720703125, 0.402252197265625, 0.41472625732421875, 0.4272003173828125, 0.43967437744140625, 0.4521484375]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 6.0, 7.0, 10.0, 12.0, 16.0, 13.0, 25.0, 28.0, 42.0, 49.0, 50.0, 52.0, 49.0, 51.0, 48.0, 67.0, 50.0, 58.0, 56.0, 51.0, 39.0, 39.0, 35.0, 33.0, 25.0, 26.0, 16.0, 12.0, 8.0, 10.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.34716796875, -0.3376007080078125, -0.328033447265625, -0.3184661865234375, -0.30889892578125, -0.2993316650390625, -0.289764404296875, -0.2801971435546875, -0.2706298828125, -0.2610626220703125, -0.251495361328125, -0.2419281005859375, -0.23236083984375, -0.2227935791015625, -0.213226318359375, -0.2036590576171875, -0.194091796875, -0.1845245361328125, -0.174957275390625, -0.1653900146484375, -0.15582275390625, -0.1462554931640625, -0.136688232421875, -0.1271209716796875, -0.1175537109375, -0.1079864501953125, -0.098419189453125, -0.0888519287109375, -0.07928466796875, -0.0697174072265625, -0.060150146484375, -0.0505828857421875, -0.041015625, -0.0314483642578125, -0.021881103515625, -0.0123138427734375, -0.00274658203125, 0.0068206787109375, 0.016387939453125, 0.0259552001953125, 0.0355224609375, 0.0450897216796875, 0.054656982421875, 0.0642242431640625, 0.07379150390625, 0.0833587646484375, 0.092926025390625, 0.1024932861328125, 0.112060546875, 0.1216278076171875, 0.131195068359375, 0.1407623291015625, 0.15032958984375, 0.1598968505859375, 0.169464111328125, 0.1790313720703125, 0.1885986328125, 0.1981658935546875, 0.207733154296875, 0.2173004150390625, 0.22686767578125, 0.2364349365234375, 0.246002197265625, 0.2555694580078125, 0.26513671875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 10.0, 7.0, 13.0, 15.0, 23.0, 35.0, 41.0, 71.0, 141.0, 252.0, 664.0, 2605.0, 19770.0, 857151.0, 157851.0, 7577.0, 1364.0, 440.0, 212.0, 103.0, 73.0, 34.0, 29.0, 17.0, 12.0, 10.0, 10.0, 5.0, 7.0, 3.0, 5.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.380615234375, -0.36864471435546875, -0.3566741943359375, -0.34470367431640625, -0.332733154296875, -0.32076263427734375, -0.3087921142578125, -0.29682159423828125, -0.28485107421875, -0.27288055419921875, -0.2609100341796875, -0.24893951416015625, -0.236968994140625, -0.22499847412109375, -0.2130279541015625, -0.20105743408203125, -0.1890869140625, -0.17711639404296875, -0.1651458740234375, -0.15317535400390625, -0.141204833984375, -0.12923431396484375, -0.1172637939453125, -0.10529327392578125, -0.09332275390625, -0.08135223388671875, -0.0693817138671875, -0.05741119384765625, -0.045440673828125, -0.03347015380859375, -0.0214996337890625, -0.00952911376953125, 0.00244140625, 0.01441192626953125, 0.0263824462890625, 0.03835296630859375, 0.050323486328125, 0.06229400634765625, 0.0742645263671875, 0.08623504638671875, 0.09820556640625, 0.11017608642578125, 0.1221466064453125, 0.13411712646484375, 0.146087646484375, 0.15805816650390625, 0.1700286865234375, 0.18199920654296875, 0.1939697265625, 0.20594024658203125, 0.2179107666015625, 0.22988128662109375, 0.241851806640625, 0.25382232666015625, 0.2657928466796875, 0.27776336669921875, 0.28973388671875, 0.30170440673828125, 0.3136749267578125, 0.32564544677734375, 0.337615966796875, 0.34958648681640625, 0.3615570068359375, 0.37352752685546875, 0.385498046875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 5.0, 6.0, 7.0, 13.0, 6.0, 15.0, 12.0, 17.0, 18.0, 16.0, 24.0, 21.0, 19.0, 34.0, 28.0, 45.0, 40.0, 47.0, 41.0, 52.0, 44.0, 37.0, 43.0, 52.0, 54.0, 32.0, 30.0, 43.0, 23.0, 30.0, 26.0, 22.0, 22.0, 17.0, 17.0, 8.0, 12.0, 8.0, 4.0, 3.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.283203125, -0.2745780944824219, -0.26595306396484375, -0.2573280334472656, -0.2487030029296875, -0.24007797241210938, -0.23145294189453125, -0.22282791137695312, -0.214202880859375, -0.20557785034179688, -0.19695281982421875, -0.18832778930664062, -0.1797027587890625, -0.17107772827148438, -0.16245269775390625, -0.15382766723632812, -0.14520263671875, -0.13657760620117188, -0.12795257568359375, -0.11932754516601562, -0.1107025146484375, -0.10207748413085938, -0.09345245361328125, -0.08482742309570312, -0.076202392578125, -0.06757736206054688, -0.05895233154296875, -0.050327301025390625, -0.0417022705078125, -0.033077239990234375, -0.02445220947265625, -0.015827178955078125, -0.0072021484375, 0.001422882080078125, 0.01004791259765625, 0.018672943115234375, 0.0272979736328125, 0.035923004150390625, 0.04454803466796875, 0.053173065185546875, 0.061798095703125, 0.07042312622070312, 0.07904815673828125, 0.08767318725585938, 0.0962982177734375, 0.10492324829101562, 0.11354827880859375, 0.12217330932617188, 0.13079833984375, 0.13942337036132812, 0.14804840087890625, 0.15667343139648438, 0.1652984619140625, 0.17392349243164062, 0.18254852294921875, 0.19117355346679688, 0.199798583984375, 0.20842361450195312, 0.21704864501953125, 0.22567367553710938, 0.2342987060546875, 0.24292373657226562, 0.25154876708984375, 0.2601737976074219, 0.268798828125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 5.0, 0.0, 6.0, 5.0, 8.0, 17.0, 24.0, 44.0, 70.0, 156.0, 389.0, 1668.0, 13327.0, 864536.0, 161288.0, 5514.0, 910.0, 277.0, 121.0, 56.0, 43.0, 20.0, 25.0, 13.0, 7.0, 7.0, 3.0, 5.0, 4.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1549072265625, -0.1503276824951172, -0.14574813842773438, -0.14116859436035156, -0.13658905029296875, -0.13200950622558594, -0.12742996215820312, -0.12285041809082031, -0.1182708740234375, -0.11369132995605469, -0.10911178588867188, -0.10453224182128906, -0.09995269775390625, -0.09537315368652344, -0.09079360961914062, -0.08621406555175781, -0.081634521484375, -0.07705497741699219, -0.07247543334960938, -0.06789588928222656, -0.06331634521484375, -0.05873680114746094, -0.054157257080078125, -0.04957771301269531, -0.0449981689453125, -0.04041862487792969, -0.035839080810546875, -0.03125953674316406, -0.02667999267578125, -0.022100448608398438, -0.017520904541015625, -0.012941360473632812, -0.00836181640625, -0.0037822723388671875, 0.000797271728515625, 0.0053768157958984375, 0.00995635986328125, 0.014535903930664062, 0.019115447998046875, 0.023694992065429688, 0.0282745361328125, 0.03285408020019531, 0.037433624267578125, 0.04201316833496094, 0.04659271240234375, 0.05117225646972656, 0.055751800537109375, 0.06033134460449219, 0.064910888671875, 0.06949043273925781, 0.07406997680664062, 0.07864952087402344, 0.08322906494140625, 0.08780860900878906, 0.09238815307617188, 0.09696769714355469, 0.1015472412109375, 0.10612678527832031, 0.11070632934570312, 0.11528587341308594, 0.11986541748046875, 0.12444496154785156, 0.12902450561523438, 0.1336040496826172, 0.13818359375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 14.0, 8.0, 9.0, 29.0, 39.0, 86.0, 182.0, 240.0, 171.0, 94.0, 45.0, 37.0, 11.0, 9.0, 9.0, 6.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6450881958007812e-05, -1.5875324606895447e-05, -1.529976725578308e-05, -1.4724209904670715e-05, -1.414865255355835e-05, -1.3573095202445984e-05, -1.2997537851333618e-05, -1.2421980500221252e-05, -1.1846423149108887e-05, -1.1270865797996521e-05, -1.0695308446884155e-05, -1.011975109577179e-05, -9.544193744659424e-06, -8.968636393547058e-06, -8.393079042434692e-06, -7.817521691322327e-06, -7.241964340209961e-06, -6.666406989097595e-06, -6.0908496379852295e-06, -5.515292286872864e-06, -4.939734935760498e-06, -4.364177584648132e-06, -3.7886202335357666e-06, -3.213062882423401e-06, -2.637505531311035e-06, -2.0619481801986694e-06, -1.4863908290863037e-06, -9.10833477973938e-07, -3.3527612686157227e-07, 2.4028122425079346e-07, 8.158385753631592e-07, 1.391395926475525e-06, 1.9669532775878906e-06, 2.5425106287002563e-06, 3.118067979812622e-06, 3.693625330924988e-06, 4.2691826820373535e-06, 4.844740033149719e-06, 5.420297384262085e-06, 5.995854735374451e-06, 6.571412086486816e-06, 7.146969437599182e-06, 7.722526788711548e-06, 8.298084139823914e-06, 8.87364149093628e-06, 9.449198842048645e-06, 1.002475619316101e-05, 1.0600313544273376e-05, 1.1175870895385742e-05, 1.1751428246498108e-05, 1.2326985597610474e-05, 1.290254294872284e-05, 1.3478100299835205e-05, 1.405365765094757e-05, 1.4629215002059937e-05, 1.5204772353172302e-05, 1.5780329704284668e-05, 1.6355887055397034e-05, 1.69314444065094e-05, 1.7507001757621765e-05, 1.808255910873413e-05, 1.8658116459846497e-05, 1.9233673810958862e-05, 1.9809231162071228e-05, 2.0384788513183594e-05]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 11.0, 12.0, 12.0, 28.0, 43.0, 79.0, 188.0, 493.0, 1999.0, 18207.0, 984630.0, 38874.0, 2808.0, 678.0, 257.0, 100.0, 53.0, 26.0, 17.0, 10.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.186279296875, -0.18056488037109375, -0.1748504638671875, -0.16913604736328125, -0.163421630859375, -0.15770721435546875, -0.1519927978515625, -0.14627838134765625, -0.14056396484375, -0.13484954833984375, -0.1291351318359375, -0.12342071533203125, -0.117706298828125, -0.11199188232421875, -0.1062774658203125, -0.10056304931640625, -0.0948486328125, -0.08913421630859375, -0.0834197998046875, -0.07770538330078125, -0.071990966796875, -0.06627655029296875, -0.0605621337890625, -0.05484771728515625, -0.04913330078125, -0.04341888427734375, -0.0377044677734375, -0.03199005126953125, -0.026275634765625, -0.02056121826171875, -0.0148468017578125, -0.00913238525390625, -0.00341796875, 0.00229644775390625, 0.0080108642578125, 0.01372528076171875, 0.019439697265625, 0.02515411376953125, 0.0308685302734375, 0.03658294677734375, 0.04229736328125, 0.04801177978515625, 0.0537261962890625, 0.05944061279296875, 0.065155029296875, 0.07086944580078125, 0.0765838623046875, 0.08229827880859375, 0.0880126953125, 0.09372711181640625, 0.0994415283203125, 0.10515594482421875, 0.110870361328125, 0.11658477783203125, 0.1222991943359375, 0.12801361083984375, 0.13372802734375, 0.13944244384765625, 0.1451568603515625, 0.15087127685546875, 0.156585693359375, 0.16230010986328125, 0.1680145263671875, 0.17372894287109375, 0.179443359375]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 7.0, 25.0, 15.0, 28.0, 32.0, 72.0, 75.0, 127.0, 145.0, 150.0, 97.0, 74.0, 40.0, 35.0, 15.0, 15.0, 11.0, 10.0, 10.0, 0.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.033843994140625, -0.03273963928222656, -0.031635284423828125, -0.030530929565429688, -0.02942657470703125, -0.028322219848632812, -0.027217864990234375, -0.026113510131835938, -0.0250091552734375, -0.023904800415039062, -0.022800445556640625, -0.021696090698242188, -0.02059173583984375, -0.019487380981445312, -0.018383026123046875, -0.017278671264648438, -0.01617431640625, -0.015069961547851562, -0.013965606689453125, -0.012861251831054688, -0.01175689697265625, -0.010652542114257812, -0.009548187255859375, -0.008443832397460938, -0.0073394775390625, -0.0062351226806640625, -0.005130767822265625, -0.0040264129638671875, -0.00292205810546875, -0.0018177032470703125, -0.000713348388671875, 0.0003910064697265625, 0.001495361328125, 0.0025997161865234375, 0.003704071044921875, 0.0048084259033203125, 0.00591278076171875, 0.0070171356201171875, 0.008121490478515625, 0.009225845336914062, 0.0103302001953125, 0.011434555053710938, 0.012538909912109375, 0.013643264770507812, 0.01474761962890625, 0.015851974487304688, 0.016956329345703125, 0.018060684204101562, 0.0191650390625, 0.020269393920898438, 0.021373748779296875, 0.022478103637695312, 0.02358245849609375, 0.024686813354492188, 0.025791168212890625, 0.026895523071289062, 0.0279998779296875, 0.029104232788085938, 0.030208587646484375, 0.03131294250488281, 0.03241729736328125, 0.03352165222167969, 0.034626007080078125, 0.03573036193847656, 0.036834716796875]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 13.0, 26.0, 48.0, 185.0, 362.0, 263.0, 58.0, 31.0, 15.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.0096774101257324, -1.9699279069900513, -1.9301785230636597, -1.8904290199279785, -1.850679636001587, -1.8109301328659058, -1.7711807489395142, -1.731431245803833, -1.6916818618774414, -1.6519323587417603, -1.6121829748153687, -1.5724334716796875, -1.532684087753296, -1.4929345846176147, -1.4531852006912231, -1.413435697555542, -1.3736863136291504, -1.3339368104934692, -1.2941874265670776, -1.2544379234313965, -1.2146885395050049, -1.1749390363693237, -1.1351896524429321, -1.095440149307251, -1.0556906461715698, -1.0159411430358887, -0.9761917591094971, -0.9364423155784607, -0.8966928720474243, -0.8569434285163879, -0.8171939849853516, -0.7774444818496704, -0.7376950979232788, -0.6979456543922424, -0.658196210861206, -0.6184467673301697, -0.5786973237991333, -0.5389478802680969, -0.49919840693473816, -0.4594489634037018, -0.4196995198726654, -0.37995007634162903, -0.34020063281059265, -0.3004511594772339, -0.2607017159461975, -0.22095228731632233, -0.18120282888412476, -0.14145338535308838, -0.101703941822052, -0.06195449456572533, -0.02220504730939865, 0.017544403672218323, 0.0572938472032547, 0.09704329073429108, 0.13679274916648865, 0.17654219269752502, 0.2162916362285614, 0.2560410797595978, 0.29579052329063416, 0.3355399966239929, 0.3752894401550293, 0.4150388836860657, 0.45478832721710205, 0.4945377707481384, 0.5342872142791748]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 6.0, 3.0, 3.0, 5.0, 9.0, 7.0, 11.0, 16.0, 23.0, 14.0, 16.0, 27.0, 35.0, 45.0, 43.0, 53.0, 43.0, 37.0, 54.0, 53.0, 46.0, 50.0, 47.0, 46.0, 45.0, 44.0, 46.0, 30.0, 26.0, 26.0, 20.0, 17.0, 19.0, 6.0, 8.0, 9.0, 11.0, 3.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.589144229888916, -0.5728532075881958, -0.5565621852874756, -0.5402711629867554, -0.5239801406860352, -0.5076891183853149, -0.49139806628227234, -0.4751070439815521, -0.4588159918785095, -0.4425249695777893, -0.4262339472770691, -0.4099429249763489, -0.3936518728733063, -0.37736085057258606, -0.36106982827186584, -0.34477880597114563, -0.3284877836704254, -0.3121967613697052, -0.295905739068985, -0.2796146869659424, -0.26332366466522217, -0.24703264236450195, -0.23074162006378174, -0.21445059776306152, -0.19815956056118011, -0.1818685382604599, -0.1655775010585785, -0.14928647875785828, -0.13299545645713806, -0.11670441925525665, -0.10041339695453644, -0.08412236720323563, -0.0678313672542572, -0.05154033750295639, -0.03524931147694588, -0.018958285450935364, -0.002667255699634552, 0.01362377405166626, 0.029914796352386475, 0.046205826103687286, 0.0624968558549881, 0.07878788560628891, 0.09507891535758972, 0.11136993765830994, 0.12766095995903015, 0.14395199716091156, 0.16024301946163177, 0.17653405666351318, 0.1928250789642334, 0.2091161012649536, 0.22540713846683502, 0.24169816076755524, 0.25798919796943665, 0.27428022027015686, 0.2905712425708771, 0.3068622648715973, 0.3231533169746399, 0.3394443392753601, 0.3557353615760803, 0.37202638387680054, 0.38831743597984314, 0.40460845828056335, 0.42089948058128357, 0.4371905028820038, 0.453481525182724]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 2.0, 8.0, 13.0, 11.0, 16.0, 18.0, 30.0, 40.0, 65.0, 95.0, 149.0, 294.0, 591.0, 1317.0, 3285.0, 12638.0, 258103.0, 3715774.0, 183419.0, 12653.0, 3276.0, 1239.0, 538.0, 280.0, 139.0, 91.0, 54.0, 44.0, 27.0, 20.0, 12.0, 11.0, 6.0, 6.0, 8.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3994140625, -0.3867225646972656, -0.37403106689453125, -0.3613395690917969, -0.3486480712890625, -0.3359565734863281, -0.32326507568359375, -0.3105735778808594, -0.297882080078125, -0.2851905822753906, -0.27249908447265625, -0.2598075866699219, -0.2471160888671875, -0.23442459106445312, -0.22173309326171875, -0.20904159545898438, -0.19635009765625, -0.18365859985351562, -0.17096710205078125, -0.15827560424804688, -0.1455841064453125, -0.13289260864257812, -0.12020111083984375, -0.10750961303710938, -0.094818115234375, -0.08212661743164062, -0.06943511962890625, -0.056743621826171875, -0.0440521240234375, -0.031360626220703125, -0.01866912841796875, -0.005977630615234375, 0.0067138671875, 0.019405364990234375, 0.03209686279296875, 0.044788360595703125, 0.0574798583984375, 0.07017135620117188, 0.08286285400390625, 0.09555435180664062, 0.108245849609375, 0.12093734741210938, 0.13362884521484375, 0.14632034301757812, 0.1590118408203125, 0.17170333862304688, 0.18439483642578125, 0.19708633422851562, 0.20977783203125, 0.22246932983398438, 0.23516082763671875, 0.24785232543945312, 0.2605438232421875, 0.2732353210449219, 0.28592681884765625, 0.2986183166503906, 0.311309814453125, 0.3240013122558594, 0.33669281005859375, 0.3493843078613281, 0.3620758056640625, 0.3747673034667969, 0.38745880126953125, 0.4001502990722656, 0.412841796875]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 8.0, 6.0, 9.0, 10.0, 15.0, 19.0, 27.0, 44.0, 59.0, 50.0, 61.0, 60.0, 77.0, 76.0, 62.0, 67.0, 56.0, 50.0, 43.0, 36.0, 38.0, 34.0, 23.0, 21.0, 20.0, 12.0, 8.0, 5.0, 2.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2509765625, -0.2445354461669922, -0.23809432983398438, -0.23165321350097656, -0.22521209716796875, -0.21877098083496094, -0.21232986450195312, -0.2058887481689453, -0.1994476318359375, -0.1930065155029297, -0.18656539916992188, -0.18012428283691406, -0.17368316650390625, -0.16724205017089844, -0.16080093383789062, -0.1543598175048828, -0.147918701171875, -0.1414775848388672, -0.13503646850585938, -0.12859535217285156, -0.12215423583984375, -0.11571311950683594, -0.10927200317382812, -0.10283088684082031, -0.0963897705078125, -0.08994865417480469, -0.08350753784179688, -0.07706642150878906, -0.07062530517578125, -0.06418418884277344, -0.057743072509765625, -0.05130195617675781, -0.04486083984375, -0.03841972351074219, -0.031978607177734375, -0.025537490844726562, -0.01909637451171875, -0.012655258178710938, -0.006214141845703125, 0.0002269744873046875, 0.0066680908203125, 0.013109207153320312, 0.019550323486328125, 0.025991439819335938, 0.03243255615234375, 0.03887367248535156, 0.045314788818359375, 0.05175590515136719, 0.058197021484375, 0.06463813781738281, 0.07107925415039062, 0.07752037048339844, 0.08396148681640625, 0.09040260314941406, 0.09684371948242188, 0.10328483581542969, 0.1097259521484375, 0.11616706848144531, 0.12260818481445312, 0.12904930114746094, 0.13549041748046875, 0.14193153381347656, 0.14837265014648438, 0.1548137664794922, 0.1612548828125]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 6.0, 11.0, 8.0, 17.0, 19.0, 27.0, 35.0, 73.0, 92.0, 176.0, 315.0, 795.0, 2139.0, 8750.0, 81714.0, 3982344.0, 103343.0, 10134.0, 2479.0, 911.0, 355.0, 200.0, 107.0, 59.0, 46.0, 30.0, 17.0, 13.0, 12.0, 8.0, 6.0, 2.0, 7.0, 3.0, 6.0, 4.0, 2.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.335693359375, -0.3220100402832031, -0.30832672119140625, -0.2946434020996094, -0.2809600830078125, -0.2672767639160156, -0.25359344482421875, -0.23991012573242188, -0.226226806640625, -0.21254348754882812, -0.19886016845703125, -0.18517684936523438, -0.1714935302734375, -0.15781021118164062, -0.14412689208984375, -0.13044357299804688, -0.11676025390625, -0.10307693481445312, -0.08939361572265625, -0.07571029663085938, -0.0620269775390625, -0.048343658447265625, -0.03466033935546875, -0.020977020263671875, -0.007293701171875, 0.006389617919921875, 0.02007293701171875, 0.033756256103515625, 0.0474395751953125, 0.061122894287109375, 0.07480621337890625, 0.08848953247070312, 0.1021728515625, 0.11585617065429688, 0.12953948974609375, 0.14322280883789062, 0.1569061279296875, 0.17058944702148438, 0.18427276611328125, 0.19795608520507812, 0.211639404296875, 0.22532272338867188, 0.23900604248046875, 0.2526893615722656, 0.2663726806640625, 0.2800559997558594, 0.29373931884765625, 0.3074226379394531, 0.32110595703125, 0.3347892761230469, 0.34847259521484375, 0.3621559143066406, 0.3758392333984375, 0.3895225524902344, 0.40320587158203125, 0.4168891906738281, 0.430572509765625, 0.4442558288574219, 0.45793914794921875, 0.4716224670410156, 0.4853057861328125, 0.4989891052246094, 0.5126724243164062, 0.5263557434082031, 0.5400390625]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 10.0, 12.0, 9.0, 16.0, 17.0, 32.0, 43.0, 73.0, 97.0, 252.0, 548.0, 1051.0, 944.0, 467.0, 208.0, 110.0, 41.0, 44.0, 18.0, 16.0, 13.0, 11.0, 6.0, 5.0, 6.0, 2.0, 9.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.10394287109375, -0.1013336181640625, -0.098724365234375, -0.0961151123046875, -0.093505859375, -0.0908966064453125, -0.088287353515625, -0.0856781005859375, -0.08306884765625, -0.0804595947265625, -0.077850341796875, -0.0752410888671875, -0.0726318359375, -0.0700225830078125, -0.067413330078125, -0.0648040771484375, -0.06219482421875, -0.0595855712890625, -0.056976318359375, -0.0543670654296875, -0.0517578125, -0.0491485595703125, -0.046539306640625, -0.0439300537109375, -0.04132080078125, -0.0387115478515625, -0.036102294921875, -0.0334930419921875, -0.0308837890625, -0.0282745361328125, -0.025665283203125, -0.0230560302734375, -0.02044677734375, -0.0178375244140625, -0.015228271484375, -0.0126190185546875, -0.010009765625, -0.0074005126953125, -0.004791259765625, -0.0021820068359375, 0.00042724609375, 0.0030364990234375, 0.005645751953125, 0.0082550048828125, 0.0108642578125, 0.0134735107421875, 0.016082763671875, 0.0186920166015625, 0.02130126953125, 0.0239105224609375, 0.026519775390625, 0.0291290283203125, 0.03173828125, 0.0343475341796875, 0.036956787109375, 0.0395660400390625, 0.04217529296875, 0.0447845458984375, 0.047393798828125, 0.0500030517578125, 0.0526123046875, 0.0552215576171875, 0.057830810546875, 0.0604400634765625, 0.06304931640625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 6.0, 15.0, 6.0, 20.0, 29.0, 44.0, 71.0, 108.0, 153.0, 163.0, 133.0, 82.0, 58.0, 36.0, 23.0, 14.0, 13.0, 9.0, 5.0, 0.0, 4.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34517422318458557, -0.3340901732444763, -0.32300612330436707, -0.3119220733642578, -0.30083802342414856, -0.2897539734840393, -0.27866995334625244, -0.2675859034061432, -0.25650185346603394, -0.24541780352592468, -0.23433375358581543, -0.22324970364570618, -0.21216566860675812, -0.20108161866664886, -0.1899975687265396, -0.17891353368759155, -0.1678294688463211, -0.15674541890621185, -0.1456613689661026, -0.13457733392715454, -0.12349328398704529, -0.11240923404693604, -0.10132518410682678, -0.09024114161729813, -0.07915709167718887, -0.06807304173707962, -0.056988999247550964, -0.04590494930744171, -0.03482090309262276, -0.023736856877803802, -0.01265280693769455, -0.0015687644481658936, 0.00951528549194336, 0.020599331706762314, 0.03168337792158127, 0.04276742786169052, 0.053851474076509476, 0.06493552029132843, 0.07601957023143768, 0.08710361272096634, 0.09818766266107559, 0.10927171260118484, 0.1203557550907135, 0.13143980503082275, 0.142523854970932, 0.15360790491104126, 0.1646919548511505, 0.17577598989009857, 0.18686003983020782, 0.19794408977031708, 0.20902813971042633, 0.2201121747493744, 0.23119622468948364, 0.2422802746295929, 0.25336432456970215, 0.2644483745098114, 0.27553242444992065, 0.2866164743900299, 0.29770052433013916, 0.3087845742702484, 0.31986862421035767, 0.33095264434814453, 0.34203672409057617, 0.35312074422836304, 0.3642047941684723]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 6.0, 4.0, 5.0, 6.0, 14.0, 13.0, 19.0, 15.0, 21.0, 30.0, 29.0, 28.0, 38.0, 43.0, 43.0, 50.0, 49.0, 49.0, 63.0, 53.0, 36.0, 42.0, 44.0, 38.0, 38.0, 37.0, 49.0, 22.0, 21.0, 17.0, 15.0, 15.0, 13.0, 9.0, 8.0, 7.0, 3.0, 2.0, 2.0, 5.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13359737396240234, -0.12859424948692322, -0.12359113991260529, -0.11858802288770676, -0.11358490586280823, -0.1085817888379097, -0.10357867181301117, -0.09857554733753204, -0.09357243776321411, -0.08856932073831558, -0.08356620371341705, -0.07856308668851852, -0.07355996966362, -0.06855685263872147, -0.06355373561382294, -0.05855061486363411, -0.05354749411344528, -0.04854437708854675, -0.043541260063648224, -0.038538143038749695, -0.033535026013851166, -0.028531907126307487, -0.02352878823876381, -0.01852567121386528, -0.013522554188966751, -0.008519437164068222, -0.0035163192078471184, 0.0014867987483739853, 0.006489915773272514, 0.011493032798171043, 0.01649615168571472, 0.02149926871061325, 0.02650238573551178, 0.03150550276041031, 0.03650861978530884, 0.04151173681020737, 0.046514853835105896, 0.051517970860004425, 0.05652109161019325, 0.06152420863509178, 0.06652732193470001, 0.07153043895959854, 0.07653355598449707, 0.0815366730093956, 0.08653979003429413, 0.09154290705919266, 0.09654602408409119, 0.10154914855957031, 0.10655226558446884, 0.11155538260936737, 0.1165584996342659, 0.12156161665916443, 0.12656474113464355, 0.1315678507089615, 0.1365709751844406, 0.14157408475875854, 0.14657720923423767, 0.1515803337097168, 0.15658344328403473, 0.16158656775951385, 0.1665896773338318, 0.1715928018093109, 0.17659591138362885, 0.18159903585910797, 0.1866021454334259]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 2.0, 3.0, 3.0, 9.0, 16.0, 26.0, 16.0, 32.0, 54.0, 72.0, 121.0, 158.0, 280.0, 370.0, 577.0, 960.0, 1505.0, 2486.0, 4158.0, 7141.0, 12684.0, 23665.0, 45449.0, 92795.0, 187339.0, 276092.0, 193389.0, 95801.0, 47411.0, 24291.0, 13069.0, 7334.0, 4352.0, 2562.0, 1590.0, 948.0, 622.0, 379.0, 274.0, 177.0, 123.0, 80.0, 49.0, 31.0, 25.0, 18.0, 6.0, 6.0, 2.0, 7.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.0172119140625, -0.016713380813598633, -0.016214847564697266, -0.0157163143157959, -0.015217781066894531, -0.014719247817993164, -0.014220714569091797, -0.01372218132019043, -0.013223648071289062, -0.012725114822387695, -0.012226581573486328, -0.011728048324584961, -0.011229515075683594, -0.010730981826782227, -0.01023244857788086, -0.009733915328979492, -0.009235382080078125, -0.008736848831176758, -0.00823831558227539, -0.0077397823333740234, -0.007241249084472656, -0.006742715835571289, -0.006244182586669922, -0.005745649337768555, -0.0052471160888671875, -0.00474858283996582, -0.004250049591064453, -0.003751516342163086, -0.0032529830932617188, -0.0027544498443603516, -0.0022559165954589844, -0.0017573833465576172, -0.00125885009765625, -0.0007603168487548828, -0.0002617835998535156, 0.00023674964904785156, 0.0007352828979492188, 0.001233816146850586, 0.0017323493957519531, 0.0022308826446533203, 0.0027294158935546875, 0.0032279491424560547, 0.003726482391357422, 0.004225015640258789, 0.004723548889160156, 0.0052220821380615234, 0.005720615386962891, 0.006219148635864258, 0.006717681884765625, 0.007216215133666992, 0.007714748382568359, 0.008213281631469727, 0.008711814880371094, 0.009210348129272461, 0.009708881378173828, 0.010207414627075195, 0.010705947875976562, 0.01120448112487793, 0.011703014373779297, 0.012201547622680664, 0.012700080871582031, 0.013198614120483398, 0.013697147369384766, 0.014195680618286133, 0.0146942138671875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 1.0, 3.0, 8.0, 8.0, 15.0, 14.0, 19.0, 17.0, 34.0, 23.0, 39.0, 42.0, 47.0, 67.0, 47.0, 63.0, 64.0, 63.0, 40.0, 55.0, 53.0, 46.0, 39.0, 38.0, 40.0, 28.0, 21.0, 13.0, 15.0, 7.0, 5.0, 7.0, 5.0, 4.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1241455078125, -0.12025260925292969, -0.11635971069335938, -0.11246681213378906, -0.10857391357421875, -0.10468101501464844, -0.10078811645507812, -0.09689521789550781, -0.0930023193359375, -0.08910942077636719, -0.08521652221679688, -0.08132362365722656, -0.07743072509765625, -0.07353782653808594, -0.06964492797851562, -0.06575202941894531, -0.061859130859375, -0.05796623229980469, -0.054073333740234375, -0.05018043518066406, -0.04628753662109375, -0.04239463806152344, -0.038501739501953125, -0.03460884094238281, -0.0307159423828125, -0.026823043823242188, -0.022930145263671875, -0.019037246704101562, -0.01514434814453125, -0.011251449584960938, -0.007358551025390625, -0.0034656524658203125, 0.00042724609375, 0.0043201446533203125, 0.008213043212890625, 0.012105941772460938, 0.01599884033203125, 0.019891738891601562, 0.023784637451171875, 0.027677536010742188, 0.0315704345703125, 0.03546333312988281, 0.039356231689453125, 0.04324913024902344, 0.04714202880859375, 0.05103492736816406, 0.054927825927734375, 0.05882072448730469, 0.062713623046875, 0.06660652160644531, 0.07049942016601562, 0.07439231872558594, 0.07828521728515625, 0.08217811584472656, 0.08607101440429688, 0.08996391296386719, 0.0938568115234375, 0.09774971008300781, 0.10164260864257812, 0.10553550720214844, 0.10942840576171875, 0.11332130432128906, 0.11721420288085938, 0.12110710144042969, 0.125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 9.0, 8.0, 12.0, 39.0, 59.0, 119.0, 295.0, 802.0, 2382.0, 9289.0, 48791.0, 370933.0, 525127.0, 72899.0, 12815.0, 3135.0, 1064.0, 406.0, 171.0, 88.0, 34.0, 19.0, 11.0, 6.0, 8.0, 10.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.048065185546875, -0.046613216400146484, -0.04516124725341797, -0.04370927810668945, -0.04225730895996094, -0.04080533981323242, -0.039353370666503906, -0.03790140151977539, -0.036449432373046875, -0.03499746322631836, -0.033545494079589844, -0.03209352493286133, -0.030641555786132812, -0.029189586639404297, -0.02773761749267578, -0.026285648345947266, -0.02483367919921875, -0.023381710052490234, -0.02192974090576172, -0.020477771759033203, -0.019025802612304688, -0.017573833465576172, -0.016121864318847656, -0.01466989517211914, -0.013217926025390625, -0.01176595687866211, -0.010313987731933594, -0.008862018585205078, -0.0074100494384765625, -0.005958080291748047, -0.004506111145019531, -0.0030541419982910156, -0.0016021728515625, -0.00015020370483398438, 0.0013017654418945312, 0.002753734588623047, 0.0042057037353515625, 0.005657672882080078, 0.007109642028808594, 0.00856161117553711, 0.010013580322265625, 0.01146554946899414, 0.012917518615722656, 0.014369487762451172, 0.015821456909179688, 0.017273426055908203, 0.01872539520263672, 0.020177364349365234, 0.02162933349609375, 0.023081302642822266, 0.02453327178955078, 0.025985240936279297, 0.027437210083007812, 0.028889179229736328, 0.030341148376464844, 0.03179311752319336, 0.033245086669921875, 0.03469705581665039, 0.036149024963378906, 0.03760099411010742, 0.03905296325683594, 0.04050493240356445, 0.04195690155029297, 0.043408870697021484, 0.04486083984375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 5.0, 4.0, 3.0, 3.0, 7.0, 1.0, 8.0, 5.0, 10.0, 14.0, 13.0, 22.0, 20.0, 25.0, 27.0, 23.0, 36.0, 43.0, 38.0, 40.0, 65.0, 46.0, 60.0, 47.0, 54.0, 44.0, 54.0, 31.0, 45.0, 35.0, 36.0, 29.0, 22.0, 21.0, 16.0, 22.0, 5.0, 6.0, 8.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1990966796875, -0.19237327575683594, -0.18564987182617188, -0.1789264678955078, -0.17220306396484375, -0.1654796600341797, -0.15875625610351562, -0.15203285217285156, -0.1453094482421875, -0.13858604431152344, -0.13186264038085938, -0.1251392364501953, -0.11841583251953125, -0.11169242858886719, -0.10496902465820312, -0.09824562072753906, -0.091522216796875, -0.08479881286621094, -0.07807540893554688, -0.07135200500488281, -0.06462860107421875, -0.05790519714355469, -0.051181793212890625, -0.04445838928222656, -0.0377349853515625, -0.031011581420898438, -0.024288177490234375, -0.017564773559570312, -0.01084136962890625, -0.0041179656982421875, 0.002605438232421875, 0.009328842163085938, 0.01605224609375, 0.022775650024414062, 0.029499053955078125, 0.03622245788574219, 0.04294586181640625, 0.04966926574707031, 0.056392669677734375, 0.06311607360839844, 0.0698394775390625, 0.07656288146972656, 0.08328628540039062, 0.09000968933105469, 0.09673309326171875, 0.10345649719238281, 0.11017990112304688, 0.11690330505371094, 0.123626708984375, 0.13035011291503906, 0.13707351684570312, 0.1437969207763672, 0.15052032470703125, 0.1572437286376953, 0.16396713256835938, 0.17069053649902344, 0.1774139404296875, 0.18413734436035156, 0.19086074829101562, 0.1975841522216797, 0.20430755615234375, 0.2110309600830078, 0.21775436401367188, 0.22447776794433594, 0.231201171875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 4.0, 5.0, 8.0, 21.0, 13.0, 26.0, 44.0, 55.0, 90.0, 124.0, 225.0, 347.0, 592.0, 1171.0, 2365.0, 5748.0, 16824.0, 70059.0, 393476.0, 446017.0, 80936.0, 18908.0, 6106.0, 2525.0, 1237.0, 642.0, 345.0, 228.0, 132.0, 80.0, 68.0, 40.0, 18.0, 23.0, 16.0, 10.0, 10.0, 5.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.01029205322265625, -0.009960532188415527, -0.009629011154174805, -0.009297490119934082, -0.00896596908569336, -0.008634448051452637, -0.008302927017211914, -0.007971405982971191, -0.007639884948730469, -0.007308363914489746, -0.0069768428802490234, -0.006645321846008301, -0.006313800811767578, -0.0059822797775268555, -0.005650758743286133, -0.00531923770904541, -0.0049877166748046875, -0.004656195640563965, -0.004324674606323242, -0.0039931535720825195, -0.003661632537841797, -0.0033301115036010742, -0.0029985904693603516, -0.002667069435119629, -0.0023355484008789062, -0.0020040273666381836, -0.001672506332397461, -0.0013409852981567383, -0.0010094642639160156, -0.000677943229675293, -0.0003464221954345703, -1.4901161193847656e-05, 0.000316619873046875, 0.0006481409072875977, 0.0009796619415283203, 0.001311182975769043, 0.0016427040100097656, 0.0019742250442504883, 0.002305746078491211, 0.0026372671127319336, 0.0029687881469726562, 0.003300309181213379, 0.0036318302154541016, 0.003963351249694824, 0.004294872283935547, 0.0046263933181762695, 0.004957914352416992, 0.005289435386657715, 0.0056209564208984375, 0.00595247745513916, 0.006283998489379883, 0.0066155195236206055, 0.006947040557861328, 0.007278561592102051, 0.0076100826263427734, 0.007941603660583496, 0.008273124694824219, 0.008604645729064941, 0.008936166763305664, 0.009267687797546387, 0.00959920883178711, 0.009930729866027832, 0.010262250900268555, 0.010593771934509277, 0.01092529296875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 4.0, 3.0, 10.0, 4.0, 7.0, 6.0, 13.0, 7.0, 23.0, 26.0, 23.0, 55.0, 37.0, 58.0, 61.0, 80.0, 83.0, 48.0, 73.0, 77.0, 61.0, 52.0, 52.0, 43.0, 17.0, 25.0, 19.0, 11.0, 11.0, 7.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.635883331298828e-06, -3.4654513001441956e-06, -3.295019268989563e-06, -3.1245872378349304e-06, -2.954155206680298e-06, -2.7837231755256653e-06, -2.6132911443710327e-06, -2.4428591132164e-06, -2.2724270820617676e-06, -2.101995050907135e-06, -1.9315630197525024e-06, -1.7611309885978699e-06, -1.5906989574432373e-06, -1.4202669262886047e-06, -1.2498348951339722e-06, -1.0794028639793396e-06, -9.08970832824707e-07, -7.385388016700745e-07, -5.681067705154419e-07, -3.976747393608093e-07, -2.2724270820617676e-07, -5.681067705154419e-08, 1.1362135410308838e-07, 2.8405338525772095e-07, 4.544854164123535e-07, 6.249174475669861e-07, 7.953494787216187e-07, 9.657815098762512e-07, 1.1362135410308838e-06, 1.3066455721855164e-06, 1.477077603340149e-06, 1.6475096344947815e-06, 1.817941665649414e-06, 1.9883736968040466e-06, 2.158805727958679e-06, 2.3292377591133118e-06, 2.4996697902679443e-06, 2.670101821422577e-06, 2.8405338525772095e-06, 3.010965883731842e-06, 3.1813979148864746e-06, 3.351829946041107e-06, 3.5222619771957397e-06, 3.6926940083503723e-06, 3.863126039505005e-06, 4.0335580706596375e-06, 4.20399010181427e-06, 4.374422132968903e-06, 4.544854164123535e-06, 4.715286195278168e-06, 4.8857182264328e-06, 5.056150257587433e-06, 5.2265822887420654e-06, 5.397014319896698e-06, 5.5674463510513306e-06, 5.737878382205963e-06, 5.908310413360596e-06, 6.078742444515228e-06, 6.249174475669861e-06, 6.419606506824493e-06, 6.590038537979126e-06, 6.7604705691337585e-06, 6.930902600288391e-06, 7.101334631443024e-06, 7.271766662597656e-06]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 6.0, 7.0, 2.0, 8.0, 7.0, 15.0, 15.0, 25.0, 33.0, 35.0, 57.0, 80.0, 109.0, 178.0, 234.0, 445.0, 826.0, 1583.0, 4112.0, 11775.0, 40542.0, 171836.0, 504253.0, 233566.0, 53747.0, 15336.0, 5321.0, 2059.0, 934.0, 551.0, 304.0, 172.0, 129.0, 72.0, 38.0, 36.0, 33.0, 17.0, 17.0, 8.0, 11.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00911712646484375, -0.00882863998413086, -0.008540153503417969, -0.008251667022705078, -0.007963180541992188, -0.007674694061279297, -0.007386207580566406, -0.007097721099853516, -0.006809234619140625, -0.006520748138427734, -0.006232261657714844, -0.005943775177001953, -0.0056552886962890625, -0.005366802215576172, -0.005078315734863281, -0.004789829254150391, -0.0045013427734375, -0.004212856292724609, -0.003924369812011719, -0.003635883331298828, -0.0033473968505859375, -0.003058910369873047, -0.0027704238891601562, -0.0024819374084472656, -0.002193450927734375, -0.0019049644470214844, -0.0016164779663085938, -0.0013279914855957031, -0.0010395050048828125, -0.0007510185241699219, -0.00046253204345703125, -0.00017404556274414062, 0.00011444091796875, 0.0004029273986816406, 0.0006914138793945312, 0.0009799003601074219, 0.0012683868408203125, 0.0015568733215332031, 0.0018453598022460938, 0.0021338462829589844, 0.002422332763671875, 0.0027108192443847656, 0.0029993057250976562, 0.003287792205810547, 0.0035762786865234375, 0.003864765167236328, 0.004153251647949219, 0.004441738128662109, 0.004730224609375, 0.005018711090087891, 0.005307197570800781, 0.005595684051513672, 0.0058841705322265625, 0.006172657012939453, 0.006461143493652344, 0.006749629974365234, 0.007038116455078125, 0.007326602935791016, 0.007615089416503906, 0.007903575897216797, 0.008192062377929688, 0.008480548858642578, 0.008769035339355469, 0.00905752182006836, 0.00934600830078125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 6.0, 2.0, 1.0, 6.0, 1.0, 3.0, 11.0, 18.0, 16.0, 17.0, 19.0, 25.0, 28.0, 37.0, 33.0, 45.0, 46.0, 53.0, 55.0, 62.0, 53.0, 65.0, 61.0, 56.0, 45.0, 34.0, 31.0, 26.0, 24.0, 27.0, 21.0, 16.0, 5.0, 12.0, 10.0, 9.0, 6.0, 2.0, 2.0, 2.0, 4.0, 7.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0017490386962890625, -0.0016888082027435303, -0.001628577709197998, -0.0015683472156524658, -0.0015081167221069336, -0.0014478862285614014, -0.0013876557350158691, -0.001327425241470337, -0.0012671947479248047, -0.0012069642543792725, -0.0011467337608337402, -0.001086503267288208, -0.0010262727737426758, -0.0009660422801971436, -0.0009058117866516113, -0.0008455812931060791, -0.0007853507995605469, -0.0007251203060150146, -0.0006648898124694824, -0.0006046593189239502, -0.000544428825378418, -0.00048419833183288574, -0.0004239678382873535, -0.0003637373447418213, -0.00030350685119628906, -0.00024327635765075684, -0.0001830458641052246, -0.00012281537055969238, -6.258487701416016e-05, -2.3543834686279297e-06, 5.78761100769043e-05, 0.00011810660362243652, 0.00017833709716796875, 0.00023856759071350098, 0.0002987980842590332, 0.00035902857780456543, 0.00041925907135009766, 0.0004794895648956299, 0.0005397200584411621, 0.0005999505519866943, 0.0006601810455322266, 0.0007204115390777588, 0.000780642032623291, 0.0008408725261688232, 0.0009011030197143555, 0.0009613335132598877, 0.00102156400680542, 0.0010817945003509521, 0.0011420249938964844, 0.0012022554874420166, 0.0012624859809875488, 0.001322716474533081, 0.0013829469680786133, 0.0014431774616241455, 0.0015034079551696777, 0.00156363844871521, 0.0016238689422607422, 0.0016840994358062744, 0.0017443299293518066, 0.0018045604228973389, 0.001864790916442871, 0.0019250214099884033, 0.0019852519035339355, 0.0020454823970794678, 0.002105712890625]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 8.0, 24.0, 31.0, 70.0, 136.0, 264.0, 222.0, 115.0, 63.0, 22.0, 19.0, 8.0, 5.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3553064465522766, -0.34480053186416626, -0.3342946171760559, -0.32378873229026794, -0.3132828176021576, -0.30277690291404724, -0.2922710180282593, -0.2817651033401489, -0.2712591886520386, -0.2607532739639282, -0.25024735927581787, -0.2397414743900299, -0.22923555970191956, -0.2187296450138092, -0.20822374522686005, -0.1977178454399109, -0.18721193075180054, -0.17670601606369019, -0.16620011627674103, -0.15569421648979187, -0.14518830180168152, -0.13468238711357117, -0.12417648732662201, -0.11367058008909225, -0.1031646728515625, -0.09265876561403275, -0.08215285837650299, -0.07164695113897324, -0.06114104390144348, -0.05063513666391373, -0.04012922942638397, -0.029623322188854218, -0.019117414951324463, -0.008611507713794708, 0.0018943995237350464, 0.012400306761264801, 0.022906213998794556, 0.03341212123632431, 0.043918028473854065, 0.05442393571138382, 0.06492984294891357, 0.07543575018644333, 0.08594165742397308, 0.09644756466150284, 0.10695347189903259, 0.11745937913656235, 0.1279652863740921, 0.13847118616104126, 0.1489771008491516, 0.15948301553726196, 0.16998891532421112, 0.18049481511116028, 0.19100072979927063, 0.20150664448738098, 0.21201254427433014, 0.2225184440612793, 0.23302435874938965, 0.2435302734375, 0.25403618812561035, 0.2645420730113983, 0.27504798769950867, 0.285553902387619, 0.296059787273407, 0.30656570196151733, 0.3170716166496277]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 6.0, 2.0, 1.0, 7.0, 10.0, 12.0, 18.0, 14.0, 17.0, 21.0, 28.0, 36.0, 38.0, 42.0, 50.0, 50.0, 49.0, 62.0, 63.0, 56.0, 35.0, 44.0, 54.0, 40.0, 42.0, 37.0, 41.0, 25.0, 24.0, 9.0, 19.0, 13.0, 7.0, 7.0, 6.0, 4.0, 6.0, 2.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10806149989366531, -0.10454869270324707, -0.10103588551282883, -0.09752307832241058, -0.09401026368141174, -0.0904974564909935, -0.08698464930057526, -0.08347184211015701, -0.07995903491973877, -0.07644622772932053, -0.07293342053890228, -0.06942060589790344, -0.0659077987074852, -0.062394991517066956, -0.05888218432664871, -0.05536937713623047, -0.05185656622052193, -0.048343759030103683, -0.04483094811439514, -0.0413181409239769, -0.037805333733558655, -0.03429252654314041, -0.03077971562743187, -0.027266908437013626, -0.023754099383950233, -0.02024129033088684, -0.016728483140468597, -0.013215674087405205, -0.009702865965664387, -0.006190057843923569, -0.002677248790860176, 0.0008355583995580673, 0.00434836745262146, 0.007861175574362278, 0.011373983696103096, 0.014886792749166489, 0.018399599939584732, 0.021912408992648125, 0.025425218045711517, 0.02893802523612976, 0.032450832426548004, 0.03596363961696625, 0.03947645053267479, 0.04298925772309303, 0.046502064913511276, 0.05001487582921982, 0.05352768301963806, 0.057040490210056305, 0.06055330112576485, 0.06406611204147339, 0.06757891923189163, 0.07109172642230988, 0.07460453361272812, 0.07811734080314636, 0.0816301554441452, 0.08514295518398285, 0.08865576982498169, 0.09216857701539993, 0.09568138420581818, 0.09919419884681702, 0.10270700603723526, 0.1062198132276535, 0.10973262041807175, 0.11324542760848999, 0.11675823479890823]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 6.0, 14.0, 33.0, 34.0, 62.0, 90.0, 173.0, 263.0, 503.0, 921.0, 1678.0, 3288.0, 6861.0, 15780.0, 43583.0, 182828.0, 581340.0, 146608.0, 37596.0, 14173.0, 6148.0, 3034.0, 1577.0, 838.0, 469.0, 277.0, 159.0, 102.0, 45.0, 38.0, 20.0, 12.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10638427734375, -0.10338211059570312, -0.10037994384765625, -0.09737777709960938, -0.0943756103515625, -0.09137344360351562, -0.08837127685546875, -0.08536911010742188, -0.082366943359375, -0.07936477661132812, -0.07636260986328125, -0.07336044311523438, -0.0703582763671875, -0.06735610961914062, -0.06435394287109375, -0.061351776123046875, -0.058349609375, -0.055347442626953125, -0.05234527587890625, -0.049343109130859375, -0.0463409423828125, -0.043338775634765625, -0.04033660888671875, -0.037334442138671875, -0.034332275390625, -0.031330108642578125, -0.02832794189453125, -0.025325775146484375, -0.0223236083984375, -0.019321441650390625, -0.01631927490234375, -0.013317108154296875, -0.01031494140625, -0.007312774658203125, -0.00431060791015625, -0.001308441162109375, 0.0016937255859375, 0.004695892333984375, 0.00769805908203125, 0.010700225830078125, 0.013702392578125, 0.016704559326171875, 0.01970672607421875, 0.022708892822265625, 0.0257110595703125, 0.028713226318359375, 0.03171539306640625, 0.034717559814453125, 0.0377197265625, 0.040721893310546875, 0.04372406005859375, 0.046726226806640625, 0.0497283935546875, 0.052730560302734375, 0.05573272705078125, 0.058734893798828125, 0.061737060546875, 0.06473922729492188, 0.06774139404296875, 0.07074356079101562, 0.0737457275390625, 0.07674789428710938, 0.07975006103515625, 0.08275222778320312, 0.08575439453125]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 5.0, 8.0, 3.0, 12.0, 12.0, 8.0, 16.0, 21.0, 26.0, 36.0, 37.0, 49.0, 48.0, 58.0, 53.0, 53.0, 61.0, 54.0, 41.0, 47.0, 49.0, 56.0, 48.0, 44.0, 32.0, 27.0, 21.0, 12.0, 11.0, 12.0, 10.0, 9.0, 4.0, 6.0, 3.0, 1.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.243408203125, -0.23533248901367188, -0.22725677490234375, -0.21918106079101562, -0.2111053466796875, -0.20302963256835938, -0.19495391845703125, -0.18687820434570312, -0.178802490234375, -0.17072677612304688, -0.16265106201171875, -0.15457534790039062, -0.1464996337890625, -0.13842391967773438, -0.13034820556640625, -0.12227249145507812, -0.11419677734375, -0.10612106323242188, -0.09804534912109375, -0.08996963500976562, -0.0818939208984375, -0.07381820678710938, -0.06574249267578125, -0.057666778564453125, -0.049591064453125, -0.041515350341796875, -0.03343963623046875, -0.025363922119140625, -0.0172882080078125, -0.009212493896484375, -0.00113677978515625, 0.006938934326171875, 0.0150146484375, 0.023090362548828125, 0.03116607666015625, 0.039241790771484375, 0.0473175048828125, 0.055393218994140625, 0.06346893310546875, 0.07154464721679688, 0.079620361328125, 0.08769607543945312, 0.09577178955078125, 0.10384750366210938, 0.1119232177734375, 0.11999893188476562, 0.12807464599609375, 0.13615036010742188, 0.14422607421875, 0.15230178833007812, 0.16037750244140625, 0.16845321655273438, 0.1765289306640625, 0.18460464477539062, 0.19268035888671875, 0.20075607299804688, 0.208831787109375, 0.21690750122070312, 0.22498321533203125, 0.23305892944335938, 0.2411346435546875, 0.24921035766601562, 0.25728607177734375, 0.2653617858886719, 0.2734375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 4.0, 3.0, 3.0, 9.0, 17.0, 27.0, 32.0, 54.0, 101.0, 182.0, 436.0, 1186.0, 5538.0, 141672.0, 879515.0, 16557.0, 2020.0, 611.0, 266.0, 129.0, 61.0, 44.0, 25.0, 13.0, 13.0, 4.0, 6.0, 5.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.33544921875, -0.3264350891113281, -0.31742095947265625, -0.3084068298339844, -0.2993927001953125, -0.2903785705566406, -0.28136444091796875, -0.2723503112792969, -0.263336181640625, -0.2543220520019531, -0.24530792236328125, -0.23629379272460938, -0.2272796630859375, -0.21826553344726562, -0.20925140380859375, -0.20023727416992188, -0.19122314453125, -0.18220901489257812, -0.17319488525390625, -0.16418075561523438, -0.1551666259765625, -0.14615249633789062, -0.13713836669921875, -0.12812423706054688, -0.119110107421875, -0.11009597778320312, -0.10108184814453125, -0.09206771850585938, -0.0830535888671875, -0.07403945922851562, -0.06502532958984375, -0.056011199951171875, -0.0469970703125, -0.037982940673828125, -0.02896881103515625, -0.019954681396484375, -0.0109405517578125, -0.001926422119140625, 0.00708770751953125, 0.016101837158203125, 0.025115966796875, 0.034130096435546875, 0.04314422607421875, 0.052158355712890625, 0.0611724853515625, 0.07018661499023438, 0.07920074462890625, 0.08821487426757812, 0.09722900390625, 0.10624313354492188, 0.11525726318359375, 0.12427139282226562, 0.1332855224609375, 0.14229965209960938, 0.15131378173828125, 0.16032791137695312, 0.169342041015625, 0.17835617065429688, 0.18737030029296875, 0.19638442993164062, 0.2053985595703125, 0.21441268920898438, 0.22342681884765625, 0.23244094848632812, 0.241455078125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 7.0, 3.0, 7.0, 6.0, 9.0, 11.0, 13.0, 24.0, 12.0, 16.0, 21.0, 25.0, 28.0, 26.0, 39.0, 42.0, 49.0, 34.0, 35.0, 43.0, 44.0, 55.0, 37.0, 37.0, 32.0, 45.0, 45.0, 33.0, 37.0, 25.0, 22.0, 16.0, 20.0, 29.0, 15.0, 17.0, 8.0, 8.0, 9.0, 7.0, 3.0, 2.0, 3.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.2427978515625, -0.2352924346923828, -0.22778701782226562, -0.22028160095214844, -0.21277618408203125, -0.20527076721191406, -0.19776535034179688, -0.1902599334716797, -0.1827545166015625, -0.1752490997314453, -0.16774368286132812, -0.16023826599121094, -0.15273284912109375, -0.14522743225097656, -0.13772201538085938, -0.1302165985107422, -0.122711181640625, -0.11520576477050781, -0.10770034790039062, -0.10019493103027344, -0.09268951416015625, -0.08518409729003906, -0.07767868041992188, -0.07017326354980469, -0.0626678466796875, -0.05516242980957031, -0.047657012939453125, -0.04015159606933594, -0.03264617919921875, -0.025140762329101562, -0.017635345458984375, -0.010129928588867188, -0.00262451171875, 0.0048809051513671875, 0.012386322021484375, 0.019891738891601562, 0.02739715576171875, 0.03490257263183594, 0.042407989501953125, 0.04991340637207031, 0.0574188232421875, 0.06492424011230469, 0.07242965698242188, 0.07993507385253906, 0.08744049072265625, 0.09494590759277344, 0.10245132446289062, 0.10995674133300781, 0.117462158203125, 0.12496757507324219, 0.13247299194335938, 0.13997840881347656, 0.14748382568359375, 0.15498924255371094, 0.16249465942382812, 0.1700000762939453, 0.1775054931640625, 0.1850109100341797, 0.19251632690429688, 0.20002174377441406, 0.20752716064453125, 0.21503257751464844, 0.22253799438476562, 0.2300434112548828, 0.237548828125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 6.0, 12.0, 10.0, 18.0, 22.0, 55.0, 130.0, 304.0, 896.0, 4335.0, 84996.0, 943776.0, 11587.0, 1633.0, 444.0, 146.0, 78.0, 39.0, 21.0, 17.0, 12.0, 2.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.169189453125, -0.16438674926757812, -0.15958404541015625, -0.15478134155273438, -0.1499786376953125, -0.14517593383789062, -0.14037322998046875, -0.13557052612304688, -0.130767822265625, -0.12596511840820312, -0.12116241455078125, -0.11635971069335938, -0.1115570068359375, -0.10675430297851562, -0.10195159912109375, -0.09714889526367188, -0.09234619140625, -0.08754348754882812, -0.08274078369140625, -0.07793807983398438, -0.0731353759765625, -0.06833267211914062, -0.06352996826171875, -0.058727264404296875, -0.053924560546875, -0.049121856689453125, -0.04431915283203125, -0.039516448974609375, -0.0347137451171875, -0.029911041259765625, -0.02510833740234375, -0.020305633544921875, -0.0155029296875, -0.010700225830078125, -0.00589752197265625, -0.001094818115234375, 0.0037078857421875, 0.008510589599609375, 0.01331329345703125, 0.018115997314453125, 0.022918701171875, 0.027721405029296875, 0.03252410888671875, 0.037326812744140625, 0.0421295166015625, 0.046932220458984375, 0.05173492431640625, 0.056537628173828125, 0.06134033203125, 0.06614303588867188, 0.07094573974609375, 0.07574844360351562, 0.0805511474609375, 0.08535385131835938, 0.09015655517578125, 0.09495925903320312, 0.099761962890625, 0.10456466674804688, 0.10936737060546875, 0.11417007446289062, 0.1189727783203125, 0.12377548217773438, 0.12857818603515625, 0.13338088989257812, 0.13818359375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 4.0, 9.0, 15.0, 11.0, 22.0, 36.0, 79.0, 143.0, 230.0, 157.0, 125.0, 65.0, 38.0, 21.0, 14.0, 8.0, 5.0, 3.0, 3.0, 2.0, 5.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.6629695892333984e-05, -1.624133437871933e-05, -1.5852972865104675e-05, -1.546461135149002e-05, -1.5076249837875366e-05, -1.4687888324260712e-05, -1.4299526810646057e-05, -1.3911165297031403e-05, -1.3522803783416748e-05, -1.3134442269802094e-05, -1.2746080756187439e-05, -1.2357719242572784e-05, -1.196935772895813e-05, -1.1580996215343475e-05, -1.119263470172882e-05, -1.0804273188114166e-05, -1.0415911674499512e-05, -1.0027550160884857e-05, -9.639188647270203e-06, -9.250827133655548e-06, -8.862465620040894e-06, -8.474104106426239e-06, -8.085742592811584e-06, -7.69738107919693e-06, -7.309019565582275e-06, -6.920658051967621e-06, -6.532296538352966e-06, -6.143935024738312e-06, -5.755573511123657e-06, -5.367211997509003e-06, -4.978850483894348e-06, -4.590488970279694e-06, -4.202127456665039e-06, -3.8137659430503845e-06, -3.42540442943573e-06, -3.0370429158210754e-06, -2.648681402206421e-06, -2.2603198885917664e-06, -1.8719583749771118e-06, -1.4835968613624573e-06, -1.0952353477478027e-06, -7.068738341331482e-07, -3.1851232051849365e-07, 6.984919309616089e-08, 4.5821070671081543e-07, 8.4657222032547e-07, 1.2349337339401245e-06, 1.623295247554779e-06, 2.0116567611694336e-06, 2.400018274784088e-06, 2.7883797883987427e-06, 3.1767413020133972e-06, 3.5651028156280518e-06, 3.953464329242706e-06, 4.341825842857361e-06, 4.730187356472015e-06, 5.11854887008667e-06, 5.5069103837013245e-06, 5.895271897315979e-06, 6.2836334109306335e-06, 6.671994924545288e-06, 7.060356438159943e-06, 7.448717951774597e-06, 7.837079465389252e-06, 8.225440979003906e-06]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 4.0, 6.0, 15.0, 27.0, 39.0, 55.0, 117.0, 256.0, 831.0, 3757.0, 117340.0, 916322.0, 7898.0, 1169.0, 386.0, 134.0, 85.0, 40.0, 20.0, 17.0, 6.0, 6.0, 7.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.157470703125, -0.15187835693359375, -0.1462860107421875, -0.14069366455078125, -0.135101318359375, -0.12950897216796875, -0.1239166259765625, -0.11832427978515625, -0.11273193359375, -0.10713958740234375, -0.1015472412109375, -0.09595489501953125, -0.090362548828125, -0.08477020263671875, -0.0791778564453125, -0.07358551025390625, -0.0679931640625, -0.06240081787109375, -0.0568084716796875, -0.05121612548828125, -0.045623779296875, -0.04003143310546875, -0.0344390869140625, -0.02884674072265625, -0.02325439453125, -0.01766204833984375, -0.0120697021484375, -0.00647735595703125, -0.000885009765625, 0.00470733642578125, 0.0102996826171875, 0.01589202880859375, 0.021484375, 0.02707672119140625, 0.0326690673828125, 0.03826141357421875, 0.043853759765625, 0.04944610595703125, 0.0550384521484375, 0.06063079833984375, 0.06622314453125, 0.07181549072265625, 0.0774078369140625, 0.08300018310546875, 0.088592529296875, 0.09418487548828125, 0.0997772216796875, 0.10536956787109375, 0.1109619140625, 0.11655426025390625, 0.1221466064453125, 0.12773895263671875, 0.133331298828125, 0.13892364501953125, 0.1445159912109375, 0.15010833740234375, 0.15570068359375, 0.16129302978515625, 0.1668853759765625, 0.17247772216796875, 0.178070068359375, 0.18366241455078125, 0.1892547607421875, 0.19484710693359375, 0.200439453125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 5.0, 5.0, 9.0, 7.0, 8.0, 26.0, 23.0, 66.0, 111.0, 235.0, 233.0, 120.0, 61.0, 29.0, 20.0, 18.0, 14.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049224853515625, -0.04785728454589844, -0.046489715576171875, -0.04512214660644531, -0.04375457763671875, -0.04238700866699219, -0.041019439697265625, -0.03965187072753906, -0.0382843017578125, -0.03691673278808594, -0.035549163818359375, -0.03418159484863281, -0.03281402587890625, -0.03144645690917969, -0.030078887939453125, -0.028711318969726562, -0.02734375, -0.025976181030273438, -0.024608612060546875, -0.023241043090820312, -0.02187347412109375, -0.020505905151367188, -0.019138336181640625, -0.017770767211914062, -0.0164031982421875, -0.015035629272460938, -0.013668060302734375, -0.012300491333007812, -0.01093292236328125, -0.009565353393554688, -0.008197784423828125, -0.0068302154541015625, -0.005462646484375, -0.0040950775146484375, -0.002727508544921875, -0.0013599395751953125, 7.62939453125e-06, 0.0013751983642578125, 0.002742767333984375, 0.0041103363037109375, 0.0054779052734375, 0.0068454742431640625, 0.008213043212890625, 0.009580612182617188, 0.01094818115234375, 0.012315750122070312, 0.013683319091796875, 0.015050888061523438, 0.01641845703125, 0.017786026000976562, 0.019153594970703125, 0.020521163940429688, 0.02188873291015625, 0.023256301879882812, 0.024623870849609375, 0.025991439819335938, 0.0273590087890625, 0.028726577758789062, 0.030094146728515625, 0.03146171569824219, 0.03282928466796875, 0.03419685363769531, 0.035564422607421875, 0.03693199157714844, 0.038299560546875]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 13.0, 41.0, 169.0, 461.0, 236.0, 61.0, 12.0, 11.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.575226366519928, -0.5330412983894348, -0.49085626006126404, -0.4486711919307709, -0.4064861536026001, -0.36430108547210693, -0.32211601734161377, -0.279930979013443, -0.23774591088294983, -0.19556085765361786, -0.1533758044242859, -0.11119073629379272, -0.06900568306446075, -0.026820629835128784, 0.01536443829536438, 0.057549476623535156, 0.09973454475402832, 0.1419195979833603, 0.18410465121269226, 0.22628971934318542, 0.2684747576713562, 0.31065982580184937, 0.35284489393234253, 0.3950299322605133, 0.43721500039100647, 0.47940006852149963, 0.5215851068496704, 0.5637701749801636, 0.6059552431106567, 0.6481403112411499, 0.6903253793716431, 0.7325103878974915, 0.7746955156326294, 0.8168805837631226, 0.8590656518936157, 0.9012507200241089, 0.9434357285499573, 0.9856207966804504, 1.0278058052062988, 1.069990873336792, 1.1121759414672852, 1.1543610095977783, 1.1965460777282715, 1.2387311458587646, 1.2809162139892578, 1.323101282119751, 1.3652863502502441, 1.4074712991714478, 1.4496564865112305, 1.4918415546417236, 1.5340266227722168, 1.57621169090271, 1.6183967590332031, 1.6605818271636963, 1.7027668952941895, 1.744951844215393, 1.7871369123458862, 1.8293219804763794, 1.8715070486068726, 1.9136921167373657, 1.9558771848678589, 1.9980621337890625, 2.0402472019195557, 2.082432270050049, 2.124617338180542]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 6.0, 12.0, 15.0, 17.0, 26.0, 19.0, 37.0, 27.0, 29.0, 52.0, 34.0, 35.0, 44.0, 48.0, 47.0, 60.0, 60.0, 45.0, 52.0, 48.0, 40.0, 45.0, 36.0, 35.0, 25.0, 16.0, 19.0, 14.0, 13.0, 12.0, 11.0, 4.0, 7.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.6271568536758423, -0.6113367676734924, -0.5955166816711426, -0.5796966552734375, -0.5638765692710876, -0.5480564832687378, -0.5322363972663879, -0.5164163112640381, -0.500596284866333, -0.48477619886398315, -0.4689561426639557, -0.45313605666160583, -0.43731600046157837, -0.4214959144592285, -0.40567582845687866, -0.3898557424545288, -0.37403565645217896, -0.3582155704498291, -0.34239551424980164, -0.3265754282474518, -0.3107553720474243, -0.29493528604507446, -0.2791152000427246, -0.26329511404037476, -0.2474750578403473, -0.23165498673915863, -0.21583491563796997, -0.20001482963562012, -0.18419475853443146, -0.1683746874332428, -0.15255460143089294, -0.13673453032970428, -0.12091448903083801, -0.10509441792964935, -0.0892743393778801, -0.07345426082611084, -0.05763418972492218, -0.04181411862373352, -0.025994040071964264, -0.010173961520195007, 0.005646109580993652, 0.02146618440747261, 0.03728625923395157, 0.05310633406043053, 0.06892640888690948, 0.08474647998809814, 0.1005665585398674, 0.11638663709163666, 0.13220670819282532, 0.14802677929401398, 0.16384685039520264, 0.1796669363975525, 0.19548700749874115, 0.2113070785999298, 0.22712716460227966, 0.24294723570346832, 0.258767306804657, 0.27458739280700684, 0.2904074490070343, 0.30622753500938416, 0.3220475912094116, 0.3378676772117615, 0.35368776321411133, 0.3695078492164612, 0.38532790541648865]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 5.0, 2.0, 3.0, 2.0, 3.0, 4.0, 11.0, 12.0, 14.0, 19.0, 36.0, 37.0, 68.0, 112.0, 185.0, 242.0, 491.0, 889.0, 1722.0, 4311.0, 14165.0, 117929.0, 2952185.0, 1039865.0, 47029.0, 8593.0, 3285.0, 1371.0, 749.0, 367.0, 219.0, 117.0, 74.0, 45.0, 42.0, 27.0, 19.0, 13.0, 8.0, 11.0, 3.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.291259765625, -0.28238677978515625, -0.2735137939453125, -0.26464080810546875, -0.255767822265625, -0.24689483642578125, -0.2380218505859375, -0.22914886474609375, -0.22027587890625, -0.21140289306640625, -0.2025299072265625, -0.19365692138671875, -0.184783935546875, -0.17591094970703125, -0.1670379638671875, -0.15816497802734375, -0.1492919921875, -0.14041900634765625, -0.1315460205078125, -0.12267303466796875, -0.113800048828125, -0.10492706298828125, -0.0960540771484375, -0.08718109130859375, -0.07830810546875, -0.06943511962890625, -0.0605621337890625, -0.05168914794921875, -0.042816162109375, -0.03394317626953125, -0.0250701904296875, -0.01619720458984375, -0.00732421875, 0.00154876708984375, 0.0104217529296875, 0.01929473876953125, 0.028167724609375, 0.03704071044921875, 0.0459136962890625, 0.05478668212890625, 0.06365966796875, 0.07253265380859375, 0.0814056396484375, 0.09027862548828125, 0.099151611328125, 0.10802459716796875, 0.1168975830078125, 0.12577056884765625, 0.1346435546875, 0.14351654052734375, 0.1523895263671875, 0.16126251220703125, 0.170135498046875, 0.17900848388671875, 0.1878814697265625, 0.19675445556640625, 0.20562744140625, 0.21450042724609375, 0.2233734130859375, 0.23224639892578125, 0.241119384765625, 0.24999237060546875, 0.2588653564453125, 0.26773834228515625, 0.276611328125]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 9.0, 4.0, 8.0, 20.0, 18.0, 28.0, 22.0, 25.0, 25.0, 40.0, 38.0, 64.0, 54.0, 43.0, 54.0, 51.0, 70.0, 45.0, 57.0, 47.0, 35.0, 37.0, 35.0, 30.0, 26.0, 16.0, 18.0, 10.0, 14.0, 9.0, 7.0, 11.0, 6.0, 6.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11334228515625, -0.10926532745361328, -0.10518836975097656, -0.10111141204833984, -0.09703445434570312, -0.0929574966430664, -0.08888053894042969, -0.08480358123779297, -0.08072662353515625, -0.07664966583251953, -0.07257270812988281, -0.0684957504272461, -0.06441879272460938, -0.060341835021972656, -0.05626487731933594, -0.05218791961669922, -0.0481109619140625, -0.04403400421142578, -0.03995704650878906, -0.035880088806152344, -0.031803131103515625, -0.027726173400878906, -0.023649215698242188, -0.01957225799560547, -0.01549530029296875, -0.011418342590332031, -0.0073413848876953125, -0.0032644271850585938, 0.000812530517578125, 0.004889488220214844, 0.008966445922851562, 0.013043403625488281, 0.017120361328125, 0.02119731903076172, 0.025274276733398438, 0.029351234436035156, 0.033428192138671875, 0.037505149841308594, 0.04158210754394531, 0.04565906524658203, 0.04973602294921875, 0.05381298065185547, 0.05788993835449219, 0.061966896057128906, 0.06604385375976562, 0.07012081146240234, 0.07419776916503906, 0.07827472686767578, 0.0823516845703125, 0.08642864227294922, 0.09050559997558594, 0.09458255767822266, 0.09865951538085938, 0.1027364730834961, 0.10681343078613281, 0.11089038848876953, 0.11496734619140625, 0.11904430389404297, 0.12312126159667969, 0.1271982192993164, 0.13127517700195312, 0.13535213470458984, 0.13942909240722656, 0.14350605010986328, 0.1475830078125]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 5.0, 4.0, 3.0, 9.0, 8.0, 13.0, 13.0, 15.0, 27.0, 50.0, 55.0, 104.0, 183.0, 321.0, 754.0, 2102.0, 8211.0, 63622.0, 3762991.0, 330422.0, 19270.0, 3884.0, 1168.0, 470.0, 229.0, 118.0, 81.0, 42.0, 25.0, 20.0, 17.0, 12.0, 7.0, 13.0, 12.0, 3.0, 1.0, 2.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.32666015625, -0.31603240966796875, -0.3054046630859375, -0.29477691650390625, -0.284149169921875, -0.27352142333984375, -0.2628936767578125, -0.25226593017578125, -0.24163818359375, -0.23101043701171875, -0.2203826904296875, -0.20975494384765625, -0.199127197265625, -0.18849945068359375, -0.1778717041015625, -0.16724395751953125, -0.1566162109375, -0.14598846435546875, -0.1353607177734375, -0.12473297119140625, -0.114105224609375, -0.10347747802734375, -0.0928497314453125, -0.08222198486328125, -0.07159423828125, -0.06096649169921875, -0.0503387451171875, -0.03971099853515625, -0.029083251953125, -0.01845550537109375, -0.0078277587890625, 0.00279998779296875, 0.013427734375, 0.02405548095703125, 0.0346832275390625, 0.04531097412109375, 0.055938720703125, 0.06656646728515625, 0.0771942138671875, 0.08782196044921875, 0.09844970703125, 0.10907745361328125, 0.1197052001953125, 0.13033294677734375, 0.140960693359375, 0.15158843994140625, 0.1622161865234375, 0.17284393310546875, 0.1834716796875, 0.19409942626953125, 0.2047271728515625, 0.21535491943359375, 0.225982666015625, 0.23661041259765625, 0.2472381591796875, 0.25786590576171875, 0.26849365234375, 0.27912139892578125, 0.2897491455078125, 0.30037689208984375, 0.311004638671875, 0.32163238525390625, 0.3322601318359375, 0.34288787841796875, 0.353515625]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 5.0, 5.0, 9.0, 13.0, 10.0, 20.0, 28.0, 44.0, 82.0, 83.0, 168.0, 387.0, 643.0, 957.0, 685.0, 380.0, 191.0, 118.0, 72.0, 41.0, 27.0, 25.0, 23.0, 17.0, 10.0, 5.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055877685546875, -0.0538487434387207, -0.051819801330566406, -0.04979085922241211, -0.04776191711425781, -0.045732975006103516, -0.04370403289794922, -0.04167509078979492, -0.039646148681640625, -0.03761720657348633, -0.03558826446533203, -0.033559322357177734, -0.03153038024902344, -0.02950143814086914, -0.027472496032714844, -0.025443553924560547, -0.02341461181640625, -0.021385669708251953, -0.019356727600097656, -0.01732778549194336, -0.015298843383789062, -0.013269901275634766, -0.011240959167480469, -0.009212017059326172, -0.007183074951171875, -0.005154132843017578, -0.0031251907348632812, -0.0010962486267089844, 0.0009326934814453125, 0.0029616355895996094, 0.004990577697753906, 0.007019519805908203, 0.0090484619140625, 0.011077404022216797, 0.013106346130371094, 0.01513528823852539, 0.017164230346679688, 0.019193172454833984, 0.02122211456298828, 0.023251056671142578, 0.025279998779296875, 0.027308940887451172, 0.02933788299560547, 0.031366825103759766, 0.03339576721191406, 0.03542470932006836, 0.037453651428222656, 0.03948259353637695, 0.04151153564453125, 0.04354047775268555, 0.045569419860839844, 0.04759836196899414, 0.04962730407714844, 0.051656246185302734, 0.05368518829345703, 0.05571413040161133, 0.057743072509765625, 0.05977201461791992, 0.06180095672607422, 0.06382989883422852, 0.06585884094238281, 0.06788778305053711, 0.0699167251586914, 0.0719456672668457, 0.073974609375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 8.0, 3.0, 6.0, 14.0, 14.0, 17.0, 55.0, 67.0, 97.0, 152.0, 144.0, 145.0, 92.0, 57.0, 44.0, 32.0, 24.0, 10.0, 2.0, 5.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.32026854157447815, -0.3109922707080841, -0.3017159700393677, -0.29243969917297363, -0.2831634283065796, -0.27388715744018555, -0.2646108567714691, -0.2553345859050751, -0.24605830013751984, -0.2367820143699646, -0.22750574350357056, -0.21822945773601532, -0.20895317196846008, -0.19967690110206604, -0.1904006153345108, -0.18112432956695557, -0.17184805870056152, -0.1625717729330063, -0.15329550206661224, -0.144019216299057, -0.13474294543266296, -0.12546665966510773, -0.11619037389755249, -0.10691409558057785, -0.09763781726360321, -0.08836153894662857, -0.07908526062965393, -0.0698089748620987, -0.060532696545124054, -0.051256418228149414, -0.041980136185884476, -0.03270385414361954, -0.023427575826644897, -0.014151295647025108, -0.004875015467405319, 0.00440126471221447, 0.013677544891834259, 0.0229538232088089, 0.03223010525107384, 0.041506387293338776, 0.050782665610313416, 0.060058943927288055, 0.0693352222442627, 0.07861150801181793, 0.08788778632879257, 0.09716406464576721, 0.10644035041332245, 0.11571662873029709, 0.12499290704727173, 0.13426919281482697, 0.143545463681221, 0.15282174944877625, 0.1620980203151703, 0.17137430608272552, 0.18065059185028076, 0.1899268627166748, 0.19920314848423004, 0.20847943425178528, 0.21775570511817932, 0.22703199088573456, 0.2363082766532898, 0.24558454751968384, 0.2548608183860779, 0.2641371190547943, 0.27341338992118835]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 4.0, 11.0, 16.0, 17.0, 16.0, 21.0, 23.0, 22.0, 16.0, 36.0, 40.0, 32.0, 33.0, 46.0, 45.0, 49.0, 44.0, 57.0, 51.0, 42.0, 47.0, 49.0, 33.0, 43.0, 37.0, 31.0, 30.0, 18.0, 12.0, 16.0, 13.0, 15.0, 5.0, 6.0, 6.0, 2.0, 3.0, 4.0, 4.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11806507408618927, -0.11389222741127014, -0.10971938073635101, -0.10554653406143188, -0.10137368738651276, -0.09720084071159363, -0.0930280014872551, -0.08885515481233597, -0.08468230813741684, -0.08050946146249771, -0.07633661478757858, -0.07216376811265945, -0.06799092888832092, -0.0638180822134018, -0.059645235538482666, -0.05547238886356354, -0.05129954218864441, -0.04712669551372528, -0.04295384883880615, -0.03878100588917732, -0.034608159214258194, -0.030435312539339066, -0.026262467727065086, -0.022089622914791107, -0.01791677623987198, -0.013743930496275425, -0.009571084752678871, -0.005398239009082317, -0.0012253932654857635, 0.002947453409433365, 0.007120298221707344, 0.011293143033981323, 0.015466004610061646, 0.019638851284980774, 0.023811696097254753, 0.027984540909528732, 0.03215738758444786, 0.03633023425936699, 0.04050307720899582, 0.04467592388391495, 0.048848770558834076, 0.053021617233753204, 0.05719446390867233, 0.06136730685830116, 0.06554014980792999, 0.06971299648284912, 0.07388584315776825, 0.07805868983268738, 0.0822315365076065, 0.08640438318252563, 0.09057722985744476, 0.09475007653236389, 0.09892292320728302, 0.10309576988220215, 0.10726860910654068, 0.11144145578145981, 0.11561430245637894, 0.11978714913129807, 0.1239599958062172, 0.12813283503055573, 0.13230568170547485, 0.13647852838039398, 0.1406513750553131, 0.14482422173023224, 0.14899706840515137]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 2.0, 3.0, 14.0, 7.0, 15.0, 25.0, 69.0, 87.0, 181.0, 421.0, 770.0, 1804.0, 4467.0, 12421.0, 39922.0, 156743.0, 482547.0, 258288.0, 61947.0, 18145.0, 6223.0, 2438.0, 1020.0, 474.0, 255.0, 102.0, 68.0, 37.0, 26.0, 17.0, 11.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.037994384765625, -0.03703665733337402, -0.03607892990112305, -0.03512120246887207, -0.034163475036621094, -0.03320574760437012, -0.03224802017211914, -0.031290292739868164, -0.030332565307617188, -0.02937483787536621, -0.028417110443115234, -0.027459383010864258, -0.02650165557861328, -0.025543928146362305, -0.024586200714111328, -0.02362847328186035, -0.022670745849609375, -0.0217130184173584, -0.020755290985107422, -0.019797563552856445, -0.01883983612060547, -0.017882108688354492, -0.016924381256103516, -0.01596665382385254, -0.015008926391601562, -0.014051198959350586, -0.01309347152709961, -0.012135744094848633, -0.011178016662597656, -0.01022028923034668, -0.009262561798095703, -0.008304834365844727, -0.00734710693359375, -0.0063893795013427734, -0.005431652069091797, -0.00447392463684082, -0.0035161972045898438, -0.002558469772338867, -0.0016007423400878906, -0.0006430149078369141, 0.0003147125244140625, 0.001272439956665039, 0.0022301673889160156, 0.003187894821166992, 0.004145622253417969, 0.005103349685668945, 0.006061077117919922, 0.0070188045501708984, 0.007976531982421875, 0.008934259414672852, 0.009891986846923828, 0.010849714279174805, 0.011807441711425781, 0.012765169143676758, 0.013722896575927734, 0.014680624008178711, 0.015638351440429688, 0.016596078872680664, 0.01755380630493164, 0.018511533737182617, 0.019469261169433594, 0.02042698860168457, 0.021384716033935547, 0.022342443466186523, 0.0233001708984375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 8.0, 9.0, 19.0, 23.0, 19.0, 23.0, 23.0, 26.0, 27.0, 35.0, 57.0, 45.0, 50.0, 44.0, 62.0, 57.0, 59.0, 47.0, 58.0, 42.0, 53.0, 38.0, 35.0, 25.0, 22.0, 20.0, 7.0, 8.0, 9.0, 10.0, 13.0, 6.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.095458984375, -0.0921010971069336, -0.08874320983886719, -0.08538532257080078, -0.08202743530273438, -0.07866954803466797, -0.07531166076660156, -0.07195377349853516, -0.06859588623046875, -0.06523799896240234, -0.06188011169433594, -0.05852222442626953, -0.055164337158203125, -0.05180644989013672, -0.04844856262207031, -0.045090675354003906, -0.0417327880859375, -0.038374900817871094, -0.03501701354980469, -0.03165912628173828, -0.028301239013671875, -0.02494335174560547, -0.021585464477539062, -0.018227577209472656, -0.01486968994140625, -0.011511802673339844, -0.008153915405273438, -0.004796028137207031, -0.001438140869140625, 0.0019197463989257812, 0.0052776336669921875, 0.008635520935058594, 0.011993408203125, 0.015351295471191406, 0.018709182739257812, 0.02206707000732422, 0.025424957275390625, 0.02878284454345703, 0.03214073181152344, 0.035498619079589844, 0.03885650634765625, 0.042214393615722656, 0.04557228088378906, 0.04893016815185547, 0.052288055419921875, 0.05564594268798828, 0.05900382995605469, 0.062361717224121094, 0.0657196044921875, 0.0690774917602539, 0.07243537902832031, 0.07579326629638672, 0.07915115356445312, 0.08250904083251953, 0.08586692810058594, 0.08922481536865234, 0.09258270263671875, 0.09594058990478516, 0.09929847717285156, 0.10265636444091797, 0.10601425170898438, 0.10937213897705078, 0.11273002624511719, 0.1160879135131836, 0.11944580078125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 7.0, 6.0, 5.0, 14.0, 14.0, 21.0, 38.0, 77.0, 111.0, 177.0, 342.0, 603.0, 1162.0, 2607.0, 6800.0, 20911.0, 84265.0, 379515.0, 417585.0, 97268.0, 23864.0, 7454.0, 2854.0, 1309.0, 680.0, 346.0, 203.0, 108.0, 75.0, 35.0, 25.0, 16.0, 13.0, 9.0, 8.0, 3.0, 6.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.032928466796875, -0.03196120262145996, -0.030993938446044922, -0.030026674270629883, -0.029059410095214844, -0.028092145919799805, -0.027124881744384766, -0.026157617568969727, -0.025190353393554688, -0.02422308921813965, -0.02325582504272461, -0.02228856086730957, -0.02132129669189453, -0.020354032516479492, -0.019386768341064453, -0.018419504165649414, -0.017452239990234375, -0.016484975814819336, -0.015517711639404297, -0.014550447463989258, -0.013583183288574219, -0.01261591911315918, -0.01164865493774414, -0.010681390762329102, -0.009714126586914062, -0.008746862411499023, -0.007779598236083984, -0.006812334060668945, -0.005845069885253906, -0.004877805709838867, -0.003910541534423828, -0.002943277359008789, -0.00197601318359375, -0.001008749008178711, -4.1484832763671875e-05, 0.0009257793426513672, 0.0018930435180664062, 0.0028603076934814453, 0.0038275718688964844, 0.0047948360443115234, 0.0057621002197265625, 0.0067293643951416016, 0.007696628570556641, 0.00866389274597168, 0.009631156921386719, 0.010598421096801758, 0.011565685272216797, 0.012532949447631836, 0.013500213623046875, 0.014467477798461914, 0.015434741973876953, 0.016402006149291992, 0.01736927032470703, 0.01833653450012207, 0.01930379867553711, 0.02027106285095215, 0.021238327026367188, 0.022205591201782227, 0.023172855377197266, 0.024140119552612305, 0.025107383728027344, 0.026074647903442383, 0.027041912078857422, 0.02800917625427246, 0.0289764404296875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 5.0, 3.0, 6.0, 6.0, 15.0, 13.0, 14.0, 16.0, 13.0, 23.0, 19.0, 26.0, 19.0, 21.0, 26.0, 38.0, 32.0, 37.0, 39.0, 41.0, 37.0, 43.0, 37.0, 44.0, 36.0, 40.0, 36.0, 50.0, 31.0, 17.0, 34.0, 30.0, 24.0, 26.0, 16.0, 15.0, 9.0, 9.0, 16.0, 9.0, 7.0, 5.0, 7.0, 6.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.1640625, -0.15893936157226562, -0.15381622314453125, -0.14869308471679688, -0.1435699462890625, -0.13844680786132812, -0.13332366943359375, -0.12820053100585938, -0.123077392578125, -0.11795425415039062, -0.11283111572265625, -0.10770797729492188, -0.1025848388671875, -0.09746170043945312, -0.09233856201171875, -0.08721542358398438, -0.08209228515625, -0.07696914672851562, -0.07184600830078125, -0.06672286987304688, -0.0615997314453125, -0.056476593017578125, -0.05135345458984375, -0.046230316162109375, -0.041107177734375, -0.035984039306640625, -0.03086090087890625, -0.025737762451171875, -0.0206146240234375, -0.015491485595703125, -0.01036834716796875, -0.005245208740234375, -0.0001220703125, 0.005001068115234375, 0.01012420654296875, 0.015247344970703125, 0.0203704833984375, 0.025493621826171875, 0.03061676025390625, 0.035739898681640625, 0.040863037109375, 0.045986175537109375, 0.05110931396484375, 0.056232452392578125, 0.0613555908203125, 0.06647872924804688, 0.07160186767578125, 0.07672500610351562, 0.08184814453125, 0.08697128295898438, 0.09209442138671875, 0.09721755981445312, 0.1023406982421875, 0.10746383666992188, 0.11258697509765625, 0.11771011352539062, 0.122833251953125, 0.12795639038085938, 0.13307952880859375, 0.13820266723632812, 0.1433258056640625, 0.14844894409179688, 0.15357208251953125, 0.15869522094726562, 0.163818359375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 6.0, 6.0, 12.0, 14.0, 24.0, 37.0, 60.0, 109.0, 236.0, 495.0, 1255.0, 4028.0, 20170.0, 215857.0, 710464.0, 81264.0, 10412.0, 2464.0, 863.0, 378.0, 167.0, 85.0, 56.0, 30.0, 17.0, 12.0, 9.0, 9.0, 4.0, 9.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0142364501953125, -0.013715267181396484, -0.013194084167480469, -0.012672901153564453, -0.012151718139648438, -0.011630535125732422, -0.011109352111816406, -0.01058816909790039, -0.010066986083984375, -0.00954580307006836, -0.009024620056152344, -0.008503437042236328, -0.007982254028320312, -0.007461071014404297, -0.006939888000488281, -0.006418704986572266, -0.00589752197265625, -0.005376338958740234, -0.004855155944824219, -0.004333972930908203, -0.0038127899169921875, -0.003291606903076172, -0.0027704238891601562, -0.0022492408752441406, -0.001728057861328125, -0.0012068748474121094, -0.0006856918334960938, -0.00016450881958007812, 0.0003566741943359375, 0.0008778572082519531, 0.0013990402221679688, 0.0019202232360839844, 0.00244140625, 0.0029625892639160156, 0.0034837722778320312, 0.004004955291748047, 0.0045261383056640625, 0.005047321319580078, 0.005568504333496094, 0.006089687347412109, 0.006610870361328125, 0.007132053375244141, 0.007653236389160156, 0.008174419403076172, 0.008695602416992188, 0.009216785430908203, 0.009737968444824219, 0.010259151458740234, 0.01078033447265625, 0.011301517486572266, 0.011822700500488281, 0.012343883514404297, 0.012865066528320312, 0.013386249542236328, 0.013907432556152344, 0.01442861557006836, 0.014949798583984375, 0.01547098159790039, 0.015992164611816406, 0.016513347625732422, 0.017034530639648438, 0.017555713653564453, 0.01807689666748047, 0.018598079681396484, 0.0191192626953125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 9.0, 6.0, 12.0, 18.0, 15.0, 37.0, 32.0, 57.0, 58.0, 57.0, 107.0, 75.0, 125.0, 82.0, 68.0, 53.0, 43.0, 43.0, 23.0, 27.0, 9.0, 12.0, 12.0, 6.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.841255187988281e-06, -5.638226866722107e-06, -5.435198545455933e-06, -5.232170224189758e-06, -5.029141902923584e-06, -4.82611358165741e-06, -4.623085260391235e-06, -4.420056939125061e-06, -4.217028617858887e-06, -4.014000296592712e-06, -3.810971975326538e-06, -3.6079436540603638e-06, -3.4049153327941895e-06, -3.201887011528015e-06, -2.998858690261841e-06, -2.7958303689956665e-06, -2.592802047729492e-06, -2.389773726463318e-06, -2.1867454051971436e-06, -1.9837170839309692e-06, -1.780688762664795e-06, -1.5776604413986206e-06, -1.3746321201324463e-06, -1.171603798866272e-06, -9.685754776000977e-07, -7.655471563339233e-07, -5.62518835067749e-07, -3.594905138015747e-07, -1.564621925354004e-07, 4.6566128730773926e-08, 2.4959444999694824e-07, 4.5262277126312256e-07, 6.556510925292969e-07, 8.586794137954712e-07, 1.0617077350616455e-06, 1.2647360563278198e-06, 1.4677643775939941e-06, 1.6707926988601685e-06, 1.8738210201263428e-06, 2.076849341392517e-06, 2.2798776626586914e-06, 2.4829059839248657e-06, 2.68593430519104e-06, 2.8889626264572144e-06, 3.0919909477233887e-06, 3.295019268989563e-06, 3.4980475902557373e-06, 3.7010759115219116e-06, 3.904104232788086e-06, 4.10713255405426e-06, 4.3101608753204346e-06, 4.513189196586609e-06, 4.716217517852783e-06, 4.9192458391189575e-06, 5.122274160385132e-06, 5.325302481651306e-06, 5.5283308029174805e-06, 5.731359124183655e-06, 5.934387445449829e-06, 6.137415766716003e-06, 6.340444087982178e-06, 6.543472409248352e-06, 6.746500730514526e-06, 6.949529051780701e-06, 7.152557373046875e-06]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 9.0, 7.0, 3.0, 14.0, 15.0, 33.0, 27.0, 41.0, 62.0, 113.0, 150.0, 234.0, 443.0, 830.0, 1940.0, 4786.0, 15297.0, 64376.0, 313413.0, 481180.0, 126005.0, 26734.0, 7441.0, 2755.0, 1157.0, 603.0, 321.0, 194.0, 113.0, 87.0, 53.0, 43.0, 19.0, 18.0, 10.0, 14.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00933837890625, -0.009018659591674805, -0.00869894027709961, -0.008379220962524414, -0.008059501647949219, -0.0077397823333740234, -0.007420063018798828, -0.007100343704223633, -0.0067806243896484375, -0.006460905075073242, -0.006141185760498047, -0.0058214664459228516, -0.005501747131347656, -0.005182027816772461, -0.004862308502197266, -0.00454258918762207, -0.004222869873046875, -0.0039031505584716797, -0.0035834312438964844, -0.003263711929321289, -0.0029439926147460938, -0.0026242733001708984, -0.002304553985595703, -0.001984834671020508, -0.0016651153564453125, -0.0013453960418701172, -0.0010256767272949219, -0.0007059574127197266, -0.00038623809814453125, -6.651878356933594e-05, 0.0002532005310058594, 0.0005729198455810547, 0.00089263916015625, 0.0012123584747314453, 0.0015320777893066406, 0.001851797103881836, 0.0021715164184570312, 0.0024912357330322266, 0.002810955047607422, 0.003130674362182617, 0.0034503936767578125, 0.003770112991333008, 0.004089832305908203, 0.0044095516204833984, 0.004729270935058594, 0.005048990249633789, 0.005368709564208984, 0.00568842887878418, 0.006008148193359375, 0.00632786750793457, 0.006647586822509766, 0.006967306137084961, 0.007287025451660156, 0.0076067447662353516, 0.007926464080810547, 0.008246183395385742, 0.008565902709960938, 0.008885622024536133, 0.009205341339111328, 0.009525060653686523, 0.009844779968261719, 0.010164499282836914, 0.01048421859741211, 0.010803937911987305, 0.0111236572265625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 6.0, 12.0, 7.0, 15.0, 21.0, 19.0, 30.0, 35.0, 44.0, 68.0, 49.0, 63.0, 70.0, 78.0, 79.0, 58.0, 71.0, 61.0, 32.0, 46.0, 34.0, 30.0, 16.0, 10.0, 13.0, 12.0, 6.0, 3.0, 5.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0029659271240234375, -0.0028780102729797363, -0.002790093421936035, -0.002702176570892334, -0.002614259719848633, -0.0025263428688049316, -0.0024384260177612305, -0.0023505091667175293, -0.002262592315673828, -0.002174675464630127, -0.0020867586135864258, -0.0019988417625427246, -0.0019109249114990234, -0.0018230080604553223, -0.001735091209411621, -0.00164717435836792, -0.0015592575073242188, -0.0014713406562805176, -0.0013834238052368164, -0.0012955069541931152, -0.001207590103149414, -0.0011196732521057129, -0.0010317564010620117, -0.0009438395500183105, -0.0008559226989746094, -0.0007680058479309082, -0.000680088996887207, -0.0005921721458435059, -0.0005042552947998047, -0.0004163384437561035, -0.00032842159271240234, -0.00024050474166870117, -0.000152587890625, -6.467103958129883e-05, 2.3245811462402344e-05, 0.00011116266250610352, 0.0001990795135498047, 0.00028699636459350586, 0.00037491321563720703, 0.0004628300666809082, 0.0005507469177246094, 0.0006386637687683105, 0.0007265806198120117, 0.0008144974708557129, 0.0009024143218994141, 0.0009903311729431152, 0.0010782480239868164, 0.0011661648750305176, 0.0012540817260742188, 0.00134199857711792, 0.001429915428161621, 0.0015178322792053223, 0.0016057491302490234, 0.0016936659812927246, 0.0017815828323364258, 0.001869499683380127, 0.001957416534423828, 0.0020453333854675293, 0.0021332502365112305, 0.0022211670875549316, 0.002309083938598633, 0.002397000789642334, 0.002484917640686035, 0.0025728344917297363, 0.0026607513427734375]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 7.0, 13.0, 15.0, 52.0, 94.0, 169.0, 214.0, 188.0, 104.0, 61.0, 26.0, 24.0, 7.0, 7.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3339976370334625, -0.32557156682014465, -0.3171454668045044, -0.3087193965911865, -0.30029332637786865, -0.2918672561645508, -0.2834411859512329, -0.27501508593559265, -0.2665890157222748, -0.2581629455089569, -0.24973686039447784, -0.24131077527999878, -0.2328847050666809, -0.22445863485336304, -0.21603254973888397, -0.2076064646244049, -0.19918039441108704, -0.19075432419776917, -0.1823282390832901, -0.17390215396881104, -0.16547608375549316, -0.1570500135421753, -0.14862392842769623, -0.14019784331321716, -0.1317717730998993, -0.12334569543600082, -0.11491961777210236, -0.10649354010820389, -0.09806746244430542, -0.08964138478040695, -0.08121530711650848, -0.07278922945261002, -0.06436315178871155, -0.05593707412481308, -0.04751099646091461, -0.039084918797016144, -0.030658841133117676, -0.022232763469219208, -0.01380668580532074, -0.005380608141422272, 0.0030454695224761963, 0.011471547186374664, 0.019897624850273132, 0.0283237025141716, 0.03674978017807007, 0.045175857841968536, 0.053601935505867004, 0.06202801316976547, 0.07045409083366394, 0.07888016849756241, 0.08730624616146088, 0.09573232382535934, 0.10415840148925781, 0.11258447915315628, 0.12101055681705475, 0.1294366419315338, 0.13786271214485168, 0.14628878235816956, 0.15471486747264862, 0.16314095258712769, 0.17156702280044556, 0.17999309301376343, 0.1884191781282425, 0.19684526324272156, 0.20527133345603943]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 6.0, 6.0, 8.0, 17.0, 14.0, 24.0, 20.0, 29.0, 23.0, 35.0, 43.0, 37.0, 48.0, 41.0, 49.0, 64.0, 66.0, 52.0, 54.0, 58.0, 48.0, 34.0, 45.0, 35.0, 30.0, 24.0, 17.0, 14.0, 14.0, 12.0, 9.0, 5.0, 7.0, 0.0, 2.0, 4.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0979456678032875, -0.09462704509496689, -0.09130841493606567, -0.08798979222774506, -0.08467116206884384, -0.08135253936052322, -0.07803390920162201, -0.07471528649330139, -0.07139666378498077, -0.06807804107666016, -0.06475941091775894, -0.061440788209438324, -0.05812216177582741, -0.05480353534221649, -0.051484908908605576, -0.04816628247499466, -0.04484765604138374, -0.04152902960777283, -0.03821040317416191, -0.034891776740550995, -0.03157315403223038, -0.02825452759861946, -0.024935901165008545, -0.021617276594042778, -0.018298650160431862, -0.01498002465814352, -0.011661399155855179, -0.008342772722244263, -0.005024147219955921, -0.0017055217176675797, 0.0016131047159433365, 0.004931729286909103, 0.00825035572052002, 0.011568981222808361, 0.014887606725096703, 0.01820623315870762, 0.021524857729673386, 0.024843484163284302, 0.028162110596895218, 0.031480737030506134, 0.03479935973882675, 0.03811798617243767, 0.041436612606048584, 0.0447552353143692, 0.04807386174798012, 0.051392488181591034, 0.05471111461520195, 0.058029741048812866, 0.06134836748242378, 0.0646669939160347, 0.06798561662435532, 0.07130424678325653, 0.07462286949157715, 0.07794149219989777, 0.08126012235879898, 0.0845787450671196, 0.08789737522602081, 0.09121599793434143, 0.09453462809324265, 0.09785325080156326, 0.10117188096046448, 0.1044905036687851, 0.10780912637710571, 0.11112775653600693, 0.11444637924432755]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 7.0, 6.0, 2.0, 10.0, 21.0, 10.0, 23.0, 34.0, 49.0, 63.0, 128.0, 142.0, 268.0, 429.0, 689.0, 1210.0, 2213.0, 4444.0, 9748.0, 23440.0, 68303.0, 287531.0, 477539.0, 111663.0, 34522.0, 13509.0, 5880.0, 2901.0, 1538.0, 831.0, 506.0, 293.0, 186.0, 145.0, 91.0, 47.0, 44.0, 28.0, 22.0, 17.0, 10.0, 11.0, 2.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0711669921875, -0.06864261627197266, -0.06611824035644531, -0.06359386444091797, -0.061069488525390625, -0.05854511260986328, -0.05602073669433594, -0.053496360778808594, -0.05097198486328125, -0.048447608947753906, -0.04592323303222656, -0.04339885711669922, -0.040874481201171875, -0.03835010528564453, -0.03582572937011719, -0.033301353454589844, -0.0307769775390625, -0.028252601623535156, -0.025728225708007812, -0.02320384979248047, -0.020679473876953125, -0.01815509796142578, -0.015630722045898438, -0.013106346130371094, -0.01058197021484375, -0.008057594299316406, -0.0055332183837890625, -0.0030088424682617188, -0.000484466552734375, 0.0020399093627929688, 0.0045642852783203125, 0.007088661193847656, 0.009613037109375, 0.012137413024902344, 0.014661788940429688, 0.01718616485595703, 0.019710540771484375, 0.02223491668701172, 0.024759292602539062, 0.027283668518066406, 0.02980804443359375, 0.032332420349121094, 0.03485679626464844, 0.03738117218017578, 0.039905548095703125, 0.04242992401123047, 0.04495429992675781, 0.047478675842285156, 0.0500030517578125, 0.052527427673339844, 0.05505180358886719, 0.05757617950439453, 0.060100555419921875, 0.06262493133544922, 0.06514930725097656, 0.0676736831665039, 0.07019805908203125, 0.0727224349975586, 0.07524681091308594, 0.07777118682861328, 0.08029556274414062, 0.08281993865966797, 0.08534431457519531, 0.08786869049072266, 0.09039306640625]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 11.0, 12.0, 9.0, 16.0, 18.0, 22.0, 22.0, 39.0, 43.0, 48.0, 46.0, 52.0, 62.0, 74.0, 65.0, 57.0, 57.0, 65.0, 43.0, 40.0, 42.0, 32.0, 20.0, 19.0, 19.0, 14.0, 12.0, 7.0, 4.0, 4.0, 3.0, 3.0, 5.0, 5.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.211669921875, -0.20444107055664062, -0.19721221923828125, -0.18998336791992188, -0.1827545166015625, -0.17552566528320312, -0.16829681396484375, -0.16106796264648438, -0.153839111328125, -0.14661026000976562, -0.13938140869140625, -0.13215255737304688, -0.1249237060546875, -0.11769485473632812, -0.11046600341796875, -0.10323715209960938, -0.09600830078125, -0.08877944946289062, -0.08155059814453125, -0.07432174682617188, -0.0670928955078125, -0.059864044189453125, -0.05263519287109375, -0.045406341552734375, -0.038177490234375, -0.030948638916015625, -0.02371978759765625, -0.016490936279296875, -0.0092620849609375, -0.002033233642578125, 0.00519561767578125, 0.012424468994140625, 0.0196533203125, 0.026882171630859375, 0.03411102294921875, 0.041339874267578125, 0.0485687255859375, 0.055797576904296875, 0.06302642822265625, 0.07025527954101562, 0.077484130859375, 0.08471298217773438, 0.09194183349609375, 0.09917068481445312, 0.1063995361328125, 0.11362838745117188, 0.12085723876953125, 0.12808609008789062, 0.13531494140625, 0.14254379272460938, 0.14977264404296875, 0.15700149536132812, 0.1642303466796875, 0.17145919799804688, 0.17868804931640625, 0.18591690063476562, 0.193145751953125, 0.20037460327148438, 0.20760345458984375, 0.21483230590820312, 0.2220611572265625, 0.22929000854492188, 0.23651885986328125, 0.24374771118164062, 0.2509765625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 0.0, 3.0, 8.0, 5.0, 8.0, 6.0, 8.0, 28.0, 31.0, 48.0, 97.0, 193.0, 491.0, 1489.0, 13253.0, 804644.0, 219947.0, 6499.0, 1046.0, 351.0, 157.0, 89.0, 51.0, 29.0, 21.0, 8.0, 11.0, 7.0, 6.0, 6.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28759765625, -0.27857208251953125, -0.2695465087890625, -0.26052093505859375, -0.251495361328125, -0.24246978759765625, -0.2334442138671875, -0.22441864013671875, -0.21539306640625, -0.20636749267578125, -0.1973419189453125, -0.18831634521484375, -0.179290771484375, -0.17026519775390625, -0.1612396240234375, -0.15221405029296875, -0.1431884765625, -0.13416290283203125, -0.1251373291015625, -0.11611175537109375, -0.107086181640625, -0.09806060791015625, -0.0890350341796875, -0.08000946044921875, -0.07098388671875, -0.06195831298828125, -0.0529327392578125, -0.04390716552734375, -0.034881591796875, -0.02585601806640625, -0.0168304443359375, -0.00780487060546875, 0.001220703125, 0.01024627685546875, 0.0192718505859375, 0.02829742431640625, 0.037322998046875, 0.04634857177734375, 0.0553741455078125, 0.06439971923828125, 0.07342529296875, 0.08245086669921875, 0.0914764404296875, 0.10050201416015625, 0.109527587890625, 0.11855316162109375, 0.1275787353515625, 0.13660430908203125, 0.1456298828125, 0.15465545654296875, 0.1636810302734375, 0.17270660400390625, 0.181732177734375, 0.19075775146484375, 0.1997833251953125, 0.20880889892578125, 0.21783447265625, 0.22686004638671875, 0.2358856201171875, 0.24491119384765625, 0.253936767578125, 0.26296234130859375, 0.2719879150390625, 0.28101348876953125, 0.2900390625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 8.0, 8.0, 8.0, 10.0, 19.0, 21.0, 22.0, 32.0, 33.0, 32.0, 29.0, 37.0, 47.0, 35.0, 55.0, 53.0, 48.0, 51.0, 54.0, 36.0, 32.0, 33.0, 33.0, 38.0, 23.0, 27.0, 31.0, 22.0, 25.0, 18.0, 15.0, 16.0, 11.0, 10.0, 4.0, 5.0, 4.0, 1.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.221923828125, -0.21456527709960938, -0.20720672607421875, -0.19984817504882812, -0.1924896240234375, -0.18513107299804688, -0.17777252197265625, -0.17041397094726562, -0.163055419921875, -0.15569686889648438, -0.14833831787109375, -0.14097976684570312, -0.1336212158203125, -0.12626266479492188, -0.11890411376953125, -0.11154556274414062, -0.10418701171875, -0.09682846069335938, -0.08946990966796875, -0.08211135864257812, -0.0747528076171875, -0.06739425659179688, -0.06003570556640625, -0.052677154541015625, -0.045318603515625, -0.037960052490234375, -0.03060150146484375, -0.023242950439453125, -0.0158843994140625, -0.008525848388671875, -0.00116729736328125, 0.006191253662109375, 0.0135498046875, 0.020908355712890625, 0.02826690673828125, 0.035625457763671875, 0.0429840087890625, 0.050342559814453125, 0.05770111083984375, 0.06505966186523438, 0.072418212890625, 0.07977676391601562, 0.08713531494140625, 0.09449386596679688, 0.1018524169921875, 0.10921096801757812, 0.11656951904296875, 0.12392807006835938, 0.13128662109375, 0.13864517211914062, 0.14600372314453125, 0.15336227416992188, 0.1607208251953125, 0.16807937622070312, 0.17543792724609375, 0.18279647827148438, 0.190155029296875, 0.19751358032226562, 0.20487213134765625, 0.21223068237304688, 0.2195892333984375, 0.22694778442382812, 0.23430633544921875, 0.24166488647460938, 0.2490234375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 7.0, 19.0, 14.0, 24.0, 33.0, 64.0, 103.0, 255.0, 1063.0, 10755.0, 949727.0, 82892.0, 2758.0, 476.0, 160.0, 59.0, 40.0, 38.0, 15.0, 13.0, 9.0, 9.0, 5.0, 9.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1317138671875, -0.1272869110107422, -0.12285995483398438, -0.11843299865722656, -0.11400604248046875, -0.10957908630371094, -0.10515213012695312, -0.10072517395019531, -0.0962982177734375, -0.09187126159667969, -0.08744430541992188, -0.08301734924316406, -0.07859039306640625, -0.07416343688964844, -0.06973648071289062, -0.06530952453613281, -0.060882568359375, -0.05645561218261719, -0.052028656005859375, -0.04760169982910156, -0.04317474365234375, -0.03874778747558594, -0.034320831298828125, -0.029893875122070312, -0.0254669189453125, -0.021039962768554688, -0.016613006591796875, -0.012186050415039062, -0.00775909423828125, -0.0033321380615234375, 0.001094818115234375, 0.0055217742919921875, 0.00994873046875, 0.014375686645507812, 0.018802642822265625, 0.023229598999023438, 0.02765655517578125, 0.03208351135253906, 0.036510467529296875, 0.04093742370605469, 0.0453643798828125, 0.04979133605957031, 0.054218292236328125, 0.05864524841308594, 0.06307220458984375, 0.06749916076660156, 0.07192611694335938, 0.07635307312011719, 0.080780029296875, 0.08520698547363281, 0.08963394165039062, 0.09406089782714844, 0.09848785400390625, 0.10291481018066406, 0.10734176635742188, 0.11176872253417969, 0.1161956787109375, 0.12062263488769531, 0.12504959106445312, 0.12947654724121094, 0.13390350341796875, 0.13833045959472656, 0.14275741577148438, 0.1471843719482422, 0.151611328125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 3.0, 6.0, 8.0, 7.0, 7.0, 19.0, 24.0, 42.0, 68.0, 109.0, 195.0, 203.0, 129.0, 64.0, 34.0, 27.0, 13.0, 14.0, 12.0, 5.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2993812561035156e-05, -1.2575648725032806e-05, -1.2157484889030457e-05, -1.1739321053028107e-05, -1.1321157217025757e-05, -1.0902993381023407e-05, -1.0484829545021057e-05, -1.0066665709018707e-05, -9.648501873016357e-06, -9.230338037014008e-06, -8.812174201011658e-06, -8.394010365009308e-06, -7.975846529006958e-06, -7.557682693004608e-06, -7.139518857002258e-06, -6.7213550209999084e-06, -6.303191184997559e-06, -5.885027348995209e-06, -5.466863512992859e-06, -5.048699676990509e-06, -4.630535840988159e-06, -4.212372004985809e-06, -3.7942081689834595e-06, -3.3760443329811096e-06, -2.9578804969787598e-06, -2.53971666097641e-06, -2.12155282497406e-06, -1.7033889889717102e-06, -1.2852251529693604e-06, -8.670613169670105e-07, -4.4889748096466064e-07, -3.073364496231079e-08, 3.8743019104003906e-07, 8.055940270423889e-07, 1.2237578630447388e-06, 1.6419216990470886e-06, 2.0600855350494385e-06, 2.4782493710517883e-06, 2.896413207054138e-06, 3.314577043056488e-06, 3.732740879058838e-06, 4.150904715061188e-06, 4.569068551063538e-06, 4.9872323870658875e-06, 5.405396223068237e-06, 5.823560059070587e-06, 6.241723895072937e-06, 6.659887731075287e-06, 7.078051567077637e-06, 7.4962154030799866e-06, 7.914379239082336e-06, 8.332543075084686e-06, 8.750706911087036e-06, 9.168870747089386e-06, 9.587034583091736e-06, 1.0005198419094086e-05, 1.0423362255096436e-05, 1.0841526091098785e-05, 1.1259689927101135e-05, 1.1677853763103485e-05, 1.2096017599105835e-05, 1.2514181435108185e-05, 1.2932345271110535e-05, 1.3350509107112885e-05, 1.3768672943115234e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 8.0, 14.0, 14.0, 54.0, 103.0, 427.0, 2932.0, 647226.0, 394474.0, 2684.0, 397.0, 114.0, 40.0, 22.0, 13.0, 13.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1622314453125, -0.15517234802246094, -0.14811325073242188, -0.1410541534423828, -0.13399505615234375, -0.1269359588623047, -0.11987686157226562, -0.11281776428222656, -0.1057586669921875, -0.09869956970214844, -0.09164047241210938, -0.08458137512207031, -0.07752227783203125, -0.07046318054199219, -0.06340408325195312, -0.05634498596191406, -0.049285888671875, -0.04222679138183594, -0.035167694091796875, -0.028108596801757812, -0.02104949951171875, -0.013990402221679688, -0.006931304931640625, 0.0001277923583984375, 0.0071868896484375, 0.014245986938476562, 0.021305084228515625, 0.028364181518554688, 0.03542327880859375, 0.04248237609863281, 0.049541473388671875, 0.05660057067871094, 0.06365966796875, 0.07071876525878906, 0.07777786254882812, 0.08483695983886719, 0.09189605712890625, 0.09895515441894531, 0.10601425170898438, 0.11307334899902344, 0.1201324462890625, 0.12719154357910156, 0.13425064086914062, 0.1413097381591797, 0.14836883544921875, 0.1554279327392578, 0.16248703002929688, 0.16954612731933594, 0.176605224609375, 0.18366432189941406, 0.19072341918945312, 0.1977825164794922, 0.20484161376953125, 0.2119007110595703, 0.21895980834960938, 0.22601890563964844, 0.2330780029296875, 0.24013710021972656, 0.24719619750976562, 0.2542552947998047, 0.26131439208984375, 0.2683734893798828, 0.2754325866699219, 0.28249168395996094, 0.28955078125]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 7.0, 8.0, 12.0, 17.0, 44.0, 53.0, 115.0, 258.0, 231.0, 109.0, 56.0, 38.0, 13.0, 10.0, 6.0, 6.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.054962158203125, -0.05368375778198242, -0.052405357360839844, -0.051126956939697266, -0.04984855651855469, -0.04857015609741211, -0.04729175567626953, -0.04601335525512695, -0.044734954833984375, -0.0434565544128418, -0.04217815399169922, -0.04089975357055664, -0.03962135314941406, -0.038342952728271484, -0.037064552307128906, -0.03578615188598633, -0.03450775146484375, -0.03322935104370117, -0.031950950622558594, -0.030672550201416016, -0.029394149780273438, -0.02811574935913086, -0.02683734893798828, -0.025558948516845703, -0.024280548095703125, -0.023002147674560547, -0.02172374725341797, -0.02044534683227539, -0.019166946411132812, -0.017888545989990234, -0.016610145568847656, -0.015331745147705078, -0.0140533447265625, -0.012774944305419922, -0.011496543884277344, -0.010218143463134766, -0.008939743041992188, -0.007661342620849609, -0.006382942199707031, -0.005104541778564453, -0.003826141357421875, -0.002547740936279297, -0.0012693405151367188, 9.059906005859375e-06, 0.0012874603271484375, 0.0025658607482910156, 0.0038442611694335938, 0.005122661590576172, 0.00640106201171875, 0.007679462432861328, 0.008957862854003906, 0.010236263275146484, 0.011514663696289062, 0.01279306411743164, 0.014071464538574219, 0.015349864959716797, 0.016628265380859375, 0.017906665802001953, 0.01918506622314453, 0.02046346664428711, 0.021741867065429688, 0.023020267486572266, 0.024298667907714844, 0.025577068328857422, 0.02685546875]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 4.0, 7.0, 11.0, 12.0, 34.0, 74.0, 112.0, 183.0, 183.0, 145.0, 95.0, 52.0, 34.0, 22.0, 11.0, 7.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38317203521728516, -0.3685572147369385, -0.3539423644542694, -0.33932754397392273, -0.32471272349357605, -0.310097873210907, -0.2954830527305603, -0.2808682322502136, -0.26625341176986694, -0.25163859128952026, -0.2370237559080124, -0.22240892052650452, -0.20779410004615784, -0.19317926466464996, -0.1785644292831421, -0.1639496088027954, -0.14933475852012634, -0.13471992313861847, -0.12010510265827179, -0.10549026727676392, -0.09087543934583664, -0.07626061141490936, -0.06164577603340149, -0.04703094810247421, -0.032416120171546936, -0.01780129037797451, -0.0031864605844020844, 0.01142837107181549, 0.026043199002742767, 0.040658026933670044, 0.05527286231517792, 0.0698876902461052, 0.08450251817703247, 0.09911734610795975, 0.11373217403888702, 0.1283470094203949, 0.14296182990074158, 0.15757666528224945, 0.17219150066375732, 0.186806321144104, 0.20142115652561188, 0.21603599190711975, 0.23065081238746643, 0.2452656477689743, 0.2598804831504822, 0.27449530363082886, 0.28911012411117554, 0.3037249743938446, 0.3183397948741913, 0.33295461535453796, 0.34756946563720703, 0.3621842861175537, 0.3767991065979004, 0.39141392707824707, 0.40602877736091614, 0.4206435978412628, 0.4352584481239319, 0.44987326860427856, 0.46448811888694763, 0.4791029393672943, 0.493717759847641, 0.5083326101303101, 0.5229474306106567, 0.5375622510910034, 0.5521770715713501]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 1.0, 1.0, 3.0, 6.0, 4.0, 12.0, 10.0, 13.0, 13.0, 22.0, 22.0, 24.0, 21.0, 23.0, 36.0, 34.0, 43.0, 39.0, 26.0, 44.0, 44.0, 48.0, 51.0, 43.0, 29.0, 33.0, 40.0, 41.0, 30.0, 30.0, 24.0, 25.0, 25.0, 28.0, 20.0, 20.0, 12.0, 10.0, 10.0, 10.0, 6.0, 7.0, 5.0, 5.0, 5.0, 4.0, 3.0, 1.0, 0.0, 4.0, 0.0, 2.0], "bins": [-0.388520210981369, -0.37729737162590027, -0.3660745322704315, -0.35485169291496277, -0.343628853559494, -0.33240601420402527, -0.32118314504623413, -0.3099603056907654, -0.29873746633529663, -0.2875146269798279, -0.27629178762435913, -0.2650689482688904, -0.25384610891342163, -0.24262326955795288, -0.23140041530132294, -0.2201775759458542, -0.20895475149154663, -0.19773191213607788, -0.18650907278060913, -0.17528623342514038, -0.16406339406967163, -0.15284055471420288, -0.14161770045757294, -0.1303948611021042, -0.11917202174663544, -0.10794918239116669, -0.09672634303569794, -0.08550349622964859, -0.07428065687417984, -0.06305781751871109, -0.05183497071266174, -0.04061213135719299, -0.029389262199401855, -0.018166420981287956, -0.006943579763174057, 0.0042792633175849915, 0.015502102673053741, 0.02672494202852249, 0.03794778883457184, 0.04917062819004059, 0.06039346754550934, 0.07161630690097809, 0.08283914625644684, 0.09406199306249619, 0.10528483241796494, 0.11650767177343369, 0.12773051857948303, 0.13895335793495178, 0.15017619729042053, 0.16139903664588928, 0.17262187600135803, 0.18384471535682678, 0.19506755471229553, 0.20629039406776428, 0.21751324832439423, 0.22873608767986298, 0.23995892703533173, 0.25118178129196167, 0.2624046206474304, 0.27362746000289917, 0.2848502993583679, 0.29607313871383667, 0.3072959780693054, 0.31851881742477417, 0.3297416567802429]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 4.0, 3.0, 1.0, 12.0, 10.0, 10.0, 20.0, 26.0, 42.0, 53.0, 88.0, 155.0, 238.0, 417.0, 702.0, 1389.0, 2951.0, 7843.0, 32816.0, 368109.0, 3315159.0, 417360.0, 32846.0, 7895.0, 2997.0, 1382.0, 721.0, 400.0, 240.0, 145.0, 76.0, 60.0, 39.0, 33.0, 7.0, 14.0, 8.0, 8.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.226318359375, -0.2193584442138672, -0.21239852905273438, -0.20543861389160156, -0.19847869873046875, -0.19151878356933594, -0.18455886840820312, -0.1775989532470703, -0.1706390380859375, -0.1636791229248047, -0.15671920776367188, -0.14975929260253906, -0.14279937744140625, -0.13583946228027344, -0.12887954711914062, -0.12191963195800781, -0.114959716796875, -0.10799980163574219, -0.10103988647460938, -0.09407997131347656, -0.08712005615234375, -0.08016014099121094, -0.07320022583007812, -0.06624031066894531, -0.0592803955078125, -0.05232048034667969, -0.045360565185546875, -0.03840065002441406, -0.03144073486328125, -0.024480819702148438, -0.017520904541015625, -0.010560989379882812, -0.00360107421875, 0.0033588409423828125, 0.010318756103515625, 0.017278671264648438, 0.02423858642578125, 0.031198501586914062, 0.038158416748046875, 0.04511833190917969, 0.0520782470703125, 0.05903816223144531, 0.06599807739257812, 0.07295799255371094, 0.07991790771484375, 0.08687782287597656, 0.09383773803710938, 0.10079765319824219, 0.107757568359375, 0.11471748352050781, 0.12167739868164062, 0.12863731384277344, 0.13559722900390625, 0.14255714416503906, 0.14951705932617188, 0.1564769744873047, 0.1634368896484375, 0.1703968048095703, 0.17735671997070312, 0.18431663513183594, 0.19127655029296875, 0.19823646545410156, 0.20519638061523438, 0.2121562957763672, 0.2191162109375]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 5.0, 1.0, 3.0, 5.0, 8.0, 7.0, 11.0, 21.0, 14.0, 16.0, 34.0, 28.0, 29.0, 38.0, 47.0, 55.0, 49.0, 61.0, 52.0, 45.0, 71.0, 45.0, 55.0, 48.0, 44.0, 34.0, 31.0, 19.0, 31.0, 18.0, 20.0, 10.0, 19.0, 6.0, 2.0, 7.0, 2.0, 3.0, 5.0, 0.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.098876953125, -0.09499549865722656, -0.09111404418945312, -0.08723258972167969, -0.08335113525390625, -0.07946968078613281, -0.07558822631835938, -0.07170677185058594, -0.0678253173828125, -0.06394386291503906, -0.060062408447265625, -0.05618095397949219, -0.05229949951171875, -0.04841804504394531, -0.044536590576171875, -0.04065513610839844, -0.036773681640625, -0.03289222717285156, -0.029010772705078125, -0.025129318237304688, -0.02124786376953125, -0.017366409301757812, -0.013484954833984375, -0.009603500366210938, -0.0057220458984375, -0.0018405914306640625, 0.002040863037109375, 0.0059223175048828125, 0.00980377197265625, 0.013685226440429688, 0.017566680908203125, 0.021448135375976562, 0.02532958984375, 0.029211044311523438, 0.033092498779296875, 0.03697395324707031, 0.04085540771484375, 0.04473686218261719, 0.048618316650390625, 0.05249977111816406, 0.0563812255859375, 0.06026268005371094, 0.06414413452148438, 0.06802558898925781, 0.07190704345703125, 0.07578849792480469, 0.07966995239257812, 0.08355140686035156, 0.087432861328125, 0.09131431579589844, 0.09519577026367188, 0.09907722473144531, 0.10295867919921875, 0.10684013366699219, 0.11072158813476562, 0.11460304260253906, 0.1184844970703125, 0.12236595153808594, 0.12624740600585938, 0.1301288604736328, 0.13401031494140625, 0.1378917694091797, 0.14177322387695312, 0.14565467834472656, 0.1495361328125]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 8.0, 6.0, 13.0, 8.0, 18.0, 24.0, 37.0, 83.0, 107.0, 284.0, 622.0, 2225.0, 14292.0, 1135959.0, 3018251.0, 18474.0, 2569.0, 737.0, 272.0, 127.0, 64.0, 27.0, 22.0, 18.0, 3.0, 10.0, 6.0, 3.0, 7.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.322509765625, -0.3085212707519531, -0.29453277587890625, -0.2805442810058594, -0.2665557861328125, -0.2525672912597656, -0.23857879638671875, -0.22459030151367188, -0.210601806640625, -0.19661331176757812, -0.18262481689453125, -0.16863632202148438, -0.1546478271484375, -0.14065933227539062, -0.12667083740234375, -0.11268234252929688, -0.09869384765625, -0.08470535278320312, -0.07071685791015625, -0.056728363037109375, -0.0427398681640625, -0.028751373291015625, -0.01476287841796875, -0.000774383544921875, 0.013214111328125, 0.027202606201171875, 0.04119110107421875, 0.055179595947265625, 0.0691680908203125, 0.08315658569335938, 0.09714508056640625, 0.11113357543945312, 0.1251220703125, 0.13911056518554688, 0.15309906005859375, 0.16708755493164062, 0.1810760498046875, 0.19506454467773438, 0.20905303955078125, 0.22304153442382812, 0.237030029296875, 0.2510185241699219, 0.26500701904296875, 0.2789955139160156, 0.2929840087890625, 0.3069725036621094, 0.32096099853515625, 0.3349494934082031, 0.34893798828125, 0.3629264831542969, 0.37691497802734375, 0.3909034729003906, 0.4048919677734375, 0.4188804626464844, 0.43286895751953125, 0.4468574523925781, 0.460845947265625, 0.4748344421386719, 0.48882293701171875, 0.5028114318847656, 0.5167999267578125, 0.5307884216308594, 0.5447769165039062, 0.5587654113769531, 0.57275390625]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 3.0, 3.0, 7.0, 7.0, 9.0, 10.0, 14.0, 35.0, 38.0, 99.0, 180.0, 313.0, 693.0, 1059.0, 753.0, 366.0, 180.0, 94.0, 75.0, 35.0, 26.0, 17.0, 15.0, 12.0, 7.0, 6.0, 9.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0906982421875, -0.0885167121887207, -0.0863351821899414, -0.08415365219116211, -0.08197212219238281, -0.07979059219360352, -0.07760906219482422, -0.07542753219604492, -0.07324600219726562, -0.07106447219848633, -0.06888294219970703, -0.06670141220092773, -0.06451988220214844, -0.06233835220336914, -0.060156822204589844, -0.05797529220581055, -0.05579376220703125, -0.05361223220825195, -0.051430702209472656, -0.04924917221069336, -0.04706764221191406, -0.044886112213134766, -0.04270458221435547, -0.04052305221557617, -0.038341522216796875, -0.03615999221801758, -0.03397846221923828, -0.031796932220458984, -0.029615402221679688, -0.02743387222290039, -0.025252342224121094, -0.023070812225341797, -0.0208892822265625, -0.018707752227783203, -0.016526222229003906, -0.01434469223022461, -0.012163162231445312, -0.009981632232666016, -0.007800102233886719, -0.005618572235107422, -0.003437042236328125, -0.0012555122375488281, 0.0009260177612304688, 0.0031075477600097656, 0.0052890777587890625, 0.007470607757568359, 0.009652137756347656, 0.011833667755126953, 0.01401519775390625, 0.016196727752685547, 0.018378257751464844, 0.02055978775024414, 0.022741317749023438, 0.024922847747802734, 0.02710437774658203, 0.029285907745361328, 0.031467437744140625, 0.03364896774291992, 0.03583049774169922, 0.038012027740478516, 0.04019355773925781, 0.04237508773803711, 0.044556617736816406, 0.0467381477355957, 0.048919677734375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 6.0, 5.0, 9.0, 19.0, 38.0, 83.0, 119.0, 174.0, 186.0, 148.0, 85.0, 64.0, 37.0, 9.0, 9.0, 4.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4136539697647095, -0.4022037088871002, -0.39075344800949097, -0.3793031871318817, -0.36785292625427246, -0.3564026653766632, -0.34495240449905396, -0.3335021436214447, -0.32205188274383545, -0.3106016218662262, -0.29915136098861694, -0.2877011001110077, -0.27625083923339844, -0.2648005783557892, -0.25335031747817993, -0.24190005660057068, -0.23044981062412262, -0.21899954974651337, -0.2075492888689041, -0.19609902799129486, -0.1846487671136856, -0.17319850623607635, -0.1617482602596283, -0.15029799938201904, -0.1388477385044098, -0.12739747762680054, -0.11594721674919128, -0.10449695587158203, -0.09304669499397278, -0.08159643411636353, -0.07014618068933487, -0.058695919811725616, -0.04724565148353577, -0.035795390605926514, -0.02434513159096241, -0.012894872575998306, -0.0014446116983890533, 0.0100056491792202, 0.021455906331539154, 0.03290616720914841, 0.04435642808675766, 0.05580668896436691, 0.06725694984197617, 0.07870720326900482, 0.09015746414661407, 0.10160772502422333, 0.11305798590183258, 0.12450824677944183, 0.1359585076570511, 0.14740876853466034, 0.1588590294122696, 0.17030929028987885, 0.1817595511674881, 0.19320981204509735, 0.2046600580215454, 0.21611031889915466, 0.22756057977676392, 0.23901084065437317, 0.2504611015319824, 0.2619113624095917, 0.2733616232872009, 0.2848118841648102, 0.29626214504241943, 0.3077124059200287, 0.31916266679763794]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 4.0, 7.0, 13.0, 8.0, 12.0, 12.0, 20.0, 23.0, 22.0, 35.0, 38.0, 31.0, 41.0, 39.0, 52.0, 27.0, 52.0, 47.0, 45.0, 44.0, 46.0, 46.0, 50.0, 47.0, 42.0, 35.0, 22.0, 38.0, 28.0, 15.0, 12.0, 6.0, 10.0, 4.0, 4.0, 7.0, 7.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11764003336429596, -0.11358009278774261, -0.10952015221118927, -0.10546021908521652, -0.10140027850866318, -0.09734033793210983, -0.09328040480613708, -0.08922046422958374, -0.0851605236530304, -0.08110058307647705, -0.0770406424999237, -0.07298070937395096, -0.06892076879739761, -0.06486082822084427, -0.06080089136958122, -0.056740954518318176, -0.05268101394176483, -0.04862107336521149, -0.04456113651394844, -0.040501199662685394, -0.03644125908613205, -0.032381318509578705, -0.02832138165831566, -0.024261442944407463, -0.020201504230499268, -0.016141565516591072, -0.012081626802682877, -0.008021688088774681, -0.003961749374866486, 9.81893390417099e-05, 0.004158128052949905, 0.008218066766858101, 0.01227802038192749, 0.016337959095835686, 0.02039789780974388, 0.024457836523652077, 0.028517775237560272, 0.03257771581411362, 0.03663765266537666, 0.04069758951663971, 0.044757530093193054, 0.0488174706697464, 0.052877407521009445, 0.05693734437227249, 0.060997284948825836, 0.06505722552537918, 0.06911715865135193, 0.07317709922790527, 0.07723703980445862, 0.08129698038101196, 0.08535692095756531, 0.08941685408353806, 0.0934767946600914, 0.09753673523664474, 0.10159666836261749, 0.10565660893917084, 0.10971654951572418, 0.11377649009227753, 0.11783643066883087, 0.12189636379480362, 0.12595629692077637, 0.1300162374973297, 0.13407617807388306, 0.1381361186504364, 0.14219605922698975]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 7.0, 8.0, 13.0, 11.0, 26.0, 29.0, 47.0, 73.0, 103.0, 164.0, 262.0, 395.0, 683.0, 1109.0, 1945.0, 3831.0, 8066.0, 21199.0, 95432.0, 613053.0, 241798.0, 37204.0, 11746.0, 5067.0, 2632.0, 1531.0, 825.0, 466.0, 288.0, 165.0, 138.0, 83.0, 48.0, 50.0, 19.0, 9.0, 9.0, 4.0, 6.0, 3.0, 2.0, 5.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.045806884765625, -0.04415416717529297, -0.04250144958496094, -0.040848731994628906, -0.039196014404296875, -0.037543296813964844, -0.03589057922363281, -0.03423786163330078, -0.03258514404296875, -0.03093242645263672, -0.029279708862304688, -0.027626991271972656, -0.025974273681640625, -0.024321556091308594, -0.022668838500976562, -0.02101612091064453, -0.0193634033203125, -0.01771068572998047, -0.016057968139648438, -0.014405250549316406, -0.012752532958984375, -0.011099815368652344, -0.009447097778320312, -0.007794380187988281, -0.00614166259765625, -0.004488945007324219, -0.0028362274169921875, -0.0011835098266601562, 0.000469207763671875, 0.0021219253540039062, 0.0037746429443359375, 0.005427360534667969, 0.007080078125, 0.008732795715332031, 0.010385513305664062, 0.012038230895996094, 0.013690948486328125, 0.015343666076660156, 0.016996383666992188, 0.01864910125732422, 0.02030181884765625, 0.02195453643798828, 0.023607254028320312, 0.025259971618652344, 0.026912689208984375, 0.028565406799316406, 0.030218124389648438, 0.03187084197998047, 0.0335235595703125, 0.03517627716064453, 0.03682899475097656, 0.038481712341308594, 0.040134429931640625, 0.041787147521972656, 0.04343986511230469, 0.04509258270263672, 0.04674530029296875, 0.04839801788330078, 0.05005073547363281, 0.051703453063964844, 0.053356170654296875, 0.055008888244628906, 0.05666160583496094, 0.05831432342529297, 0.059967041015625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 9.0, 9.0, 9.0, 14.0, 16.0, 30.0, 28.0, 34.0, 50.0, 55.0, 55.0, 61.0, 67.0, 70.0, 58.0, 66.0, 57.0, 61.0, 55.0, 44.0, 42.0, 35.0, 24.0, 12.0, 9.0, 10.0, 6.0, 7.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09808349609375, -0.09442615509033203, -0.09076881408691406, -0.0871114730834961, -0.08345413208007812, -0.07979679107666016, -0.07613945007324219, -0.07248210906982422, -0.06882476806640625, -0.06516742706298828, -0.06151008605957031, -0.057852745056152344, -0.054195404052734375, -0.050538063049316406, -0.04688072204589844, -0.04322338104248047, -0.0395660400390625, -0.03590869903564453, -0.03225135803222656, -0.028594017028808594, -0.024936676025390625, -0.021279335021972656, -0.017621994018554688, -0.013964653015136719, -0.01030731201171875, -0.006649971008300781, -0.0029926300048828125, 0.0006647109985351562, 0.004322052001953125, 0.007979393005371094, 0.011636734008789062, 0.015294075012207031, 0.018951416015625, 0.02260875701904297, 0.026266098022460938, 0.029923439025878906, 0.033580780029296875, 0.037238121032714844, 0.04089546203613281, 0.04455280303955078, 0.04821014404296875, 0.05186748504638672, 0.05552482604980469, 0.059182167053222656, 0.06283950805664062, 0.0664968490600586, 0.07015419006347656, 0.07381153106689453, 0.0774688720703125, 0.08112621307373047, 0.08478355407714844, 0.0884408950805664, 0.09209823608398438, 0.09575557708740234, 0.09941291809082031, 0.10307025909423828, 0.10672760009765625, 0.11038494110107422, 0.11404228210449219, 0.11769962310791016, 0.12135696411132812, 0.1250143051147461, 0.12867164611816406, 0.13232898712158203, 0.135986328125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 4.0, 5.0, 4.0, 10.0, 11.0, 15.0, 16.0, 28.0, 43.0, 77.0, 166.0, 286.0, 731.0, 1802.0, 5298.0, 23853.0, 446803.0, 533094.0, 27334.0, 5687.0, 1897.0, 727.0, 296.0, 148.0, 82.0, 40.0, 32.0, 18.0, 13.0, 2.0, 7.0, 5.0, 4.0, 2.0, 2.0, 3.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.08599853515625, -0.08367633819580078, -0.08135414123535156, -0.07903194427490234, -0.07670974731445312, -0.0743875503540039, -0.07206535339355469, -0.06974315643310547, -0.06742095947265625, -0.06509876251220703, -0.06277656555175781, -0.060454368591308594, -0.058132171630859375, -0.055809974670410156, -0.05348777770996094, -0.05116558074951172, -0.0488433837890625, -0.04652118682861328, -0.04419898986816406, -0.041876792907714844, -0.039554595947265625, -0.037232398986816406, -0.03491020202636719, -0.03258800506591797, -0.03026580810546875, -0.02794361114501953, -0.025621414184570312, -0.023299217224121094, -0.020977020263671875, -0.018654823303222656, -0.016332626342773438, -0.014010429382324219, -0.011688232421875, -0.009366035461425781, -0.0070438385009765625, -0.004721641540527344, -0.002399444580078125, -7.724761962890625e-05, 0.0022449493408203125, 0.004567146301269531, 0.00688934326171875, 0.009211540222167969, 0.011533737182617188, 0.013855934143066406, 0.016178131103515625, 0.018500328063964844, 0.020822525024414062, 0.02314472198486328, 0.0254669189453125, 0.02778911590576172, 0.030111312866210938, 0.032433509826660156, 0.034755706787109375, 0.037077903747558594, 0.03940010070800781, 0.04172229766845703, 0.04404449462890625, 0.04636669158935547, 0.04868888854980469, 0.051011085510253906, 0.053333282470703125, 0.055655479431152344, 0.05797767639160156, 0.06029987335205078, 0.0626220703125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 4.0, 10.0, 12.0, 10.0, 15.0, 11.0, 19.0, 20.0, 30.0, 26.0, 38.0, 36.0, 25.0, 52.0, 48.0, 46.0, 33.0, 40.0, 57.0, 45.0, 35.0, 46.0, 53.0, 39.0, 38.0, 35.0, 30.0, 27.0, 30.0, 18.0, 22.0, 8.0, 12.0, 3.0, 7.0, 6.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1611328125, -0.1559123992919922, -0.15069198608398438, -0.14547157287597656, -0.14025115966796875, -0.13503074645996094, -0.12981033325195312, -0.12458992004394531, -0.1193695068359375, -0.11414909362792969, -0.10892868041992188, -0.10370826721191406, -0.09848785400390625, -0.09326744079589844, -0.08804702758789062, -0.08282661437988281, -0.077606201171875, -0.07238578796386719, -0.06716537475585938, -0.06194496154785156, -0.05672454833984375, -0.05150413513183594, -0.046283721923828125, -0.04106330871582031, -0.0358428955078125, -0.030622482299804688, -0.025402069091796875, -0.020181655883789062, -0.01496124267578125, -0.009740829467773438, -0.004520416259765625, 0.0006999969482421875, 0.00592041015625, 0.011140823364257812, 0.016361236572265625, 0.021581649780273438, 0.02680206298828125, 0.03202247619628906, 0.037242889404296875, 0.04246330261230469, 0.0476837158203125, 0.05290412902832031, 0.058124542236328125, 0.06334495544433594, 0.06856536865234375, 0.07378578186035156, 0.07900619506835938, 0.08422660827636719, 0.089447021484375, 0.09466743469238281, 0.09988784790039062, 0.10510826110839844, 0.11032867431640625, 0.11554908752441406, 0.12076950073242188, 0.1259899139404297, 0.1312103271484375, 0.1364307403564453, 0.14165115356445312, 0.14687156677246094, 0.15209197998046875, 0.15731239318847656, 0.16253280639648438, 0.1677532196044922, 0.1729736328125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 3.0, 6.0, 8.0, 11.0, 10.0, 17.0, 18.0, 33.0, 42.0, 78.0, 123.0, 239.0, 357.0, 811.0, 1981.0, 5821.0, 22293.0, 145021.0, 697981.0, 142005.0, 22020.0, 5768.0, 2074.0, 846.0, 440.0, 218.0, 117.0, 56.0, 52.0, 32.0, 22.0, 12.0, 14.0, 5.0, 2.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0153045654296875, -0.014802694320678711, -0.014300823211669922, -0.013798952102661133, -0.013297080993652344, -0.012795209884643555, -0.012293338775634766, -0.011791467666625977, -0.011289596557617188, -0.010787725448608398, -0.01028585433959961, -0.00978398323059082, -0.009282112121582031, -0.008780241012573242, -0.008278369903564453, -0.007776498794555664, -0.007274627685546875, -0.006772756576538086, -0.006270885467529297, -0.005769014358520508, -0.005267143249511719, -0.00476527214050293, -0.004263401031494141, -0.0037615299224853516, -0.0032596588134765625, -0.0027577877044677734, -0.0022559165954589844, -0.0017540454864501953, -0.0012521743774414062, -0.0007503032684326172, -0.0002484321594238281, 0.00025343894958496094, 0.00075531005859375, 0.001257181167602539, 0.0017590522766113281, 0.002260923385620117, 0.0027627944946289062, 0.0032646656036376953, 0.0037665367126464844, 0.0042684078216552734, 0.0047702789306640625, 0.0052721500396728516, 0.005774021148681641, 0.00627589225769043, 0.006777763366699219, 0.007279634475708008, 0.007781505584716797, 0.008283376693725586, 0.008785247802734375, 0.009287118911743164, 0.009788990020751953, 0.010290861129760742, 0.010792732238769531, 0.01129460334777832, 0.01179647445678711, 0.012298345565795898, 0.012800216674804688, 0.013302087783813477, 0.013803958892822266, 0.014305830001831055, 0.014807701110839844, 0.015309572219848633, 0.015811443328857422, 0.01631331443786621, 0.016815185546875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 2.0, 2.0, 8.0, 8.0, 13.0, 19.0, 16.0, 24.0, 39.0, 47.0, 56.0, 47.0, 69.0, 74.0, 81.0, 98.0, 74.0, 65.0, 63.0, 38.0, 32.0, 28.0, 23.0, 17.0, 10.0, 11.0, 7.0, 4.0, 3.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0067901611328125e-06, -4.827044904232025e-06, -4.647299647331238e-06, -4.4675543904304504e-06, -4.287809133529663e-06, -4.108063876628876e-06, -3.928318619728088e-06, -3.748573362827301e-06, -3.5688281059265137e-06, -3.3890828490257263e-06, -3.209337592124939e-06, -3.0295923352241516e-06, -2.8498470783233643e-06, -2.670101821422577e-06, -2.4903565645217896e-06, -2.310611307621002e-06, -2.130866050720215e-06, -1.9511207938194275e-06, -1.7713755369186401e-06, -1.5916302800178528e-06, -1.4118850231170654e-06, -1.232139766216278e-06, -1.0523945093154907e-06, -8.726492524147034e-07, -6.92903995513916e-07, -5.131587386131287e-07, -3.334134817123413e-07, -1.5366822481155396e-07, 2.60770320892334e-08, 2.0582228899002075e-07, 3.855675458908081e-07, 5.653128027915955e-07, 7.450580596923828e-07, 9.248033165931702e-07, 1.1045485734939575e-06, 1.2842938303947449e-06, 1.4640390872955322e-06, 1.6437843441963196e-06, 1.823529601097107e-06, 2.0032748579978943e-06, 2.1830201148986816e-06, 2.362765371799469e-06, 2.5425106287002563e-06, 2.7222558856010437e-06, 2.902001142501831e-06, 3.0817463994026184e-06, 3.2614916563034058e-06, 3.441236913204193e-06, 3.6209821701049805e-06, 3.800727427005768e-06, 3.980472683906555e-06, 4.1602179408073425e-06, 4.33996319770813e-06, 4.519708454608917e-06, 4.699453711509705e-06, 4.879198968410492e-06, 5.058944225311279e-06, 5.238689482212067e-06, 5.418434739112854e-06, 5.598179996013641e-06, 5.777925252914429e-06, 5.957670509815216e-06, 6.137415766716003e-06, 6.317161023616791e-06, 6.496906280517578e-06]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 7.0, 4.0, 11.0, 15.0, 11.0, 25.0, 39.0, 39.0, 71.0, 128.0, 194.0, 319.0, 553.0, 996.0, 2093.0, 4895.0, 14299.0, 59439.0, 363697.0, 487548.0, 84442.0, 18577.0, 6012.0, 2388.0, 1153.0, 644.0, 384.0, 198.0, 125.0, 89.0, 52.0, 33.0, 28.0, 13.0, 14.0, 6.0, 6.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01465606689453125, -0.014213323593139648, -0.013770580291748047, -0.013327836990356445, -0.012885093688964844, -0.012442350387573242, -0.01199960708618164, -0.011556863784790039, -0.011114120483398438, -0.010671377182006836, -0.010228633880615234, -0.009785890579223633, -0.009343147277832031, -0.00890040397644043, -0.008457660675048828, -0.008014917373657227, -0.007572174072265625, -0.0071294307708740234, -0.006686687469482422, -0.00624394416809082, -0.005801200866699219, -0.005358457565307617, -0.004915714263916016, -0.004472970962524414, -0.0040302276611328125, -0.003587484359741211, -0.0031447410583496094, -0.002701997756958008, -0.0022592544555664062, -0.0018165111541748047, -0.0013737678527832031, -0.0009310245513916016, -0.00048828125, -4.553794860839844e-05, 0.0003972053527832031, 0.0008399486541748047, 0.0012826919555664062, 0.0017254352569580078, 0.0021681785583496094, 0.002610921859741211, 0.0030536651611328125, 0.003496408462524414, 0.003939151763916016, 0.004381895065307617, 0.004824638366699219, 0.00526738166809082, 0.005710124969482422, 0.0061528682708740234, 0.006595611572265625, 0.0070383548736572266, 0.007481098175048828, 0.00792384147644043, 0.008366584777832031, 0.008809328079223633, 0.009252071380615234, 0.009694814682006836, 0.010137557983398438, 0.010580301284790039, 0.01102304458618164, 0.011465787887573242, 0.011908531188964844, 0.012351274490356445, 0.012794017791748047, 0.013236761093139648, 0.01367950439453125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 7.0, 4.0, 8.0, 11.0, 19.0, 25.0, 29.0, 35.0, 46.0, 54.0, 74.0, 94.0, 101.0, 82.0, 72.0, 75.0, 55.0, 54.0, 44.0, 28.0, 16.0, 19.0, 14.0, 7.0, 6.0, 4.0, 5.0, 4.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00290679931640625, -0.0027904510498046875, -0.002674102783203125, -0.0025577545166015625, -0.00244140625, -0.0023250579833984375, -0.002208709716796875, -0.0020923614501953125, -0.00197601318359375, -0.0018596649169921875, -0.001743316650390625, -0.0016269683837890625, -0.0015106201171875, -0.0013942718505859375, -0.001277923583984375, -0.0011615753173828125, -0.00104522705078125, -0.0009288787841796875, -0.000812530517578125, -0.0006961822509765625, -0.000579833984375, -0.0004634857177734375, -0.000347137451171875, -0.0002307891845703125, -0.00011444091796875, 1.9073486328125e-06, 0.000118255615234375, 0.0002346038818359375, 0.0003509521484375, 0.0004673004150390625, 0.000583648681640625, 0.0006999969482421875, 0.00081634521484375, 0.0009326934814453125, 0.001049041748046875, 0.0011653900146484375, 0.00128173828125, 0.0013980865478515625, 0.001514434814453125, 0.0016307830810546875, 0.00174713134765625, 0.0018634796142578125, 0.001979827880859375, 0.0020961761474609375, 0.0022125244140625, 0.0023288726806640625, 0.002445220947265625, 0.0025615692138671875, 0.00267791748046875, 0.0027942657470703125, 0.002910614013671875, 0.0030269622802734375, 0.003143310546875, 0.0032596588134765625, 0.003376007080078125, 0.0034923553466796875, 0.00360870361328125, 0.0037250518798828125, 0.003841400146484375, 0.0039577484130859375, 0.0040740966796875, 0.0041904449462890625, 0.004306793212890625, 0.0044231414794921875, 0.00453948974609375]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 10.0, 13.0, 31.0, 88.0, 160.0, 228.0, 214.0, 129.0, 68.0, 24.0, 18.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31877464056015015, -0.3103354275226593, -0.30189621448516846, -0.29345703125, -0.28501781821250916, -0.2765786051750183, -0.26813939213752747, -0.2597001791000366, -0.25126099586486816, -0.24282178282737732, -0.23438258469104767, -0.22594337165355682, -0.21750417351722717, -0.20906496047973633, -0.20062574744224548, -0.19218653440475464, -0.1837473213672638, -0.17530810832977295, -0.1668689101934433, -0.15842969715595245, -0.1499904990196228, -0.14155128598213196, -0.1331120729446411, -0.12467286735773087, -0.11623366177082062, -0.10779445618391037, -0.09935525059700012, -0.09091603755950928, -0.08247683197259903, -0.07403762638568878, -0.06559841334819794, -0.05715920776128769, -0.04871998727321625, -0.040280781686306, -0.031841572374105453, -0.023402364924550056, -0.01496315747499466, -0.006523951888084412, 0.0019152574241161346, 0.010354466736316681, 0.01879367232322693, 0.027232879772782326, 0.03567208722233772, 0.04411129653453827, 0.05255050212144852, 0.060989707708358765, 0.06942892074584961, 0.07786812633275986, 0.0863073319196701, 0.09474653750658035, 0.1031857430934906, 0.11162495613098145, 0.1200641617178917, 0.12850336730480194, 0.13694258034229279, 0.14538177847862244, 0.15382099151611328, 0.16226020455360413, 0.17069940268993378, 0.17913861572742462, 0.18757781386375427, 0.19601702690124512, 0.20445623993873596, 0.2128954529762268, 0.22133465111255646]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 8.0, 3.0, 12.0, 11.0, 10.0, 24.0, 33.0, 33.0, 50.0, 40.0, 56.0, 61.0, 52.0, 60.0, 69.0, 56.0, 59.0, 52.0, 64.0, 61.0, 37.0, 38.0, 40.0, 12.0, 15.0, 13.0, 7.0, 10.0, 3.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08594147861003876, -0.08259603381156921, -0.07925058156251907, -0.07590513676404953, -0.07255969196557999, -0.06921423971652985, -0.0658687949180603, -0.06252335011959076, -0.059177905321121216, -0.055832456797361374, -0.05248701199889183, -0.04914156347513199, -0.045796118676662445, -0.0424506701529026, -0.03910522162914276, -0.03575977683067322, -0.032414328306913376, -0.029068881645798683, -0.02572343498468399, -0.02237798646092415, -0.019032541662454605, -0.015687093138694763, -0.01234164647758007, -0.008996199816465378, -0.005650753155350685, -0.0023053062614053488, 0.0010401406325399876, 0.0043855877593159676, 0.00773103442043066, 0.011076482012867928, 0.01442192867398262, 0.017767375335097313, 0.021112821996212006, 0.0244582686573267, 0.02780371531844139, 0.031149163842201233, 0.034494608640670776, 0.03784005716443062, 0.04118550568819046, 0.044530950486660004, 0.04787639528512955, 0.05122184380888939, 0.05456728860735893, 0.057912737131118774, 0.06125818192958832, 0.06460362672805786, 0.067949078977108, 0.07129452377557755, 0.07463997602462769, 0.07798542082309723, 0.08133087307214737, 0.08467631787061691, 0.08802176266908646, 0.0913672149181366, 0.09471265971660614, 0.09805810451507568, 0.10140354931354523, 0.10474899411201477, 0.10809444636106491, 0.11143989115953445, 0.114785335958004, 0.11813078820705414, 0.12147623300552368, 0.12482167780399323, 0.12816712260246277]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 4.0, 5.0, 10.0, 9.0, 12.0, 16.0, 17.0, 36.0, 47.0, 77.0, 132.0, 217.0, 279.0, 470.0, 882.0, 1543.0, 2943.0, 6018.0, 13143.0, 35739.0, 171263.0, 680459.0, 89537.0, 25209.0, 10287.0, 4636.0, 2391.0, 1259.0, 724.0, 455.0, 250.0, 161.0, 116.0, 67.0, 44.0, 29.0, 24.0, 14.0, 12.0, 8.0, 8.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09271240234375, -0.08932113647460938, -0.08592987060546875, -0.08253860473632812, -0.0791473388671875, -0.07575607299804688, -0.07236480712890625, -0.06897354125976562, -0.065582275390625, -0.062191009521484375, -0.05879974365234375, -0.055408477783203125, -0.0520172119140625, -0.048625946044921875, -0.04523468017578125, -0.041843414306640625, -0.0384521484375, -0.035060882568359375, -0.03166961669921875, -0.028278350830078125, -0.0248870849609375, -0.021495819091796875, -0.01810455322265625, -0.014713287353515625, -0.011322021484375, -0.007930755615234375, -0.00453948974609375, -0.001148223876953125, 0.0022430419921875, 0.005634307861328125, 0.00902557373046875, 0.012416839599609375, 0.01580810546875, 0.019199371337890625, 0.02259063720703125, 0.025981903076171875, 0.0293731689453125, 0.032764434814453125, 0.03615570068359375, 0.039546966552734375, 0.042938232421875, 0.046329498291015625, 0.04972076416015625, 0.053112030029296875, 0.0565032958984375, 0.059894561767578125, 0.06328582763671875, 0.06667709350585938, 0.070068359375, 0.07345962524414062, 0.07685089111328125, 0.08024215698242188, 0.0836334228515625, 0.08702468872070312, 0.09041595458984375, 0.09380722045898438, 0.097198486328125, 0.10058975219726562, 0.10398101806640625, 0.10737228393554688, 0.1107635498046875, 0.11415481567382812, 0.11754608154296875, 0.12093734741210938, 0.12432861328125]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 2.0, 5.0, 4.0, 7.0, 8.0, 8.0, 16.0, 18.0, 17.0, 31.0, 39.0, 39.0, 46.0, 59.0, 50.0, 65.0, 66.0, 45.0, 56.0, 57.0, 55.0, 61.0, 56.0, 37.0, 35.0, 33.0, 19.0, 23.0, 7.0, 8.0, 9.0, 5.0, 5.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1820068359375, -0.17581939697265625, -0.1696319580078125, -0.16344451904296875, -0.157257080078125, -0.15106964111328125, -0.1448822021484375, -0.13869476318359375, -0.13250732421875, -0.12631988525390625, -0.1201324462890625, -0.11394500732421875, -0.107757568359375, -0.10157012939453125, -0.0953826904296875, -0.08919525146484375, -0.0830078125, -0.07682037353515625, -0.0706329345703125, -0.06444549560546875, -0.058258056640625, -0.05207061767578125, -0.0458831787109375, -0.03969573974609375, -0.03350830078125, -0.02732086181640625, -0.0211334228515625, -0.01494598388671875, -0.008758544921875, -0.00257110595703125, 0.0036163330078125, 0.00980377197265625, 0.0159912109375, 0.02217864990234375, 0.0283660888671875, 0.03455352783203125, 0.040740966796875, 0.04692840576171875, 0.0531158447265625, 0.05930328369140625, 0.06549072265625, 0.07167816162109375, 0.0778656005859375, 0.08405303955078125, 0.090240478515625, 0.09642791748046875, 0.1026153564453125, 0.10880279541015625, 0.114990234375, 0.12117767333984375, 0.1273651123046875, 0.13355255126953125, 0.139739990234375, 0.14592742919921875, 0.1521148681640625, 0.15830230712890625, 0.16448974609375, 0.17067718505859375, 0.1768646240234375, 0.18305206298828125, 0.189239501953125, 0.19542694091796875, 0.2016143798828125, 0.20780181884765625, 0.2139892578125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0, 5.0, 8.0, 7.0, 14.0, 21.0, 12.0, 26.0, 20.0, 22.0, 36.0, 45.0, 60.0, 83.0, 120.0, 151.0, 178.0, 251.0, 390.0, 841.0, 3050.0, 16699.0, 630274.0, 377084.0, 14148.0, 2695.0, 823.0, 396.0, 251.0, 182.0, 152.0, 125.0, 64.0, 84.0, 48.0, 47.0, 46.0, 24.0, 22.0, 19.0, 10.0, 5.0, 5.0, 8.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2342529296875, -0.22643470764160156, -0.21861648559570312, -0.2107982635498047, -0.20298004150390625, -0.1951618194580078, -0.18734359741210938, -0.17952537536621094, -0.1717071533203125, -0.16388893127441406, -0.15607070922851562, -0.1482524871826172, -0.14043426513671875, -0.1326160430908203, -0.12479782104492188, -0.11697959899902344, -0.109161376953125, -0.10134315490722656, -0.09352493286132812, -0.08570671081542969, -0.07788848876953125, -0.07007026672363281, -0.062252044677734375, -0.05443382263183594, -0.0466156005859375, -0.03879737854003906, -0.030979156494140625, -0.023160934448242188, -0.01534271240234375, -0.0075244903564453125, 0.000293731689453125, 0.008111953735351562, 0.01593017578125, 0.023748397827148438, 0.031566619873046875, 0.03938484191894531, 0.04720306396484375, 0.05502128601074219, 0.06283950805664062, 0.07065773010253906, 0.0784759521484375, 0.08629417419433594, 0.09411239624023438, 0.10193061828613281, 0.10974884033203125, 0.11756706237792969, 0.12538528442382812, 0.13320350646972656, 0.141021728515625, 0.14883995056152344, 0.15665817260742188, 0.1644763946533203, 0.17229461669921875, 0.1801128387451172, 0.18793106079101562, 0.19574928283691406, 0.2035675048828125, 0.21138572692871094, 0.21920394897460938, 0.2270221710205078, 0.23484039306640625, 0.2426586151123047, 0.2504768371582031, 0.25829505920410156, 0.26611328125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 1.0, 5.0, 7.0, 4.0, 8.0, 5.0, 8.0, 13.0, 11.0, 23.0, 24.0, 21.0, 17.0, 26.0, 26.0, 40.0, 23.0, 46.0, 39.0, 34.0, 44.0, 48.0, 42.0, 41.0, 48.0, 46.0, 36.0, 31.0, 32.0, 29.0, 20.0, 20.0, 27.0, 22.0, 24.0, 29.0, 18.0, 13.0, 14.0, 5.0, 9.0, 4.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 4.0], "bins": [-0.1719970703125, -0.16673660278320312, -0.16147613525390625, -0.15621566772460938, -0.1509552001953125, -0.14569473266601562, -0.14043426513671875, -0.13517379760742188, -0.129913330078125, -0.12465286254882812, -0.11939239501953125, -0.11413192749023438, -0.1088714599609375, -0.10361099243164062, -0.09835052490234375, -0.09309005737304688, -0.08782958984375, -0.08256912231445312, -0.07730865478515625, -0.07204818725585938, -0.0667877197265625, -0.061527252197265625, -0.05626678466796875, -0.051006317138671875, -0.045745849609375, -0.040485382080078125, -0.03522491455078125, -0.029964447021484375, -0.0247039794921875, -0.019443511962890625, -0.01418304443359375, -0.008922576904296875, -0.003662109375, 0.001598358154296875, 0.00685882568359375, 0.012119293212890625, 0.0173797607421875, 0.022640228271484375, 0.02790069580078125, 0.033161163330078125, 0.038421630859375, 0.043682098388671875, 0.04894256591796875, 0.054203033447265625, 0.0594635009765625, 0.06472396850585938, 0.06998443603515625, 0.07524490356445312, 0.08050537109375, 0.08576583862304688, 0.09102630615234375, 0.09628677368164062, 0.1015472412109375, 0.10680770874023438, 0.11206817626953125, 0.11732864379882812, 0.122589111328125, 0.12784957885742188, 0.13311004638671875, 0.13837051391601562, 0.1436309814453125, 0.14889144897460938, 0.15415191650390625, 0.15941238403320312, 0.1646728515625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 2.0, 5.0, 7.0, 6.0, 16.0, 7.0, 21.0, 42.0, 37.0, 73.0, 88.0, 204.0, 372.0, 767.0, 1611.0, 4209.0, 15312.0, 326154.0, 673493.0, 17945.0, 4544.0, 1794.0, 832.0, 406.0, 206.0, 139.0, 78.0, 60.0, 27.0, 36.0, 13.0, 10.0, 12.0, 8.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.0970458984375, -0.09435367584228516, -0.09166145324707031, -0.08896923065185547, -0.08627700805664062, -0.08358478546142578, -0.08089256286621094, -0.0782003402709961, -0.07550811767578125, -0.0728158950805664, -0.07012367248535156, -0.06743144989013672, -0.06473922729492188, -0.06204700469970703, -0.05935478210449219, -0.056662559509277344, -0.0539703369140625, -0.051278114318847656, -0.04858589172363281, -0.04589366912841797, -0.043201446533203125, -0.04050922393798828, -0.03781700134277344, -0.035124778747558594, -0.03243255615234375, -0.029740333557128906, -0.027048110961914062, -0.02435588836669922, -0.021663665771484375, -0.01897144317626953, -0.016279220581054688, -0.013586997985839844, -0.010894775390625, -0.008202552795410156, -0.0055103302001953125, -0.0028181076049804688, -0.000125885009765625, 0.0025663375854492188, 0.0052585601806640625, 0.007950782775878906, 0.01064300537109375, 0.013335227966308594, 0.016027450561523438, 0.01871967315673828, 0.021411895751953125, 0.02410411834716797, 0.026796340942382812, 0.029488563537597656, 0.0321807861328125, 0.034873008728027344, 0.03756523132324219, 0.04025745391845703, 0.042949676513671875, 0.04564189910888672, 0.04833412170410156, 0.051026344299316406, 0.05371856689453125, 0.056410789489746094, 0.05910301208496094, 0.06179523468017578, 0.06448745727539062, 0.06717967987060547, 0.06987190246582031, 0.07256412506103516, 0.07525634765625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 2.0, 9.0, 5.0, 7.0, 13.0, 23.0, 27.0, 61.0, 121.0, 337.0, 191.0, 79.0, 40.0, 22.0, 18.0, 13.0, 13.0, 4.0, 10.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3589859008789062e-05, -1.3173557817935944e-05, -1.2757256627082825e-05, -1.2340955436229706e-05, -1.1924654245376587e-05, -1.1508353054523468e-05, -1.1092051863670349e-05, -1.067575067281723e-05, -1.0259449481964111e-05, -9.843148291110992e-06, -9.426847100257874e-06, -9.010545909404755e-06, -8.594244718551636e-06, -8.177943527698517e-06, -7.761642336845398e-06, -7.345341145992279e-06, -6.92903995513916e-06, -6.512738764286041e-06, -6.096437573432922e-06, -5.6801363825798035e-06, -5.2638351917266846e-06, -4.847534000873566e-06, -4.431232810020447e-06, -4.014931619167328e-06, -3.598630428314209e-06, -3.18232923746109e-06, -2.766028046607971e-06, -2.3497268557548523e-06, -1.9334256649017334e-06, -1.5171244740486145e-06, -1.1008232831954956e-06, -6.845220923423767e-07, -2.682209014892578e-07, 1.4808028936386108e-07, 5.6438148021698e-07, 9.806826710700989e-07, 1.3969838619232178e-06, 1.8132850527763367e-06, 2.2295862436294556e-06, 2.6458874344825745e-06, 3.0621886253356934e-06, 3.4784898161888123e-06, 3.894791007041931e-06, 4.31109219789505e-06, 4.727393388748169e-06, 5.143694579601288e-06, 5.559995770454407e-06, 5.976296961307526e-06, 6.3925981521606445e-06, 6.8088993430137634e-06, 7.225200533866882e-06, 7.641501724720001e-06, 8.05780291557312e-06, 8.474104106426239e-06, 8.890405297279358e-06, 9.306706488132477e-06, 9.723007678985596e-06, 1.0139308869838715e-05, 1.0555610060691833e-05, 1.0971911251544952e-05, 1.1388212442398071e-05, 1.180451363325119e-05, 1.2220814824104309e-05, 1.2637116014957428e-05, 1.3053417205810547e-05]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 4.0, 2.0, 2.0, 3.0, 4.0, 8.0, 11.0, 24.0, 39.0, 68.0, 160.0, 347.0, 886.0, 2831.0, 14047.0, 906676.0, 113912.0, 6730.0, 1701.0, 583.0, 245.0, 101.0, 64.0, 35.0, 24.0, 13.0, 3.0, 6.0, 5.0, 8.0, 7.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.16552734375, -0.1611490249633789, -0.1567707061767578, -0.15239238739013672, -0.14801406860351562, -0.14363574981689453, -0.13925743103027344, -0.13487911224365234, -0.13050079345703125, -0.12612247467041016, -0.12174415588378906, -0.11736583709716797, -0.11298751831054688, -0.10860919952392578, -0.10423088073730469, -0.0998525619506836, -0.0954742431640625, -0.0910959243774414, -0.08671760559082031, -0.08233928680419922, -0.07796096801757812, -0.07358264923095703, -0.06920433044433594, -0.06482601165771484, -0.06044769287109375, -0.056069374084472656, -0.05169105529785156, -0.04731273651123047, -0.042934417724609375, -0.03855609893798828, -0.03417778015136719, -0.029799461364746094, -0.025421142578125, -0.021042823791503906, -0.016664505004882812, -0.012286186218261719, -0.007907867431640625, -0.0035295486450195312, 0.0008487701416015625, 0.005227088928222656, 0.00960540771484375, 0.013983726501464844, 0.018362045288085938, 0.02274036407470703, 0.027118682861328125, 0.03149700164794922, 0.03587532043457031, 0.040253639221191406, 0.0446319580078125, 0.049010276794433594, 0.05338859558105469, 0.05776691436767578, 0.062145233154296875, 0.06652355194091797, 0.07090187072753906, 0.07528018951416016, 0.07965850830078125, 0.08403682708740234, 0.08841514587402344, 0.09279346466064453, 0.09717178344726562, 0.10155010223388672, 0.10592842102050781, 0.1103067398071289, 0.11468505859375]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 1.0, 3.0, 1.0, 5.0, 5.0, 6.0, 12.0, 16.0, 37.0, 65.0, 110.0, 271.0, 211.0, 105.0, 51.0, 47.0, 21.0, 12.0, 4.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03369140625, -0.03239250183105469, -0.031093597412109375, -0.029794692993164062, -0.02849578857421875, -0.027196884155273438, -0.025897979736328125, -0.024599075317382812, -0.0233001708984375, -0.022001266479492188, -0.020702362060546875, -0.019403457641601562, -0.01810455322265625, -0.016805648803710938, -0.015506744384765625, -0.014207839965820312, -0.012908935546875, -0.011610031127929688, -0.010311126708984375, -0.009012222290039062, -0.00771331787109375, -0.0064144134521484375, -0.005115509033203125, -0.0038166046142578125, -0.0025177001953125, -0.0012187957763671875, 8.0108642578125e-05, 0.0013790130615234375, 0.00267791748046875, 0.0039768218994140625, 0.005275726318359375, 0.0065746307373046875, 0.00787353515625, 0.009172439575195312, 0.010471343994140625, 0.011770248413085938, 0.01306915283203125, 0.014368057250976562, 0.015666961669921875, 0.016965866088867188, 0.0182647705078125, 0.019563674926757812, 0.020862579345703125, 0.022161483764648438, 0.02346038818359375, 0.024759292602539062, 0.026058197021484375, 0.027357101440429688, 0.028656005859375, 0.029954910278320312, 0.031253814697265625, 0.03255271911621094, 0.03385162353515625, 0.03515052795410156, 0.036449432373046875, 0.03774833679199219, 0.0390472412109375, 0.04034614562988281, 0.041645050048828125, 0.04294395446777344, 0.04424285888671875, 0.04554176330566406, 0.046840667724609375, 0.04813957214355469, 0.0494384765625]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 13.0, 23.0, 36.0, 80.0, 167.0, 201.0, 194.0, 104.0, 81.0, 54.0, 25.0, 11.0, 9.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.618438184261322, -0.6024943590164185, -0.5865505337715149, -0.5706067085266113, -0.5546629428863525, -0.538719117641449, -0.5227752923965454, -0.5068314671516418, -0.4908876419067383, -0.4749438166618347, -0.45900002121925354, -0.44305619597435, -0.4271123707294464, -0.41116857528686523, -0.39522475004196167, -0.3792809247970581, -0.36333712935447693, -0.34739330410957336, -0.3314495086669922, -0.3155056834220886, -0.29956185817718506, -0.2836180329322815, -0.2676742374897003, -0.25173041224479675, -0.23578660190105438, -0.219842791557312, -0.20389896631240845, -0.18795515596866608, -0.1720113456249237, -0.15606752038002014, -0.14012371003627777, -0.1241798922419548, -0.10823610424995422, -0.09229228645563126, -0.07634846866130829, -0.06040465831756592, -0.04446084052324295, -0.028517022728919983, -0.012573212385177612, 0.0033706054091453552, 0.019314423203468323, 0.03525824099779129, 0.05120205506682396, 0.06714586913585663, 0.0830896869301796, 0.09903350472450256, 0.11497731506824493, 0.1309211254119873, 0.14686495065689087, 0.16280876100063324, 0.1787525862455368, 0.19469639658927917, 0.21064022183418274, 0.2265840321779251, 0.24252784252166748, 0.25847166776657104, 0.2744154930114746, 0.2903593182563782, 0.30630311369895935, 0.3222469389438629, 0.3381907641887665, 0.35413455963134766, 0.3700783848762512, 0.3860222101211548, 0.40196600556373596]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 8.0, 13.0, 8.0, 8.0, 17.0, 15.0, 20.0, 13.0, 23.0, 28.0, 29.0, 29.0, 27.0, 35.0, 37.0, 39.0, 41.0, 43.0, 38.0, 43.0, 37.0, 36.0, 36.0, 49.0, 34.0, 29.0, 41.0, 30.0, 27.0, 25.0, 24.0, 20.0, 20.0, 15.0, 19.0, 7.0, 9.0, 8.0, 4.0, 3.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.3023441433906555, -0.2936819791793823, -0.28501978516578674, -0.27635762095451355, -0.26769545674324036, -0.25903329253196716, -0.2503710985183716, -0.2417089343070984, -0.2330467700958252, -0.2243845909833908, -0.21572242677211761, -0.20706024765968323, -0.19839808344841003, -0.18973590433597565, -0.18107372522354126, -0.17241156101226807, -0.16374938189983368, -0.1550872027873993, -0.1464250385761261, -0.1377628594636917, -0.12910069525241852, -0.12043851613998413, -0.11177634447813034, -0.10311417281627655, -0.09445200115442276, -0.08578982949256897, -0.07712765783071518, -0.06846548616886139, -0.0598033107817173, -0.05114113911986351, -0.04247896373271942, -0.03381679207086563, -0.02515462040901184, -0.01649244874715805, -0.007830275222659111, 0.0008318983018398285, 0.009494069963693619, 0.01815624162554741, 0.026818417012691498, 0.03548058867454529, 0.04414276033639908, 0.05280493199825287, 0.06146710366010666, 0.07012927532196045, 0.07879145443439484, 0.08745361864566803, 0.09611579775810242, 0.10477796941995621, 0.11344014108181, 0.12210231274366379, 0.13076448440551758, 0.13942666351795197, 0.14808882772922516, 0.15675100684165955, 0.16541317105293274, 0.17407535016536713, 0.1827375292778015, 0.1913997083902359, 0.2000618726015091, 0.20872405171394348, 0.21738621592521667, 0.22604839503765106, 0.23471057415008545, 0.24337273836135864, 0.25203490257263184]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 5.0, 3.0, 8.0, 13.0, 10.0, 8.0, 12.0, 25.0, 19.0, 17.0, 21.0, 27.0, 19.0, 34.0, 48.0, 52.0, 109.0, 206.0, 581.0, 1953.0, 13075.0, 3081344.0, 1085318.0, 8746.0, 1530.0, 493.0, 205.0, 92.0, 62.0, 37.0, 27.0, 25.0, 26.0, 20.0, 21.0, 19.0, 13.0, 10.0, 11.0, 7.0, 5.0, 8.0, 6.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0], "bins": [-0.51806640625, -0.5007553100585938, -0.4834442138671875, -0.46613311767578125, -0.448822021484375, -0.43151092529296875, -0.4141998291015625, -0.39688873291015625, -0.37957763671875, -0.36226654052734375, -0.3449554443359375, -0.32764434814453125, -0.310333251953125, -0.29302215576171875, -0.2757110595703125, -0.25839996337890625, -0.2410888671875, -0.22377777099609375, -0.2064666748046875, -0.18915557861328125, -0.171844482421875, -0.15453338623046875, -0.1372222900390625, -0.11991119384765625, -0.10260009765625, -0.08528900146484375, -0.0679779052734375, -0.05066680908203125, -0.033355712890625, -0.01604461669921875, 0.0012664794921875, 0.01857757568359375, 0.035888671875, 0.05319976806640625, 0.0705108642578125, 0.08782196044921875, 0.105133056640625, 0.12244415283203125, 0.1397552490234375, 0.15706634521484375, 0.17437744140625, 0.19168853759765625, 0.2089996337890625, 0.22631072998046875, 0.243621826171875, 0.26093292236328125, 0.2782440185546875, 0.29555511474609375, 0.3128662109375, 0.33017730712890625, 0.3474884033203125, 0.36479949951171875, 0.382110595703125, 0.39942169189453125, 0.4167327880859375, 0.43404388427734375, 0.45135498046875, 0.46866607666015625, 0.4859771728515625, 0.5032882690429688, 0.520599365234375, 0.5379104614257812, 0.5552215576171875, 0.5725326538085938, 0.58984375]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 6.0, 4.0, 5.0, 10.0, 15.0, 13.0, 19.0, 24.0, 33.0, 39.0, 55.0, 48.0, 45.0, 59.0, 70.0, 61.0, 74.0, 64.0, 63.0, 60.0, 56.0, 36.0, 27.0, 32.0, 29.0, 12.0, 13.0, 9.0, 2.0, 9.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12481689453125, -0.12087154388427734, -0.11692619323730469, -0.11298084259033203, -0.10903549194335938, -0.10509014129638672, -0.10114479064941406, -0.0971994400024414, -0.09325408935546875, -0.0893087387084961, -0.08536338806152344, -0.08141803741455078, -0.07747268676757812, -0.07352733612060547, -0.06958198547363281, -0.06563663482666016, -0.0616912841796875, -0.057745933532714844, -0.05380058288574219, -0.04985523223876953, -0.045909881591796875, -0.04196453094482422, -0.03801918029785156, -0.034073829650878906, -0.03012847900390625, -0.026183128356933594, -0.022237777709960938, -0.01829242706298828, -0.014347076416015625, -0.010401725769042969, -0.0064563751220703125, -0.0025110244750976562, 0.001434326171875, 0.005379676818847656, 0.009325027465820312, 0.013270378112792969, 0.017215728759765625, 0.02116107940673828, 0.025106430053710938, 0.029051780700683594, 0.03299713134765625, 0.036942481994628906, 0.04088783264160156, 0.04483318328857422, 0.048778533935546875, 0.05272388458251953, 0.05666923522949219, 0.060614585876464844, 0.0645599365234375, 0.06850528717041016, 0.07245063781738281, 0.07639598846435547, 0.08034133911132812, 0.08428668975830078, 0.08823204040527344, 0.0921773910522461, 0.09612274169921875, 0.1000680923461914, 0.10401344299316406, 0.10795879364013672, 0.11190414428710938, 0.11584949493408203, 0.11979484558105469, 0.12374019622802734, 0.127685546875]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 10.0, 13.0, 11.0, 28.0, 42.0, 42.0, 125.0, 226.0, 687.0, 2270.0, 14543.0, 388518.0, 3733725.0, 47413.0, 4769.0, 1091.0, 394.0, 152.0, 58.0, 53.0, 32.0, 22.0, 16.0, 7.0, 8.0, 7.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.234130859375, -0.22359466552734375, -0.2130584716796875, -0.20252227783203125, -0.191986083984375, -0.18144989013671875, -0.1709136962890625, -0.16037750244140625, -0.14984130859375, -0.13930511474609375, -0.1287689208984375, -0.11823272705078125, -0.107696533203125, -0.09716033935546875, -0.0866241455078125, -0.07608795166015625, -0.0655517578125, -0.05501556396484375, -0.0444793701171875, -0.03394317626953125, -0.023406982421875, -0.01287078857421875, -0.0023345947265625, 0.00820159912109375, 0.01873779296875, 0.02927398681640625, 0.0398101806640625, 0.05034637451171875, 0.060882568359375, 0.07141876220703125, 0.0819549560546875, 0.09249114990234375, 0.10302734375, 0.11356353759765625, 0.1240997314453125, 0.13463592529296875, 0.145172119140625, 0.15570831298828125, 0.1662445068359375, 0.17678070068359375, 0.18731689453125, 0.19785308837890625, 0.2083892822265625, 0.21892547607421875, 0.229461669921875, 0.23999786376953125, 0.2505340576171875, 0.26107025146484375, 0.2716064453125, 0.28214263916015625, 0.2926788330078125, 0.30321502685546875, 0.313751220703125, 0.32428741455078125, 0.3348236083984375, 0.34535980224609375, 0.35589599609375, 0.36643218994140625, 0.3769683837890625, 0.38750457763671875, 0.398040771484375, 0.40857696533203125, 0.4191131591796875, 0.42964935302734375, 0.440185546875]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 5.0, 2.0, 3.0, 15.0, 13.0, 24.0, 20.0, 33.0, 39.0, 52.0, 64.0, 114.0, 149.0, 251.0, 470.0, 668.0, 771.0, 521.0, 309.0, 189.0, 102.0, 77.0, 39.0, 41.0, 34.0, 24.0, 11.0, 14.0, 9.0, 4.0, 5.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.057708740234375, -0.05623483657836914, -0.05476093292236328, -0.05328702926635742, -0.05181312561035156, -0.0503392219543457, -0.048865318298339844, -0.047391414642333984, -0.045917510986328125, -0.044443607330322266, -0.042969703674316406, -0.04149580001831055, -0.04002189636230469, -0.03854799270629883, -0.03707408905029297, -0.03560018539428711, -0.03412628173828125, -0.03265237808227539, -0.03117847442626953, -0.029704570770263672, -0.028230667114257812, -0.026756763458251953, -0.025282859802246094, -0.023808956146240234, -0.022335052490234375, -0.020861148834228516, -0.019387245178222656, -0.017913341522216797, -0.016439437866210938, -0.014965534210205078, -0.013491630554199219, -0.01201772689819336, -0.0105438232421875, -0.00906991958618164, -0.007596015930175781, -0.006122112274169922, -0.0046482086181640625, -0.003174304962158203, -0.0017004013061523438, -0.00022649765014648438, 0.001247406005859375, 0.0027213096618652344, 0.004195213317871094, 0.005669116973876953, 0.0071430206298828125, 0.008616924285888672, 0.010090827941894531, 0.01156473159790039, 0.01303863525390625, 0.01451253890991211, 0.01598644256591797, 0.017460346221923828, 0.018934249877929688, 0.020408153533935547, 0.021882057189941406, 0.023355960845947266, 0.024829864501953125, 0.026303768157958984, 0.027777671813964844, 0.029251575469970703, 0.030725479125976562, 0.03219938278198242, 0.03367328643798828, 0.03514719009399414, 0.03662109375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 3.0, 5.0, 14.0, 14.0, 31.0, 44.0, 77.0, 104.0, 131.0, 160.0, 139.0, 94.0, 70.0, 45.0, 31.0, 20.0, 13.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25304198265075684, -0.2447388917207718, -0.23643580079078674, -0.2281327098608017, -0.21982961893081665, -0.2115265280008316, -0.20322343707084656, -0.19492033123970032, -0.18661725521087646, -0.17831416428089142, -0.17001107335090637, -0.16170798242092133, -0.15340489149093628, -0.14510180056095123, -0.1367987096309662, -0.12849560379981995, -0.1201925128698349, -0.11188942193984985, -0.10358633100986481, -0.09528324007987976, -0.08698014914989471, -0.07867705821990967, -0.07037395983934402, -0.06207086890935898, -0.05376777797937393, -0.045464687049388885, -0.03716159611940384, -0.028858501464128494, -0.020555410534143448, -0.012252319604158401, -0.003949224948883057, 0.00435386598110199, 0.012656956911087036, 0.020960047841072083, 0.029263140633702278, 0.037566233426332474, 0.04586932435631752, 0.054172415286302567, 0.06247550994157791, 0.07077860087156296, 0.079081691801548, 0.08738478273153305, 0.0956878736615181, 0.10399097204208374, 0.11229406297206879, 0.12059715390205383, 0.12890024483203888, 0.13720333576202393, 0.14550642669200897, 0.15380951762199402, 0.16211260855197906, 0.1704156994819641, 0.17871879041194916, 0.1870218813419342, 0.19532498717308044, 0.2036280632019043, 0.21193116903305054, 0.22023425996303558, 0.22853735089302063, 0.23684044182300568, 0.24514353275299072, 0.25344663858413696, 0.2617497146129608, 0.27005282044410706, 0.2783558964729309]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 5.0, 6.0, 7.0, 3.0, 7.0, 13.0, 14.0, 15.0, 21.0, 18.0, 28.0, 33.0, 36.0, 39.0, 49.0, 34.0, 48.0, 42.0, 42.0, 47.0, 56.0, 64.0, 45.0, 44.0, 33.0, 33.0, 43.0, 34.0, 22.0, 23.0, 18.0, 21.0, 24.0, 11.0, 13.0, 4.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09925607591867447, -0.0955699160695076, -0.09188375622034073, -0.08819759637117386, -0.08451143652200699, -0.08082527667284012, -0.07713910937309265, -0.07345294952392578, -0.06976678967475891, -0.06608062982559204, -0.06239446997642517, -0.0587083101272583, -0.05502215027809143, -0.05133599042892456, -0.04764982685446739, -0.04396366700530052, -0.04027751088142395, -0.03659135103225708, -0.03290519118309021, -0.02921902947127819, -0.02553286962211132, -0.02184670977294445, -0.01816054806113243, -0.014474388211965561, -0.01078822836279869, -0.007102068047970533, -0.003415907733142376, 0.0002702530473470688, 0.003956412896513939, 0.007642572745680809, 0.011328734457492828, 0.015014894306659698, 0.018701061606407166, 0.022387221455574036, 0.026073381304740906, 0.029759543016552925, 0.033445701003074646, 0.037131860852241516, 0.040818024426698685, 0.044504184275865555, 0.048190344125032425, 0.051876503974199295, 0.055562663823366165, 0.059248827397823334, 0.0629349872469902, 0.06662114709615707, 0.07030730694532394, 0.07399346679449081, 0.07767962664365768, 0.08136578649282455, 0.08505194634199142, 0.0887381061911583, 0.09242426604032516, 0.09611042588949203, 0.0997965931892395, 0.10348275303840637, 0.10716891288757324, 0.11085507273674011, 0.11454123258590698, 0.11822739243507385, 0.12191355228424072, 0.1255997121334076, 0.12928587198257446, 0.13297203183174133, 0.1366581916809082]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 6.0, 6.0, 9.0, 16.0, 25.0, 27.0, 59.0, 126.0, 233.0, 480.0, 1068.0, 2525.0, 6339.0, 18429.0, 129495.0, 777317.0, 87528.0, 15397.0, 5444.0, 2139.0, 954.0, 451.0, 201.0, 125.0, 61.0, 36.0, 23.0, 9.0, 12.0, 5.0, 7.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1121826171875, -0.10918521881103516, -0.10618782043457031, -0.10319042205810547, -0.10019302368164062, -0.09719562530517578, -0.09419822692871094, -0.0912008285522461, -0.08820343017578125, -0.0852060317993164, -0.08220863342285156, -0.07921123504638672, -0.07621383666992188, -0.07321643829345703, -0.07021903991699219, -0.06722164154052734, -0.0642242431640625, -0.061226844787597656, -0.05822944641113281, -0.05523204803466797, -0.052234649658203125, -0.04923725128173828, -0.04623985290527344, -0.043242454528808594, -0.04024505615234375, -0.037247657775878906, -0.03425025939941406, -0.03125286102294922, -0.028255462646484375, -0.02525806427001953, -0.022260665893554688, -0.019263267517089844, -0.016265869140625, -0.013268470764160156, -0.010271072387695312, -0.007273674011230469, -0.004276275634765625, -0.0012788772583007812, 0.0017185211181640625, 0.004715919494628906, 0.00771331787109375, 0.010710716247558594, 0.013708114624023438, 0.01670551300048828, 0.019702911376953125, 0.02270030975341797, 0.025697708129882812, 0.028695106506347656, 0.0316925048828125, 0.034689903259277344, 0.03768730163574219, 0.04068470001220703, 0.043682098388671875, 0.04667949676513672, 0.04967689514160156, 0.052674293518066406, 0.05567169189453125, 0.058669090270996094, 0.06166648864746094, 0.06466388702392578, 0.06766128540039062, 0.07065868377685547, 0.07365608215332031, 0.07665348052978516, 0.07965087890625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 4.0, 6.0, 10.0, 10.0, 14.0, 15.0, 14.0, 27.0, 24.0, 39.0, 29.0, 50.0, 41.0, 55.0, 51.0, 65.0, 45.0, 51.0, 59.0, 58.0, 40.0, 39.0, 47.0, 34.0, 34.0, 25.0, 32.0, 24.0, 16.0, 14.0, 6.0, 8.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.076904296875, -0.0740365982055664, -0.07116889953613281, -0.06830120086669922, -0.06543350219726562, -0.06256580352783203, -0.05969810485839844, -0.056830406188964844, -0.05396270751953125, -0.051095008850097656, -0.04822731018066406, -0.04535961151123047, -0.042491912841796875, -0.03962421417236328, -0.03675651550292969, -0.033888816833496094, -0.0310211181640625, -0.028153419494628906, -0.025285720825195312, -0.02241802215576172, -0.019550323486328125, -0.01668262481689453, -0.013814926147460938, -0.010947227478027344, -0.00807952880859375, -0.005211830139160156, -0.0023441314697265625, 0.0005235671997070312, 0.003391265869140625, 0.006258964538574219, 0.009126663208007812, 0.011994361877441406, 0.014862060546875, 0.017729759216308594, 0.020597457885742188, 0.02346515655517578, 0.026332855224609375, 0.02920055389404297, 0.03206825256347656, 0.034935951232910156, 0.03780364990234375, 0.040671348571777344, 0.04353904724121094, 0.04640674591064453, 0.049274444580078125, 0.05214214324951172, 0.05500984191894531, 0.057877540588378906, 0.0607452392578125, 0.0636129379272461, 0.06648063659667969, 0.06934833526611328, 0.07221603393554688, 0.07508373260498047, 0.07795143127441406, 0.08081912994384766, 0.08368682861328125, 0.08655452728271484, 0.08942222595214844, 0.09228992462158203, 0.09515762329101562, 0.09802532196044922, 0.10089302062988281, 0.1037607192993164, 0.10662841796875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 7.0, 6.0, 14.0, 22.0, 20.0, 50.0, 79.0, 153.0, 399.0, 1108.0, 4094.0, 23271.0, 521538.0, 470569.0, 21615.0, 3855.0, 1023.0, 387.0, 141.0, 72.0, 40.0, 23.0, 14.0, 14.0, 11.0, 13.0, 8.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11566162109375, -0.11261653900146484, -0.10957145690917969, -0.10652637481689453, -0.10348129272460938, -0.10043621063232422, -0.09739112854003906, -0.0943460464477539, -0.09130096435546875, -0.0882558822631836, -0.08521080017089844, -0.08216571807861328, -0.07912063598632812, -0.07607555389404297, -0.07303047180175781, -0.06998538970947266, -0.0669403076171875, -0.06389522552490234, -0.06085014343261719, -0.05780506134033203, -0.054759979248046875, -0.05171489715576172, -0.04866981506347656, -0.045624732971191406, -0.04257965087890625, -0.039534568786621094, -0.03648948669433594, -0.03344440460205078, -0.030399322509765625, -0.02735424041748047, -0.024309158325195312, -0.021264076232910156, -0.018218994140625, -0.015173912048339844, -0.012128829956054688, -0.009083747863769531, -0.006038665771484375, -0.0029935836791992188, 5.14984130859375e-05, 0.0030965805053710938, 0.00614166259765625, 0.009186744689941406, 0.012231826782226562, 0.015276908874511719, 0.018321990966796875, 0.02136707305908203, 0.024412155151367188, 0.027457237243652344, 0.0305023193359375, 0.033547401428222656, 0.03659248352050781, 0.03963756561279297, 0.042682647705078125, 0.04572772979736328, 0.04877281188964844, 0.051817893981933594, 0.05486297607421875, 0.057908058166503906, 0.06095314025878906, 0.06399822235107422, 0.06704330444335938, 0.07008838653564453, 0.07313346862792969, 0.07617855072021484, 0.0792236328125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 4.0, 7.0, 12.0, 5.0, 7.0, 10.0, 8.0, 14.0, 10.0, 18.0, 20.0, 33.0, 32.0, 28.0, 32.0, 42.0, 45.0, 29.0, 44.0, 49.0, 30.0, 52.0, 44.0, 39.0, 51.0, 41.0, 35.0, 39.0, 16.0, 35.0, 29.0, 23.0, 13.0, 22.0, 13.0, 14.0, 14.0, 12.0, 8.0, 9.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.1610107421875, -0.15622520446777344, -0.15143966674804688, -0.1466541290283203, -0.14186859130859375, -0.1370830535888672, -0.13229751586914062, -0.12751197814941406, -0.1227264404296875, -0.11794090270996094, -0.11315536499023438, -0.10836982727050781, -0.10358428955078125, -0.09879875183105469, -0.09401321411132812, -0.08922767639160156, -0.084442138671875, -0.07965660095214844, -0.07487106323242188, -0.07008552551269531, -0.06529998779296875, -0.06051445007324219, -0.055728912353515625, -0.05094337463378906, -0.0461578369140625, -0.04137229919433594, -0.036586761474609375, -0.03180122375488281, -0.02701568603515625, -0.022230148315429688, -0.017444610595703125, -0.012659072875976562, -0.00787353515625, -0.0030879974365234375, 0.001697540283203125, 0.0064830780029296875, 0.01126861572265625, 0.016054153442382812, 0.020839691162109375, 0.025625228881835938, 0.0304107666015625, 0.03519630432128906, 0.039981842041015625, 0.04476737976074219, 0.04955291748046875, 0.05433845520019531, 0.059123992919921875, 0.06390953063964844, 0.068695068359375, 0.07348060607910156, 0.07826614379882812, 0.08305168151855469, 0.08783721923828125, 0.09262275695800781, 0.09740829467773438, 0.10219383239746094, 0.1069793701171875, 0.11176490783691406, 0.11655044555664062, 0.12133598327636719, 0.12612152099609375, 0.1309070587158203, 0.13569259643554688, 0.14047813415527344, 0.145263671875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 7.0, 6.0, 5.0, 13.0, 17.0, 26.0, 49.0, 61.0, 107.0, 181.0, 413.0, 992.0, 2753.0, 10055.0, 57676.0, 494707.0, 421199.0, 47246.0, 8741.0, 2480.0, 926.0, 401.0, 193.0, 104.0, 66.0, 39.0, 22.0, 18.0, 14.0, 7.0, 10.0, 4.0, 3.0, 3.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015625, -0.015103340148925781, -0.014581680297851562, -0.014060020446777344, -0.013538360595703125, -0.013016700744628906, -0.012495040893554688, -0.011973381042480469, -0.01145172119140625, -0.010930061340332031, -0.010408401489257812, -0.009886741638183594, -0.009365081787109375, -0.008843421936035156, -0.008321762084960938, -0.007800102233886719, -0.0072784423828125, -0.006756782531738281, -0.0062351226806640625, -0.005713462829589844, -0.005191802978515625, -0.004670143127441406, -0.0041484832763671875, -0.0036268234252929688, -0.00310516357421875, -0.0025835037231445312, -0.0020618438720703125, -0.0015401840209960938, -0.001018524169921875, -0.0004968643188476562, 2.47955322265625e-05, 0.0005464553833007812, 0.001068115234375, 0.0015897750854492188, 0.0021114349365234375, 0.0026330947875976562, 0.003154754638671875, 0.0036764144897460938, 0.0041980743408203125, 0.004719734191894531, 0.00524139404296875, 0.005763053894042969, 0.0062847137451171875, 0.006806373596191406, 0.007328033447265625, 0.007849693298339844, 0.008371353149414062, 0.008893013000488281, 0.0094146728515625, 0.009936332702636719, 0.010457992553710938, 0.010979652404785156, 0.011501312255859375, 0.012022972106933594, 0.012544631958007812, 0.013066291809082031, 0.01358795166015625, 0.014109611511230469, 0.014631271362304688, 0.015152931213378906, 0.015674591064453125, 0.016196250915527344, 0.016717910766601562, 0.01723957061767578, 0.01776123046875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 6.0, 9.0, 4.0, 14.0, 9.0, 14.0, 18.0, 20.0, 31.0, 21.0, 37.0, 54.0, 31.0, 80.0, 81.0, 85.0, 42.0, 69.0, 86.0, 58.0, 29.0, 43.0, 31.0, 23.0, 26.0, 20.0, 16.0, 6.0, 9.0, 7.0, 6.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-5.662441253662109e-06, -5.500391125679016e-06, -5.338340997695923e-06, -5.17629086971283e-06, -5.014240741729736e-06, -4.852190613746643e-06, -4.69014048576355e-06, -4.5280903577804565e-06, -4.366040229797363e-06, -4.20399010181427e-06, -4.041939973831177e-06, -3.8798898458480835e-06, -3.7178397178649902e-06, -3.555789589881897e-06, -3.3937394618988037e-06, -3.2316893339157104e-06, -3.069639205932617e-06, -2.907589077949524e-06, -2.7455389499664307e-06, -2.5834888219833374e-06, -2.421438694000244e-06, -2.259388566017151e-06, -2.0973384380340576e-06, -1.9352883100509644e-06, -1.773238182067871e-06, -1.6111880540847778e-06, -1.4491379261016846e-06, -1.2870877981185913e-06, -1.125037670135498e-06, -9.629875421524048e-07, -8.009374141693115e-07, -6.388872861862183e-07, -4.76837158203125e-07, -3.1478703022003174e-07, -1.5273690223693848e-07, 9.313225746154785e-09, 1.7136335372924805e-07, 3.334134817123413e-07, 4.954636096954346e-07, 6.575137376785278e-07, 8.195638656616211e-07, 9.816139936447144e-07, 1.1436641216278076e-06, 1.3057142496109009e-06, 1.4677643775939941e-06, 1.6298145055770874e-06, 1.7918646335601807e-06, 1.953914761543274e-06, 2.115964889526367e-06, 2.2780150175094604e-06, 2.4400651454925537e-06, 2.602115273475647e-06, 2.7641654014587402e-06, 2.9262155294418335e-06, 3.0882656574249268e-06, 3.25031578540802e-06, 3.4123659133911133e-06, 3.5744160413742065e-06, 3.7364661693573e-06, 3.898516297340393e-06, 4.060566425323486e-06, 4.22261655330658e-06, 4.384666681289673e-06, 4.546716809272766e-06, 4.708766937255859e-06]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 7.0, 5.0, 3.0, 4.0, 9.0, 11.0, 15.0, 29.0, 64.0, 74.0, 101.0, 211.0, 415.0, 883.0, 2209.0, 6554.0, 28415.0, 197968.0, 627334.0, 151975.0, 22934.0, 5763.0, 1965.0, 741.0, 402.0, 196.0, 105.0, 50.0, 33.0, 27.0, 12.0, 7.0, 8.0, 8.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.018890380859375, -0.018357276916503906, -0.017824172973632812, -0.01729106903076172, -0.016757965087890625, -0.01622486114501953, -0.015691757202148438, -0.015158653259277344, -0.01462554931640625, -0.014092445373535156, -0.013559341430664062, -0.013026237487792969, -0.012493133544921875, -0.011960029602050781, -0.011426925659179688, -0.010893821716308594, -0.0103607177734375, -0.009827613830566406, -0.009294509887695312, -0.008761405944824219, -0.008228302001953125, -0.007695198059082031, -0.0071620941162109375, -0.006628990173339844, -0.00609588623046875, -0.005562782287597656, -0.0050296783447265625, -0.004496574401855469, -0.003963470458984375, -0.0034303665161132812, -0.0028972625732421875, -0.0023641586303710938, -0.0018310546875, -0.0012979507446289062, -0.0007648468017578125, -0.00023174285888671875, 0.000301361083984375, 0.0008344650268554688, 0.0013675689697265625, 0.0019006729125976562, 0.00243377685546875, 0.0029668807983398438, 0.0034999847412109375, 0.004033088684082031, 0.004566192626953125, 0.005099296569824219, 0.0056324005126953125, 0.006165504455566406, 0.0066986083984375, 0.007231712341308594, 0.0077648162841796875, 0.008297920227050781, 0.008831024169921875, 0.009364128112792969, 0.009897232055664062, 0.010430335998535156, 0.01096343994140625, 0.011496543884277344, 0.012029647827148438, 0.012562751770019531, 0.013095855712890625, 0.013628959655761719, 0.014162063598632812, 0.014695167541503906, 0.015228271484375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 9.0, 6.0, 10.0, 11.0, 26.0, 19.0, 35.0, 32.0, 35.0, 59.0, 88.0, 91.0, 75.0, 85.0, 78.0, 76.0, 61.0, 35.0, 36.0, 29.0, 28.0, 17.0, 10.0, 3.0, 7.0, 7.0, 5.0, 6.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.003871917724609375, -0.0037503838539123535, -0.003628849983215332, -0.0035073161125183105, -0.003385782241821289, -0.0032642483711242676, -0.003142714500427246, -0.0030211806297302246, -0.002899646759033203, -0.0027781128883361816, -0.00265657901763916, -0.0025350451469421387, -0.002413511276245117, -0.0022919774055480957, -0.0021704435348510742, -0.0020489096641540527, -0.0019273757934570312, -0.0018058419227600098, -0.0016843080520629883, -0.0015627741813659668, -0.0014412403106689453, -0.0013197064399719238, -0.0011981725692749023, -0.0010766386985778809, -0.0009551048278808594, -0.0008335709571838379, -0.0007120370864868164, -0.0005905032157897949, -0.00046896934509277344, -0.00034743547439575195, -0.00022590160369873047, -0.00010436773300170898, 1.71661376953125e-05, 0.00013870000839233398, 0.00026023387908935547, 0.00038176774978637695, 0.0005033016204833984, 0.0006248354911804199, 0.0007463693618774414, 0.0008679032325744629, 0.0009894371032714844, 0.0011109709739685059, 0.0012325048446655273, 0.0013540387153625488, 0.0014755725860595703, 0.0015971064567565918, 0.0017186403274536133, 0.0018401741981506348, 0.0019617080688476562, 0.0020832419395446777, 0.0022047758102416992, 0.0023263096809387207, 0.002447843551635742, 0.0025693774223327637, 0.002690911293029785, 0.0028124451637268066, 0.002933979034423828, 0.0030555129051208496, 0.003177046775817871, 0.0032985806465148926, 0.003420114517211914, 0.0035416483879089355, 0.003663182258605957, 0.0037847161293029785, 0.00390625]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 3.0, 9.0, 12.0, 22.0, 32.0, 79.0, 79.0, 133.0, 140.0, 159.0, 120.0, 88.0, 42.0, 38.0, 23.0, 13.0, 4.0, 8.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.20603322982788086, -0.2004377394914627, -0.19484224915504456, -0.1892467439174652, -0.18365125358104706, -0.1780557632446289, -0.17246027290821075, -0.1668647825717926, -0.16126927733421326, -0.1556737869977951, -0.15007829666137695, -0.1444827914237976, -0.13888730108737946, -0.1332918107509613, -0.12769632041454315, -0.122100830078125, -0.11650533974170685, -0.1109098494052887, -0.10531435161828995, -0.0997188612818718, -0.09412336349487305, -0.0885278731584549, -0.08293238282203674, -0.07733689248561859, -0.07174139469861984, -0.06614590436220169, -0.06055040657520294, -0.05495491623878479, -0.04935942217707634, -0.04376392811536789, -0.03816843777894974, -0.03257294371724129, -0.026977434754371643, -0.021381940692663193, -0.01578644849359989, -0.01019095629453659, -0.00459546223282814, 0.00100003182888031, 0.006595522165298462, 0.012191016227006912, 0.017786510288715363, 0.023382004350423813, 0.028977496549487114, 0.034572988748550415, 0.040168482810258865, 0.045763976871967316, 0.05135946720838547, 0.05695496127009392, 0.06255045533180237, 0.06814594566822052, 0.07374144345521927, 0.07933693379163742, 0.08493243157863617, 0.09052792191505432, 0.09612341225147247, 0.10171890258789062, 0.10731440037488937, 0.11290989071130753, 0.11850538849830627, 0.12410087883472443, 0.12969636917114258, 0.13529187440872192, 0.14088734984397888, 0.14648285508155823, 0.15207834541797638]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 6.0, 8.0, 9.0, 5.0, 4.0, 9.0, 14.0, 22.0, 14.0, 26.0, 34.0, 31.0, 47.0, 44.0, 49.0, 40.0, 44.0, 54.0, 62.0, 58.0, 57.0, 56.0, 36.0, 42.0, 32.0, 45.0, 24.0, 31.0, 34.0, 23.0, 17.0, 11.0, 7.0, 5.0, 6.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07813102751970291, -0.07540745288133621, -0.07268387824296951, -0.06996030360460281, -0.06723672896623611, -0.06451314687728882, -0.06178957596421242, -0.05906599760055542, -0.05634242296218872, -0.05361884832382202, -0.05089527368545532, -0.04817169904708862, -0.045448120683431625, -0.042724546045064926, -0.04000097140669823, -0.03727739304304123, -0.03455382212996483, -0.03183024749159813, -0.02910667099058628, -0.02638309635221958, -0.023659519851207733, -0.020935945212841034, -0.018212370574474335, -0.015488794073462486, -0.012765219435095787, -0.010041643865406513, -0.007318068761378527, -0.00459449365735054, -0.0018709180876612663, 0.0008526574820280075, 0.0035762321203947067, 0.006299808621406555, 0.009023383259773254, 0.011746958829462528, 0.014470534399151802, 0.0171941090375185, 0.01991768553853035, 0.02264126017689705, 0.025364834815263748, 0.028088411316275597, 0.030811985954642296, 0.033535562455654144, 0.036259137094020844, 0.03898271173238754, 0.04170628637075424, 0.04442986100912094, 0.04715343564748764, 0.04987701401114464, 0.05260058864951134, 0.055324163287878036, 0.058047737926244736, 0.06077131628990173, 0.06349489092826843, 0.06621846556663513, 0.06894204020500183, 0.07166561484336853, 0.07438918948173523, 0.07711276412010193, 0.07983633875846863, 0.08255991339683533, 0.08528348803520203, 0.08800706267356873, 0.09073063731193542, 0.09345421940088272, 0.09617779403924942]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 5.0, 12.0, 10.0, 16.0, 29.0, 44.0, 65.0, 98.0, 170.0, 314.0, 517.0, 985.0, 2021.0, 4517.0, 11774.0, 38137.0, 199954.0, 669989.0, 84590.0, 21635.0, 7411.0, 3122.0, 1439.0, 790.0, 406.0, 185.0, 121.0, 75.0, 56.0, 21.0, 13.0, 15.0, 13.0, 6.0, 6.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0867919921875, -0.08271217346191406, -0.07863235473632812, -0.07455253601074219, -0.07047271728515625, -0.06639289855957031, -0.062313079833984375, -0.05823326110839844, -0.0541534423828125, -0.05007362365722656, -0.045993804931640625, -0.04191398620605469, -0.03783416748046875, -0.03375434875488281, -0.029674530029296875, -0.025594711303710938, -0.021514892578125, -0.017435073852539062, -0.013355255126953125, -0.009275436401367188, -0.00519561767578125, -0.0011157989501953125, 0.002964019775390625, 0.0070438385009765625, 0.0111236572265625, 0.015203475952148438, 0.019283294677734375, 0.023363113403320312, 0.02744293212890625, 0.03152275085449219, 0.035602569580078125, 0.03968238830566406, 0.04376220703125, 0.04784202575683594, 0.051921844482421875, 0.05600166320800781, 0.06008148193359375, 0.06416130065917969, 0.06824111938476562, 0.07232093811035156, 0.0764007568359375, 0.08048057556152344, 0.08456039428710938, 0.08864021301269531, 0.09272003173828125, 0.09679985046386719, 0.10087966918945312, 0.10495948791503906, 0.109039306640625, 0.11311912536621094, 0.11719894409179688, 0.12127876281738281, 0.12535858154296875, 0.1294384002685547, 0.13351821899414062, 0.13759803771972656, 0.1416778564453125, 0.14575767517089844, 0.14983749389648438, 0.1539173126220703, 0.15799713134765625, 0.1620769500732422, 0.16615676879882812, 0.17023658752441406, 0.17431640625]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 9.0, 7.0, 3.0, 10.0, 8.0, 8.0, 18.0, 21.0, 19.0, 30.0, 35.0, 40.0, 44.0, 44.0, 47.0, 53.0, 54.0, 77.0, 45.0, 62.0, 49.0, 43.0, 58.0, 38.0, 24.0, 24.0, 38.0, 26.0, 25.0, 15.0, 9.0, 7.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1494140625, -0.1441936492919922, -0.13897323608398438, -0.13375282287597656, -0.12853240966796875, -0.12331199645996094, -0.11809158325195312, -0.11287117004394531, -0.1076507568359375, -0.10243034362792969, -0.09720993041992188, -0.09198951721191406, -0.08676910400390625, -0.08154869079589844, -0.07632827758789062, -0.07110786437988281, -0.065887451171875, -0.06066703796386719, -0.055446624755859375, -0.05022621154785156, -0.04500579833984375, -0.03978538513183594, -0.034564971923828125, -0.029344558715820312, -0.0241241455078125, -0.018903732299804688, -0.013683319091796875, -0.008462905883789062, -0.00324249267578125, 0.0019779205322265625, 0.007198333740234375, 0.012418746948242188, 0.01763916015625, 0.022859573364257812, 0.028079986572265625, 0.03330039978027344, 0.03852081298828125, 0.04374122619628906, 0.048961639404296875, 0.05418205261230469, 0.0594024658203125, 0.06462287902832031, 0.06984329223632812, 0.07506370544433594, 0.08028411865234375, 0.08550453186035156, 0.09072494506835938, 0.09594535827636719, 0.101165771484375, 0.10638618469238281, 0.11160659790039062, 0.11682701110839844, 0.12204742431640625, 0.12726783752441406, 0.13248825073242188, 0.1377086639404297, 0.1429290771484375, 0.1481494903564453, 0.15336990356445312, 0.15859031677246094, 0.16381072998046875, 0.16903114318847656, 0.17425155639648438, 0.1794719696044922, 0.1846923828125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 4.0, 5.0, 5.0, 17.0, 27.0, 30.0, 58.0, 76.0, 121.0, 210.0, 530.0, 3093.0, 95841.0, 935362.0, 11314.0, 1109.0, 306.0, 143.0, 95.0, 48.0, 47.0, 27.0, 18.0, 30.0, 11.0, 11.0, 5.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47314453125, -0.4600868225097656, -0.44702911376953125, -0.4339714050292969, -0.4209136962890625, -0.4078559875488281, -0.39479827880859375, -0.3817405700683594, -0.368682861328125, -0.3556251525878906, -0.34256744384765625, -0.3295097351074219, -0.3164520263671875, -0.3033943176269531, -0.29033660888671875, -0.2772789001464844, -0.26422119140625, -0.2511634826660156, -0.23810577392578125, -0.22504806518554688, -0.2119903564453125, -0.19893264770507812, -0.18587493896484375, -0.17281723022460938, -0.159759521484375, -0.14670181274414062, -0.13364410400390625, -0.12058639526367188, -0.1075286865234375, -0.09447097778320312, -0.08141326904296875, -0.06835556030273438, -0.0552978515625, -0.042240142822265625, -0.02918243408203125, -0.016124725341796875, -0.0030670166015625, 0.009990692138671875, 0.02304840087890625, 0.036106109619140625, 0.049163818359375, 0.062221527099609375, 0.07527923583984375, 0.08833694458007812, 0.1013946533203125, 0.11445236206054688, 0.12751007080078125, 0.14056777954101562, 0.15362548828125, 0.16668319702148438, 0.17974090576171875, 0.19279861450195312, 0.2058563232421875, 0.21891403198242188, 0.23197174072265625, 0.24502944946289062, 0.258087158203125, 0.2711448669433594, 0.28420257568359375, 0.2972602844238281, 0.3103179931640625, 0.3233757019042969, 0.33643341064453125, 0.3494911193847656, 0.362548828125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 4.0, 7.0, 7.0, 3.0, 9.0, 11.0, 17.0, 25.0, 43.0, 37.0, 54.0, 53.0, 57.0, 63.0, 65.0, 53.0, 72.0, 80.0, 52.0, 47.0, 51.0, 40.0, 36.0, 27.0, 19.0, 20.0, 18.0, 15.0, 10.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.264404296875, -0.2571239471435547, -0.24984359741210938, -0.24256324768066406, -0.23528289794921875, -0.22800254821777344, -0.22072219848632812, -0.2134418487548828, -0.2061614990234375, -0.1988811492919922, -0.19160079956054688, -0.18432044982910156, -0.17704010009765625, -0.16975975036621094, -0.16247940063476562, -0.1551990509033203, -0.147918701171875, -0.1406383514404297, -0.13335800170898438, -0.12607765197753906, -0.11879730224609375, -0.11151695251464844, -0.10423660278320312, -0.09695625305175781, -0.0896759033203125, -0.08239555358886719, -0.07511520385742188, -0.06783485412597656, -0.06055450439453125, -0.05327415466308594, -0.045993804931640625, -0.03871345520019531, -0.03143310546875, -0.024152755737304688, -0.016872406005859375, -0.009592056274414062, -0.00231170654296875, 0.0049686431884765625, 0.012248992919921875, 0.019529342651367188, 0.0268096923828125, 0.03409004211425781, 0.041370391845703125, 0.04865074157714844, 0.05593109130859375, 0.06321144104003906, 0.07049179077148438, 0.07777214050292969, 0.085052490234375, 0.09233283996582031, 0.09961318969726562, 0.10689353942871094, 0.11417388916015625, 0.12145423889160156, 0.12873458862304688, 0.1360149383544922, 0.1432952880859375, 0.1505756378173828, 0.15785598754882812, 0.16513633728027344, 0.17241668701171875, 0.17969703674316406, 0.18697738647460938, 0.1942577362060547, 0.2015380859375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 7.0, 10.0, 10.0, 17.0, 24.0, 33.0, 55.0, 78.0, 133.0, 247.0, 449.0, 918.0, 2384.0, 7469.0, 42421.0, 621680.0, 336352.0, 26908.0, 5720.0, 1900.0, 809.0, 386.0, 191.0, 112.0, 70.0, 49.0, 40.0, 22.0, 13.0, 9.0, 12.0, 6.0, 1.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0457763671875, -0.044599294662475586, -0.04342222213745117, -0.04224514961242676, -0.041068077087402344, -0.03989100456237793, -0.038713932037353516, -0.0375368595123291, -0.03635978698730469, -0.03518271446228027, -0.03400564193725586, -0.032828569412231445, -0.03165149688720703, -0.030474424362182617, -0.029297351837158203, -0.02812027931213379, -0.026943206787109375, -0.02576613426208496, -0.024589061737060547, -0.023411989212036133, -0.02223491668701172, -0.021057844161987305, -0.01988077163696289, -0.018703699111938477, -0.017526626586914062, -0.01634955406188965, -0.015172481536865234, -0.01399540901184082, -0.012818336486816406, -0.011641263961791992, -0.010464191436767578, -0.009287118911743164, -0.00811004638671875, -0.006932973861694336, -0.005755901336669922, -0.004578828811645508, -0.0034017562866210938, -0.0022246837615966797, -0.0010476112365722656, 0.00012946128845214844, 0.0013065338134765625, 0.0024836063385009766, 0.0036606788635253906, 0.004837751388549805, 0.006014823913574219, 0.007191896438598633, 0.008368968963623047, 0.009546041488647461, 0.010723114013671875, 0.011900186538696289, 0.013077259063720703, 0.014254331588745117, 0.015431404113769531, 0.016608476638793945, 0.01778554916381836, 0.018962621688842773, 0.020139694213867188, 0.0213167667388916, 0.022493839263916016, 0.02367091178894043, 0.024847984313964844, 0.026025056838989258, 0.027202129364013672, 0.028379201889038086, 0.0295562744140625]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 5.0, 14.0, 9.0, 14.0, 22.0, 44.0, 94.0, 115.0, 149.0, 152.0, 150.0, 77.0, 49.0, 43.0, 16.0, 20.0, 6.0, 4.0, 4.0, 8.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.68899917602539e-06, -7.442198693752289e-06, -7.195398211479187e-06, -6.948597729206085e-06, -6.701797246932983e-06, -6.454996764659882e-06, -6.20819628238678e-06, -5.961395800113678e-06, -5.714595317840576e-06, -5.467794835567474e-06, -5.2209943532943726e-06, -4.974193871021271e-06, -4.727393388748169e-06, -4.480592906475067e-06, -4.233792424201965e-06, -3.9869919419288635e-06, -3.7401914596557617e-06, -3.49339097738266e-06, -3.246590495109558e-06, -2.9997900128364563e-06, -2.7529895305633545e-06, -2.5061890482902527e-06, -2.259388566017151e-06, -2.012588083744049e-06, -1.7657876014709473e-06, -1.5189871191978455e-06, -1.2721866369247437e-06, -1.0253861546516418e-06, -7.7858567237854e-07, -5.317851901054382e-07, -2.849847078323364e-07, -3.818422555923462e-08, 2.086162567138672e-07, 4.55416738986969e-07, 7.022172212600708e-07, 9.490177035331726e-07, 1.1958181858062744e-06, 1.4426186680793762e-06, 1.689419150352478e-06, 1.93621963262558e-06, 2.1830201148986816e-06, 2.4298205971717834e-06, 2.6766210794448853e-06, 2.923421561717987e-06, 3.170222043991089e-06, 3.4170225262641907e-06, 3.6638230085372925e-06, 3.910623490810394e-06, 4.157423973083496e-06, 4.404224455356598e-06, 4.6510249376297e-06, 4.8978254199028015e-06, 5.144625902175903e-06, 5.391426384449005e-06, 5.638226866722107e-06, 5.885027348995209e-06, 6.1318278312683105e-06, 6.378628313541412e-06, 6.625428795814514e-06, 6.872229278087616e-06, 7.119029760360718e-06, 7.36583024263382e-06, 7.612630724906921e-06, 7.859431207180023e-06, 8.106231689453125e-06]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 6.0, 10.0, 17.0, 16.0, 28.0, 39.0, 98.0, 156.0, 286.0, 619.0, 1754.0, 6793.0, 67260.0, 905192.0, 56972.0, 6346.0, 1686.0, 645.0, 296.0, 142.0, 75.0, 44.0, 25.0, 19.0, 6.0, 4.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.05230712890625, -0.050253868103027344, -0.04820060729980469, -0.04614734649658203, -0.044094085693359375, -0.04204082489013672, -0.03998756408691406, -0.037934303283691406, -0.03588104248046875, -0.033827781677246094, -0.03177452087402344, -0.02972126007080078, -0.027667999267578125, -0.02561473846435547, -0.023561477661132812, -0.021508216857910156, -0.0194549560546875, -0.017401695251464844, -0.015348434448242188, -0.013295173645019531, -0.011241912841796875, -0.009188652038574219, -0.0071353912353515625, -0.005082130432128906, -0.00302886962890625, -0.0009756088256835938, 0.0010776519775390625, 0.0031309127807617188, 0.005184173583984375, 0.007237434387207031, 0.009290695190429688, 0.011343955993652344, 0.013397216796875, 0.015450477600097656, 0.017503738403320312, 0.01955699920654297, 0.021610260009765625, 0.02366352081298828, 0.025716781616210938, 0.027770042419433594, 0.02982330322265625, 0.031876564025878906, 0.03392982482910156, 0.03598308563232422, 0.038036346435546875, 0.04008960723876953, 0.04214286804199219, 0.044196128845214844, 0.0462493896484375, 0.048302650451660156, 0.05035591125488281, 0.05240917205810547, 0.054462432861328125, 0.05651569366455078, 0.05856895446777344, 0.060622215270996094, 0.06267547607421875, 0.0647287368774414, 0.06678199768066406, 0.06883525848388672, 0.07088851928710938, 0.07294178009033203, 0.07499504089355469, 0.07704830169677734, 0.0791015625]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 1.0, 6.0, 5.0, 6.0, 13.0, 11.0, 9.0, 15.0, 26.0, 30.0, 33.0, 63.0, 83.0, 94.0, 122.0, 100.0, 103.0, 76.0, 46.0, 46.0, 28.0, 20.0, 17.0, 11.0, 8.0, 3.0, 3.0, 5.0, 2.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01136016845703125, -0.01098942756652832, -0.01061868667602539, -0.010247945785522461, -0.009877204895019531, -0.009506464004516602, -0.009135723114013672, -0.008764982223510742, -0.008394241333007812, -0.008023500442504883, -0.007652759552001953, -0.0072820186614990234, -0.006911277770996094, -0.006540536880493164, -0.006169795989990234, -0.005799055099487305, -0.005428314208984375, -0.005057573318481445, -0.004686832427978516, -0.004316091537475586, -0.003945350646972656, -0.0035746097564697266, -0.003203868865966797, -0.002833127975463867, -0.0024623870849609375, -0.002091646194458008, -0.0017209053039550781, -0.0013501644134521484, -0.0009794235229492188, -0.0006086826324462891, -0.00023794174194335938, 0.0001327991485595703, 0.0005035400390625, 0.0008742809295654297, 0.0012450218200683594, 0.001615762710571289, 0.0019865036010742188, 0.0023572444915771484, 0.002727985382080078, 0.003098726272583008, 0.0034694671630859375, 0.003840208053588867, 0.004210948944091797, 0.0045816898345947266, 0.004952430725097656, 0.005323171615600586, 0.005693912506103516, 0.006064653396606445, 0.006435394287109375, 0.006806135177612305, 0.007176876068115234, 0.007547616958618164, 0.007918357849121094, 0.008289098739624023, 0.008659839630126953, 0.009030580520629883, 0.009401321411132812, 0.009772062301635742, 0.010142803192138672, 0.010513544082641602, 0.010884284973144531, 0.011255025863647461, 0.01162576675415039, 0.01199650764465332, 0.01236724853515625]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 7.0, 6.0, 12.0, 27.0, 58.0, 90.0, 126.0, 164.0, 186.0, 114.0, 74.0, 62.0, 33.0, 19.0, 10.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.4505625069141388, -0.43900638818740845, -0.4274502396583557, -0.41589412093162537, -0.404338002204895, -0.3927818536758423, -0.38122573494911194, -0.3696696162223816, -0.35811346769332886, -0.3465573489665985, -0.3350012004375458, -0.32344508171081543, -0.3118889331817627, -0.30033281445503235, -0.288776695728302, -0.27722054719924927, -0.2656644284725189, -0.2541083097457886, -0.24255216121673584, -0.2309960424900055, -0.21943990886211395, -0.2078837752342224, -0.19632765650749207, -0.18477152287960052, -0.17321538925170898, -0.16165925562381744, -0.1501031219959259, -0.13854700326919556, -0.12699086964130402, -0.11543473601341248, -0.10387860983610153, -0.09232248365879059, -0.08076637983322144, -0.0692102462053299, -0.05765412002801895, -0.04609799012541771, -0.03454186022281647, -0.022985730320215225, -0.011429600417613983, 0.00012652575969696045, 0.011682659387588501, 0.023238789290189743, 0.034794919192790985, 0.04635104909539223, 0.05790717899799347, 0.06946331262588501, 0.08101943880319595, 0.0925755649805069, 0.10413169860839844, 0.11568783223628998, 0.12724396586418152, 0.13880008459091187, 0.1503562182188034, 0.16191235184669495, 0.1734684705734253, 0.18502460420131683, 0.19658073782920837, 0.20813687145709991, 0.21969300508499146, 0.2312491238117218, 0.24280525743961334, 0.2543613910675049, 0.26591750979423523, 0.2774736285209656, 0.2890297770500183]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 3.0, 1.0, 4.0, 8.0, 7.0, 9.0, 3.0, 6.0, 9.0, 19.0, 10.0, 14.0, 12.0, 33.0, 26.0, 28.0, 34.0, 23.0, 29.0, 30.0, 40.0, 34.0, 45.0, 40.0, 37.0, 49.0, 43.0, 44.0, 39.0, 42.0, 32.0, 28.0, 26.0, 34.0, 24.0, 23.0, 19.0, 17.0, 18.0, 12.0, 10.0, 8.0, 14.0, 7.0, 4.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.23896682262420654, -0.2311481088399887, -0.22332940995693207, -0.21551069617271423, -0.2076919972896576, -0.19987328350543976, -0.19205456972122192, -0.18423587083816528, -0.17641717195510864, -0.1685984581708908, -0.16077975928783417, -0.15296104550361633, -0.1451423466205597, -0.13732363283634186, -0.12950491905212402, -0.12168622016906738, -0.11386750638484955, -0.10604880005121231, -0.09823009371757507, -0.09041137993335724, -0.0825926810503006, -0.07477396726608276, -0.06695526093244553, -0.05913655459880829, -0.05131784826517105, -0.043499141931533813, -0.035680435597896576, -0.02786172553896904, -0.020043019205331802, -0.012224312871694565, -0.004405602812767029, 0.0034131035208702087, 0.011231809854507446, 0.019050516188144684, 0.02686922438442707, 0.03468793258070946, 0.042506638914346695, 0.05032534524798393, 0.05814405530691147, 0.0659627616405487, 0.07378146797418594, 0.08160017430782318, 0.08941888064146042, 0.09723758697509766, 0.10505630075931549, 0.11287499964237213, 0.12069371342658997, 0.1285124123096466, 0.13633112609386444, 0.14414983987808228, 0.15196853876113892, 0.15978725254535675, 0.1676059514284134, 0.17542466521263123, 0.18324336409568787, 0.1910620778799057, 0.19888079166412354, 0.20669950544834137, 0.214518204331398, 0.22233691811561584, 0.23015561699867249, 0.23797433078289032, 0.24579304456710815, 0.2536117434501648, 0.26143044233322144]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 0.0, 1.0, 1.0, 4.0, 10.0, 4.0, 9.0, 7.0, 21.0, 22.0, 26.0, 41.0, 53.0, 81.0, 99.0, 141.0, 207.0, 293.0, 385.0, 652.0, 950.0, 1511.0, 2585.0, 4842.0, 9592.0, 23540.0, 85643.0, 697571.0, 2606771.0, 633952.0, 81207.0, 22507.0, 9680.0, 4669.0, 2689.0, 1523.0, 953.0, 643.0, 422.0, 262.0, 198.0, 134.0, 100.0, 64.0, 53.0, 41.0, 38.0, 28.0, 14.0, 11.0, 12.0, 5.0, 7.0, 7.0, 5.0, 4.0, 1.0, 3.0], "bins": [-0.120361328125, -0.11687088012695312, -0.11338043212890625, -0.10988998413085938, -0.1063995361328125, -0.10290908813476562, -0.09941864013671875, -0.09592819213867188, -0.092437744140625, -0.08894729614257812, -0.08545684814453125, -0.08196640014648438, -0.0784759521484375, -0.07498550415039062, -0.07149505615234375, -0.06800460815429688, -0.06451416015625, -0.061023712158203125, -0.05753326416015625, -0.054042816162109375, -0.0505523681640625, -0.047061920166015625, -0.04357147216796875, -0.040081024169921875, -0.036590576171875, -0.033100128173828125, -0.02960968017578125, -0.026119232177734375, -0.0226287841796875, -0.019138336181640625, -0.01564788818359375, -0.012157440185546875, -0.0086669921875, -0.005176544189453125, -0.00168609619140625, 0.001804351806640625, 0.0052947998046875, 0.008785247802734375, 0.01227569580078125, 0.015766143798828125, 0.019256591796875, 0.022747039794921875, 0.02623748779296875, 0.029727935791015625, 0.0332183837890625, 0.036708831787109375, 0.04019927978515625, 0.043689727783203125, 0.04718017578125, 0.050670623779296875, 0.05416107177734375, 0.057651519775390625, 0.0611419677734375, 0.06463241577148438, 0.06812286376953125, 0.07161331176757812, 0.075103759765625, 0.07859420776367188, 0.08208465576171875, 0.08557510375976562, 0.0890655517578125, 0.09255599975585938, 0.09604644775390625, 0.09953689575195312, 0.10302734375]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 6.0, 5.0, 9.0, 4.0, 7.0, 19.0, 19.0, 26.0, 34.0, 31.0, 35.0, 42.0, 47.0, 57.0, 57.0, 46.0, 69.0, 68.0, 62.0, 51.0, 46.0, 46.0, 45.0, 26.0, 22.0, 35.0, 20.0, 14.0, 21.0, 15.0, 9.0, 10.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0888671875, -0.08586597442626953, -0.08286476135253906, -0.0798635482788086, -0.07686233520507812, -0.07386112213134766, -0.07085990905761719, -0.06785869598388672, -0.06485748291015625, -0.06185626983642578, -0.05885505676269531, -0.055853843688964844, -0.052852630615234375, -0.049851417541503906, -0.04685020446777344, -0.04384899139404297, -0.0408477783203125, -0.03784656524658203, -0.03484535217285156, -0.031844139099121094, -0.028842926025390625, -0.025841712951660156, -0.022840499877929688, -0.01983928680419922, -0.01683807373046875, -0.013836860656738281, -0.010835647583007812, -0.007834434509277344, -0.004833221435546875, -0.0018320083618164062, 0.0011692047119140625, 0.004170417785644531, 0.007171630859375, 0.010172843933105469, 0.013174057006835938, 0.016175270080566406, 0.019176483154296875, 0.022177696228027344, 0.025178909301757812, 0.02818012237548828, 0.03118133544921875, 0.03418254852294922, 0.03718376159667969, 0.040184974670410156, 0.043186187744140625, 0.046187400817871094, 0.04918861389160156, 0.05218982696533203, 0.0551910400390625, 0.05819225311279297, 0.06119346618652344, 0.0641946792602539, 0.06719589233398438, 0.07019710540771484, 0.07319831848144531, 0.07619953155517578, 0.07920074462890625, 0.08220195770263672, 0.08520317077636719, 0.08820438385009766, 0.09120559692382812, 0.0942068099975586, 0.09720802307128906, 0.10020923614501953, 0.10321044921875]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 8.0, 14.0, 12.0, 24.0, 43.0, 95.0, 208.0, 693.0, 4499.0, 153897.0, 4005177.0, 27040.0, 1826.0, 411.0, 168.0, 74.0, 35.0, 20.0, 12.0, 9.0, 8.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4326171875, -0.4183387756347656, -0.40406036376953125, -0.3897819519042969, -0.3755035400390625, -0.3612251281738281, -0.34694671630859375, -0.3326683044433594, -0.318389892578125, -0.3041114807128906, -0.28983306884765625, -0.2755546569824219, -0.2612762451171875, -0.24699783325195312, -0.23271942138671875, -0.21844100952148438, -0.20416259765625, -0.18988418579101562, -0.17560577392578125, -0.16132736206054688, -0.1470489501953125, -0.13277053833007812, -0.11849212646484375, -0.10421371459960938, -0.089935302734375, -0.07565689086914062, -0.06137847900390625, -0.047100067138671875, -0.0328216552734375, -0.018543243408203125, -0.00426483154296875, 0.010013580322265625, 0.0242919921875, 0.038570404052734375, 0.05284881591796875, 0.06712722778320312, 0.0814056396484375, 0.09568405151367188, 0.10996246337890625, 0.12424087524414062, 0.138519287109375, 0.15279769897460938, 0.16707611083984375, 0.18135452270507812, 0.1956329345703125, 0.20991134643554688, 0.22418975830078125, 0.23846817016601562, 0.25274658203125, 0.2670249938964844, 0.28130340576171875, 0.2955818176269531, 0.3098602294921875, 0.3241386413574219, 0.33841705322265625, 0.3526954650878906, 0.366973876953125, 0.3812522888183594, 0.39553070068359375, 0.4098091125488281, 0.4240875244140625, 0.4383659362792969, 0.45264434814453125, 0.4669227600097656, 0.481201171875]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 7.0, 4.0, 2.0, 8.0, 7.0, 6.0, 20.0, 22.0, 22.0, 30.0, 33.0, 59.0, 88.0, 114.0, 215.0, 336.0, 609.0, 725.0, 625.0, 411.0, 264.0, 149.0, 87.0, 60.0, 39.0, 42.0, 26.0, 15.0, 11.0, 13.0, 4.0, 4.0, 10.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.039306640625, -0.03788423538208008, -0.036461830139160156, -0.035039424896240234, -0.03361701965332031, -0.03219461441040039, -0.03077220916748047, -0.029349803924560547, -0.027927398681640625, -0.026504993438720703, -0.02508258819580078, -0.02366018295288086, -0.022237777709960938, -0.020815372467041016, -0.019392967224121094, -0.017970561981201172, -0.01654815673828125, -0.015125751495361328, -0.013703346252441406, -0.012280941009521484, -0.010858535766601562, -0.00943613052368164, -0.008013725280761719, -0.006591320037841797, -0.005168914794921875, -0.003746509552001953, -0.0023241043090820312, -0.0009016990661621094, 0.0005207061767578125, 0.0019431114196777344, 0.0033655166625976562, 0.004787921905517578, 0.0062103271484375, 0.007632732391357422, 0.009055137634277344, 0.010477542877197266, 0.011899948120117188, 0.01332235336303711, 0.014744758605957031, 0.016167163848876953, 0.017589569091796875, 0.019011974334716797, 0.02043437957763672, 0.02185678482055664, 0.023279190063476562, 0.024701595306396484, 0.026124000549316406, 0.027546405792236328, 0.02896881103515625, 0.030391216278076172, 0.031813621520996094, 0.033236026763916016, 0.03465843200683594, 0.03608083724975586, 0.03750324249267578, 0.0389256477355957, 0.040348052978515625, 0.04177045822143555, 0.04319286346435547, 0.04461526870727539, 0.04603767395019531, 0.047460079193115234, 0.048882484436035156, 0.05030488967895508, 0.051727294921875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 4.0, 10.0, 12.0, 22.0, 32.0, 44.0, 61.0, 73.0, 109.0, 113.0, 97.0, 100.0, 95.0, 78.0, 36.0, 43.0, 25.0, 20.0, 10.0, 12.0, 10.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22854658961296082, -0.22285278141498566, -0.2171589583158493, -0.21146515011787415, -0.205771341919899, -0.20007753372192383, -0.19438371062278748, -0.18868990242481232, -0.18299609422683716, -0.177302286028862, -0.17160846292972565, -0.1659146547317505, -0.16022084653377533, -0.15452703833580017, -0.14883321523666382, -0.14313940703868866, -0.1374455988407135, -0.13175179064273834, -0.126057967543602, -0.12036415934562683, -0.11467035114765167, -0.10897653549909592, -0.10328271985054016, -0.097588911652565, -0.09189508855342865, -0.0862012729048729, -0.08050746470689774, -0.07481364905834198, -0.06911984086036682, -0.06342602521181107, -0.05773221328854561, -0.05203840136528015, -0.04634459316730499, -0.040650781244039536, -0.03495696932077408, -0.029263155534863472, -0.023569343611598015, -0.017875531688332558, -0.012181717902421951, -0.006487905979156494, -0.000794094055891037, 0.0048997183330357075, 0.010593530721962452, 0.016287343576550484, 0.02198115549981594, 0.027674967423081398, 0.033368781208992004, 0.03906259313225746, 0.04475640505552292, 0.050450216978788376, 0.05614402890205383, 0.06183784455060959, 0.06753165274858475, 0.0732254683971405, 0.07891927659511566, 0.08461309224367142, 0.09030690789222717, 0.09600072354078293, 0.10169453173875809, 0.10738834738731384, 0.113082155585289, 0.11877597123384476, 0.12446978688240051, 0.13016359508037567, 0.13585740327835083]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 7.0, 3.0, 6.0, 8.0, 4.0, 6.0, 18.0, 19.0, 19.0, 23.0, 33.0, 22.0, 27.0, 26.0, 45.0, 34.0, 43.0, 47.0, 37.0, 49.0, 53.0, 45.0, 48.0, 41.0, 40.0, 38.0, 34.0, 30.0, 37.0, 30.0, 17.0, 23.0, 21.0, 20.0, 14.0, 8.0, 16.0, 6.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10078470408916473, -0.09767913073301315, -0.09457355737686157, -0.09146799147129059, -0.08836241811513901, -0.08525684475898743, -0.08215127885341644, -0.07904570549726486, -0.07594013214111328, -0.0728345587849617, -0.06972898542881012, -0.06662341952323914, -0.06351784616708755, -0.060412272810935974, -0.05730670318007469, -0.05420113354921341, -0.05109556019306183, -0.04798998683691025, -0.044884417206048965, -0.04177884757518768, -0.0386732742190361, -0.03556770086288452, -0.03246213123202324, -0.029356559738516808, -0.026250988245010376, -0.023145416751503944, -0.020039845257997513, -0.01693427376449108, -0.01382870227098465, -0.010723130777478218, -0.0076175592839717865, -0.004511987790465355, -0.0014064162969589233, 0.0016991551965475082, 0.00480472669005394, 0.007910298183560371, 0.011015869677066803, 0.014121441170573235, 0.017227012664079666, 0.020332584157586098, 0.02343815565109253, 0.02654372714459896, 0.029649298638105392, 0.032754868268966675, 0.035860441625118256, 0.038966014981269836, 0.04207158461213112, 0.0451771542429924, 0.04828272759914398, 0.05138830095529556, 0.054493870586156845, 0.05759944021701813, 0.06070501357316971, 0.06381058692932129, 0.06691615283489227, 0.07002172619104385, 0.07312729954719543, 0.07623287290334702, 0.0793384462594986, 0.08244401216506958, 0.08554958552122116, 0.08865515887737274, 0.09176072478294373, 0.0948662981390953, 0.09797187149524689]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 6.0, 8.0, 7.0, 9.0, 16.0, 24.0, 44.0, 39.0, 72.0, 93.0, 157.0, 248.0, 455.0, 774.0, 1298.0, 2438.0, 4528.0, 9428.0, 20521.0, 60095.0, 279263.0, 498608.0, 112020.0, 31798.0, 12993.0, 6254.0, 3240.0, 1727.0, 939.0, 547.0, 293.0, 214.0, 134.0, 88.0, 58.0, 33.0, 33.0, 20.0, 12.0, 11.0, 9.0, 0.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03985595703125, -0.038619041442871094, -0.03738212585449219, -0.03614521026611328, -0.034908294677734375, -0.03367137908935547, -0.03243446350097656, -0.031197547912597656, -0.02996063232421875, -0.028723716735839844, -0.027486801147460938, -0.02624988555908203, -0.025012969970703125, -0.02377605438232422, -0.022539138793945312, -0.021302223205566406, -0.0200653076171875, -0.018828392028808594, -0.017591476440429688, -0.01635456085205078, -0.015117645263671875, -0.013880729675292969, -0.012643814086914062, -0.011406898498535156, -0.01016998291015625, -0.008933067321777344, -0.0076961517333984375, -0.006459236145019531, -0.005222320556640625, -0.003985404968261719, -0.0027484893798828125, -0.0015115737915039062, -0.000274658203125, 0.0009622573852539062, 0.0021991729736328125, 0.0034360885620117188, 0.004673004150390625, 0.005909919738769531, 0.0071468353271484375, 0.008383750915527344, 0.00962066650390625, 0.010857582092285156, 0.012094497680664062, 0.013331413269042969, 0.014568328857421875, 0.01580524444580078, 0.017042160034179688, 0.018279075622558594, 0.0195159912109375, 0.020752906799316406, 0.021989822387695312, 0.02322673797607422, 0.024463653564453125, 0.02570056915283203, 0.026937484741210938, 0.028174400329589844, 0.02941131591796875, 0.030648231506347656, 0.03188514709472656, 0.03312206268310547, 0.034358978271484375, 0.03559589385986328, 0.03683280944824219, 0.038069725036621094, 0.039306640625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 5.0, 5.0, 4.0, 9.0, 7.0, 9.0, 16.0, 16.0, 17.0, 15.0, 19.0, 33.0, 31.0, 26.0, 30.0, 39.0, 27.0, 49.0, 66.0, 52.0, 47.0, 56.0, 52.0, 32.0, 48.0, 43.0, 32.0, 34.0, 33.0, 28.0, 19.0, 17.0, 25.0, 12.0, 19.0, 9.0, 8.0, 7.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.058837890625, -0.056914329528808594, -0.05499076843261719, -0.05306720733642578, -0.051143646240234375, -0.04922008514404297, -0.04729652404785156, -0.045372962951660156, -0.04344940185546875, -0.041525840759277344, -0.03960227966308594, -0.03767871856689453, -0.035755157470703125, -0.03383159637451172, -0.03190803527832031, -0.029984474182128906, -0.0280609130859375, -0.026137351989746094, -0.024213790893554688, -0.02229022979736328, -0.020366668701171875, -0.01844310760498047, -0.016519546508789062, -0.014595985412597656, -0.01267242431640625, -0.010748863220214844, -0.008825302124023438, -0.006901741027832031, -0.004978179931640625, -0.0030546188354492188, -0.0011310577392578125, 0.0007925033569335938, 0.002716064453125, 0.004639625549316406, 0.0065631866455078125, 0.008486747741699219, 0.010410308837890625, 0.012333869934082031, 0.014257431030273438, 0.016180992126464844, 0.01810455322265625, 0.020028114318847656, 0.021951675415039062, 0.02387523651123047, 0.025798797607421875, 0.02772235870361328, 0.029645919799804688, 0.031569480895996094, 0.0334930419921875, 0.035416603088378906, 0.03734016418457031, 0.03926372528076172, 0.041187286376953125, 0.04311084747314453, 0.04503440856933594, 0.046957969665527344, 0.04888153076171875, 0.050805091857910156, 0.05272865295410156, 0.05465221405029297, 0.056575775146484375, 0.05849933624267578, 0.06042289733886719, 0.062346458435058594, 0.06427001953125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 6.0, 6.0, 4.0, 12.0, 10.0, 17.0, 22.0, 31.0, 40.0, 57.0, 91.0, 209.0, 439.0, 1299.0, 4339.0, 18015.0, 129246.0, 744998.0, 125895.0, 17380.0, 4195.0, 1287.0, 470.0, 188.0, 107.0, 54.0, 34.0, 29.0, 13.0, 10.0, 12.0, 8.0, 4.0, 5.0, 8.0, 3.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046356201171875, -0.04472923278808594, -0.043102264404296875, -0.04147529602050781, -0.03984832763671875, -0.03822135925292969, -0.036594390869140625, -0.03496742248535156, -0.0333404541015625, -0.03171348571777344, -0.030086517333984375, -0.028459548950195312, -0.02683258056640625, -0.025205612182617188, -0.023578643798828125, -0.021951675415039062, -0.02032470703125, -0.018697738647460938, -0.017070770263671875, -0.015443801879882812, -0.01381683349609375, -0.012189865112304688, -0.010562896728515625, -0.008935928344726562, -0.0073089599609375, -0.0056819915771484375, -0.004055023193359375, -0.0024280548095703125, -0.00080108642578125, 0.0008258819580078125, 0.002452850341796875, 0.0040798187255859375, 0.005706787109375, 0.0073337554931640625, 0.008960723876953125, 0.010587692260742188, 0.01221466064453125, 0.013841629028320312, 0.015468597412109375, 0.017095565795898438, 0.0187225341796875, 0.020349502563476562, 0.021976470947265625, 0.023603439331054688, 0.02523040771484375, 0.026857376098632812, 0.028484344482421875, 0.030111312866210938, 0.03173828125, 0.03336524963378906, 0.034992218017578125, 0.03661918640136719, 0.03824615478515625, 0.03987312316894531, 0.041500091552734375, 0.04312705993652344, 0.0447540283203125, 0.04638099670410156, 0.048007965087890625, 0.04963493347167969, 0.05126190185546875, 0.05288887023925781, 0.054515838623046875, 0.05614280700683594, 0.057769775390625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 6.0, 5.0, 13.0, 7.0, 7.0, 13.0, 15.0, 13.0, 12.0, 22.0, 24.0, 18.0, 38.0, 36.0, 44.0, 41.0, 48.0, 58.0, 28.0, 43.0, 46.0, 58.0, 49.0, 46.0, 39.0, 48.0, 35.0, 32.0, 29.0, 23.0, 15.0, 18.0, 19.0, 7.0, 12.0, 10.0, 6.0, 4.0, 8.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.12200927734375, -0.11800289154052734, -0.11399650573730469, -0.10999011993408203, -0.10598373413085938, -0.10197734832763672, -0.09797096252441406, -0.0939645767211914, -0.08995819091796875, -0.0859518051147461, -0.08194541931152344, -0.07793903350830078, -0.07393264770507812, -0.06992626190185547, -0.06591987609863281, -0.061913490295410156, -0.0579071044921875, -0.053900718688964844, -0.04989433288574219, -0.04588794708251953, -0.041881561279296875, -0.03787517547607422, -0.03386878967285156, -0.029862403869628906, -0.02585601806640625, -0.021849632263183594, -0.017843246459960938, -0.013836860656738281, -0.009830474853515625, -0.005824089050292969, -0.0018177032470703125, 0.0021886825561523438, 0.006195068359375, 0.010201454162597656, 0.014207839965820312, 0.01821422576904297, 0.022220611572265625, 0.02622699737548828, 0.030233383178710938, 0.034239768981933594, 0.03824615478515625, 0.042252540588378906, 0.04625892639160156, 0.05026531219482422, 0.054271697998046875, 0.05827808380126953, 0.06228446960449219, 0.06629085540771484, 0.0702972412109375, 0.07430362701416016, 0.07831001281738281, 0.08231639862060547, 0.08632278442382812, 0.09032917022705078, 0.09433555603027344, 0.0983419418334961, 0.10234832763671875, 0.1063547134399414, 0.11036109924316406, 0.11436748504638672, 0.11837387084960938, 0.12238025665283203, 0.1263866424560547, 0.13039302825927734, 0.1343994140625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 6.0, 2.0, 11.0, 8.0, 10.0, 14.0, 9.0, 26.0, 35.0, 49.0, 68.0, 114.0, 142.0, 241.0, 376.0, 622.0, 1032.0, 1910.0, 3602.0, 8001.0, 22183.0, 105460.0, 628460.0, 219045.0, 35580.0, 11047.0, 4774.0, 2402.0, 1274.0, 688.0, 486.0, 270.0, 186.0, 125.0, 85.0, 53.0, 39.0, 17.0, 21.0, 25.0, 10.0, 12.0, 12.0, 11.0, 5.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.016357421875, -0.01588571071624756, -0.015413999557495117, -0.014942288398742676, -0.014470577239990234, -0.013998866081237793, -0.013527154922485352, -0.01305544376373291, -0.012583732604980469, -0.012112021446228027, -0.011640310287475586, -0.011168599128723145, -0.010696887969970703, -0.010225176811218262, -0.00975346565246582, -0.009281754493713379, -0.008810043334960938, -0.008338332176208496, -0.007866621017456055, -0.007394909858703613, -0.006923198699951172, -0.0064514875411987305, -0.005979776382446289, -0.005508065223693848, -0.005036354064941406, -0.004564642906188965, -0.0040929317474365234, -0.003621220588684082, -0.0031495094299316406, -0.0026777982711791992, -0.002206087112426758, -0.0017343759536743164, -0.001262664794921875, -0.0007909536361694336, -0.0003192424774169922, 0.00015246868133544922, 0.0006241798400878906, 0.001095890998840332, 0.0015676021575927734, 0.002039313316345215, 0.0025110244750976562, 0.0029827356338500977, 0.003454446792602539, 0.0039261579513549805, 0.004397869110107422, 0.004869580268859863, 0.005341291427612305, 0.005813002586364746, 0.0062847137451171875, 0.006756424903869629, 0.00722813606262207, 0.007699847221374512, 0.008171558380126953, 0.008643269538879395, 0.009114980697631836, 0.009586691856384277, 0.010058403015136719, 0.01053011417388916, 0.011001825332641602, 0.011473536491394043, 0.011945247650146484, 0.012416958808898926, 0.012888669967651367, 0.013360381126403809, 0.01383209228515625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 4.0, 16.0, 8.0, 19.0, 26.0, 45.0, 43.0, 90.0, 89.0, 124.0, 108.0, 124.0, 90.0, 70.0, 48.0, 33.0, 19.0, 10.0, 12.0, 9.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.510185241699219e-06, -7.243826985359192e-06, -6.977468729019165e-06, -6.711110472679138e-06, -6.444752216339111e-06, -6.1783939599990845e-06, -5.912035703659058e-06, -5.645677447319031e-06, -5.379319190979004e-06, -5.112960934638977e-06, -4.84660267829895e-06, -4.580244421958923e-06, -4.3138861656188965e-06, -4.04752790927887e-06, -3.7811696529388428e-06, -3.514811396598816e-06, -3.248453140258789e-06, -2.982094883918762e-06, -2.7157366275787354e-06, -2.4493783712387085e-06, -2.1830201148986816e-06, -1.9166618585586548e-06, -1.650303602218628e-06, -1.383945345878601e-06, -1.1175870895385742e-06, -8.512288331985474e-07, -5.848705768585205e-07, -3.1851232051849365e-07, -5.21540641784668e-08, 2.1420419216156006e-07, 4.805624485015869e-07, 7.469207048416138e-07, 1.0132789611816406e-06, 1.2796372175216675e-06, 1.5459954738616943e-06, 1.8123537302017212e-06, 2.078711986541748e-06, 2.345070242881775e-06, 2.6114284992218018e-06, 2.8777867555618286e-06, 3.1441450119018555e-06, 3.4105032682418823e-06, 3.676861524581909e-06, 3.943219780921936e-06, 4.209578037261963e-06, 4.47593629360199e-06, 4.742294549942017e-06, 5.0086528062820435e-06, 5.27501106262207e-06, 5.541369318962097e-06, 5.807727575302124e-06, 6.074085831642151e-06, 6.340444087982178e-06, 6.606802344322205e-06, 6.8731606006622314e-06, 7.139518857002258e-06, 7.405877113342285e-06, 7.672235369682312e-06, 7.938593626022339e-06, 8.204951882362366e-06, 8.471310138702393e-06, 8.73766839504242e-06, 9.004026651382446e-06, 9.270384907722473e-06, 9.5367431640625e-06]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 6.0, 7.0, 6.0, 6.0, 14.0, 19.0, 26.0, 51.0, 71.0, 134.0, 218.0, 479.0, 968.0, 2269.0, 5625.0, 19753.0, 169328.0, 739909.0, 88020.0, 13751.0, 4472.0, 1768.0, 777.0, 382.0, 191.0, 112.0, 71.0, 42.0, 28.0, 16.0, 10.0, 5.0, 7.0, 3.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0249481201171875, -0.024126768112182617, -0.023305416107177734, -0.02248406410217285, -0.02166271209716797, -0.020841360092163086, -0.020020008087158203, -0.01919865608215332, -0.018377304077148438, -0.017555952072143555, -0.016734600067138672, -0.01591324806213379, -0.015091896057128906, -0.014270544052124023, -0.01344919204711914, -0.012627840042114258, -0.011806488037109375, -0.010985136032104492, -0.01016378402709961, -0.009342432022094727, -0.008521080017089844, -0.007699728012084961, -0.006878376007080078, -0.006057024002075195, -0.0052356719970703125, -0.00441431999206543, -0.003592967987060547, -0.002771615982055664, -0.0019502639770507812, -0.0011289119720458984, -0.0003075599670410156, 0.0005137920379638672, 0.00133514404296875, 0.002156496047973633, 0.0029778480529785156, 0.0037992000579833984, 0.004620552062988281, 0.005441904067993164, 0.006263256072998047, 0.00708460807800293, 0.007905960083007812, 0.008727312088012695, 0.009548664093017578, 0.010370016098022461, 0.011191368103027344, 0.012012720108032227, 0.01283407211303711, 0.013655424118041992, 0.014476776123046875, 0.015298128128051758, 0.01611948013305664, 0.016940832138061523, 0.017762184143066406, 0.01858353614807129, 0.019404888153076172, 0.020226240158081055, 0.021047592163085938, 0.02186894416809082, 0.022690296173095703, 0.023511648178100586, 0.02433300018310547, 0.02515435218811035, 0.025975704193115234, 0.026797056198120117, 0.027618408203125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 2.0, 8.0, 7.0, 11.0, 16.0, 24.0, 33.0, 72.0, 92.0, 148.0, 185.0, 126.0, 98.0, 62.0, 48.0, 20.0, 15.0, 10.0, 5.0, 2.0, 7.0, 2.0, 4.0, 0.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00662994384765625, -0.0064321160316467285, -0.006234288215637207, -0.0060364603996276855, -0.005838632583618164, -0.005640804767608643, -0.005442976951599121, -0.0052451491355896, -0.005047321319580078, -0.004849493503570557, -0.004651665687561035, -0.004453837871551514, -0.004256010055541992, -0.004058182239532471, -0.0038603544235229492, -0.0036625266075134277, -0.0034646987915039062, -0.0032668709754943848, -0.0030690431594848633, -0.002871215343475342, -0.0026733875274658203, -0.002475559711456299, -0.0022777318954467773, -0.002079904079437256, -0.0018820762634277344, -0.0016842484474182129, -0.0014864206314086914, -0.00128859281539917, -0.0010907649993896484, -0.000892937183380127, -0.0006951093673706055, -0.000497281551361084, -0.0002994537353515625, -0.00010162591934204102, 9.620189666748047e-05, 0.00029402971267700195, 0.0004918575286865234, 0.0006896853446960449, 0.0008875131607055664, 0.0010853409767150879, 0.0012831687927246094, 0.0014809966087341309, 0.0016788244247436523, 0.0018766522407531738, 0.0020744800567626953, 0.002272307872772217, 0.0024701356887817383, 0.0026679635047912598, 0.0028657913208007812, 0.0030636191368103027, 0.0032614469528198242, 0.0034592747688293457, 0.003657102584838867, 0.0038549304008483887, 0.00405275821685791, 0.004250586032867432, 0.004448413848876953, 0.004646241664886475, 0.004844069480895996, 0.005041897296905518, 0.005239725112915039, 0.0054375529289245605, 0.005635380744934082, 0.0058332085609436035, 0.006031036376953125]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 9.0, 10.0, 15.0, 51.0, 60.0, 99.0, 140.0, 152.0, 132.0, 134.0, 74.0, 56.0, 32.0, 18.0, 12.0, 7.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2007479965686798, -0.19636370241641998, -0.19197940826416016, -0.18759509921073914, -0.1832108050584793, -0.17882651090621948, -0.17444221675395966, -0.17005792260169983, -0.16567362844944, -0.16128933429718018, -0.15690504014492035, -0.15252074599266052, -0.1481364369392395, -0.14375214278697968, -0.13936784863471985, -0.13498355448246002, -0.1305992603302002, -0.12621496617794037, -0.12183066457509995, -0.11744637042284012, -0.11306207627058029, -0.10867777466773987, -0.10429348051548004, -0.09990918636322021, -0.0955248773097992, -0.09114058315753937, -0.08675628155469894, -0.08237198740243912, -0.07798769325017929, -0.07360339164733887, -0.06921909749507904, -0.06483480334281921, -0.060450516641139984, -0.05606621876358986, -0.05168192461133003, -0.04729762673377991, -0.04291333258152008, -0.038529034703969955, -0.03414473682641983, -0.029760440811514854, -0.02537614479660988, -0.020991848781704903, -0.016607552766799927, -0.012223254889249802, -0.007838958874344826, -0.00345466285943985, 0.0009296350181102753, 0.005313931033015251, 0.009698227047920227, 0.014082523062825203, 0.01846681907773018, 0.022851116955280304, 0.02723541297018528, 0.031619708985090256, 0.03600400686264038, 0.04038830101490021, 0.04477259889245033, 0.04915689677000046, 0.053541190922260284, 0.05792548879981041, 0.062309786677360535, 0.06669408082962036, 0.07107837498188019, 0.07546267658472061, 0.07984697073698044]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 2.0, 5.0, 2.0, 6.0, 6.0, 9.0, 14.0, 10.0, 21.0, 21.0, 28.0, 24.0, 35.0, 36.0, 40.0, 41.0, 39.0, 49.0, 49.0, 58.0, 61.0, 41.0, 49.0, 44.0, 41.0, 40.0, 30.0, 42.0, 30.0, 23.0, 23.0, 23.0, 14.0, 16.0, 10.0, 10.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06404274702072144, -0.062102433294057846, -0.06016211956739426, -0.05822180584073067, -0.05628149211406708, -0.05434117838740349, -0.0524008646607399, -0.05046054720878601, -0.04852023720741272, -0.04657992348074913, -0.04463960975408554, -0.04269929602742195, -0.04075898230075836, -0.03881866857409477, -0.03687835484743118, -0.034938037395477295, -0.032997723668813705, -0.031057409942150116, -0.029117096215486526, -0.027176782488822937, -0.025236468762159348, -0.023296155035495758, -0.02135583944618702, -0.01941552571952343, -0.01747521199285984, -0.015534898266196251, -0.013594584539532661, -0.011654269881546497, -0.009713956154882908, -0.007773642428219318, -0.005833327770233154, -0.003893014043569565, -0.0019527003169059753, -1.238635741174221e-05, 0.001927927602082491, 0.0038682417944073677, 0.005808555521070957, 0.007748869247734547, 0.00968918390572071, 0.0116294976323843, 0.01356981135904789, 0.01551012508571148, 0.01745043881237507, 0.019390754401683807, 0.021331068128347397, 0.023271381855010986, 0.025211695581674576, 0.027152009308338165, 0.029092323035001755, 0.031032636761665344, 0.032972950488328934, 0.03491326421499252, 0.03685357794165611, 0.0387938916683197, 0.04073420912027359, 0.04267451912164688, 0.04461483657360077, 0.04655515030026436, 0.04849546402692795, 0.05043577775359154, 0.05237609148025513, 0.054316405206918716, 0.056256718933582306, 0.058197036385536194, 0.060137346386909485]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 5.0, 2.0, 6.0, 9.0, 9.0, 17.0, 7.0, 33.0, 45.0, 33.0, 67.0, 73.0, 120.0, 185.0, 272.0, 364.0, 586.0, 874.0, 1475.0, 2388.0, 4032.0, 7352.0, 13613.0, 29518.0, 87082.0, 331149.0, 393576.0, 106481.0, 34402.0, 15107.0, 8017.0, 4457.0, 2571.0, 1554.0, 1006.0, 647.0, 440.0, 296.0, 209.0, 146.0, 91.0, 63.0, 45.0, 37.0, 25.0, 23.0, 25.0, 8.0, 8.0, 5.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05548095703125, -0.05363655090332031, -0.051792144775390625, -0.04994773864746094, -0.04810333251953125, -0.04625892639160156, -0.044414520263671875, -0.04257011413574219, -0.0407257080078125, -0.03888130187988281, -0.037036895751953125, -0.03519248962402344, -0.03334808349609375, -0.03150367736816406, -0.029659271240234375, -0.027814865112304688, -0.025970458984375, -0.024126052856445312, -0.022281646728515625, -0.020437240600585938, -0.01859283447265625, -0.016748428344726562, -0.014904022216796875, -0.013059616088867188, -0.0112152099609375, -0.009370803833007812, -0.007526397705078125, -0.0056819915771484375, -0.00383758544921875, -0.0019931793212890625, -0.000148773193359375, 0.0016956329345703125, 0.0035400390625, 0.0053844451904296875, 0.007228851318359375, 0.009073257446289062, 0.01091766357421875, 0.012762069702148438, 0.014606475830078125, 0.016450881958007812, 0.0182952880859375, 0.020139694213867188, 0.021984100341796875, 0.023828506469726562, 0.02567291259765625, 0.027517318725585938, 0.029361724853515625, 0.031206130981445312, 0.033050537109375, 0.03489494323730469, 0.036739349365234375, 0.03858375549316406, 0.04042816162109375, 0.04227256774902344, 0.044116973876953125, 0.04596138000488281, 0.0478057861328125, 0.04965019226074219, 0.051494598388671875, 0.05333900451660156, 0.05518341064453125, 0.05702781677246094, 0.058872222900390625, 0.06071662902832031, 0.06256103515625]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 5.0, 5.0, 6.0, 4.0, 10.0, 14.0, 14.0, 17.0, 28.0, 24.0, 30.0, 24.0, 42.0, 35.0, 45.0, 44.0, 51.0, 72.0, 45.0, 49.0, 47.0, 47.0, 46.0, 48.0, 30.0, 37.0, 36.0, 26.0, 18.0, 15.0, 32.0, 14.0, 16.0, 9.0, 7.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.15087890625, -0.1466541290283203, -0.14242935180664062, -0.13820457458496094, -0.13397979736328125, -0.12975502014160156, -0.12553024291992188, -0.12130546569824219, -0.1170806884765625, -0.11285591125488281, -0.10863113403320312, -0.10440635681152344, -0.10018157958984375, -0.09595680236816406, -0.09173202514648438, -0.08750724792480469, -0.083282470703125, -0.07905769348144531, -0.07483291625976562, -0.07060813903808594, -0.06638336181640625, -0.06215858459472656, -0.057933807373046875, -0.05370903015136719, -0.0494842529296875, -0.04525947570800781, -0.041034698486328125, -0.03680992126464844, -0.03258514404296875, -0.028360366821289062, -0.024135589599609375, -0.019910812377929688, -0.01568603515625, -0.011461257934570312, -0.007236480712890625, -0.0030117034912109375, 0.00121307373046875, 0.0054378509521484375, 0.009662628173828125, 0.013887405395507812, 0.0181121826171875, 0.022336959838867188, 0.026561737060546875, 0.030786514282226562, 0.03501129150390625, 0.03923606872558594, 0.043460845947265625, 0.04768562316894531, 0.051910400390625, 0.05613517761230469, 0.060359954833984375, 0.06458473205566406, 0.06880950927734375, 0.07303428649902344, 0.07725906372070312, 0.08148384094238281, 0.0857086181640625, 0.08993339538574219, 0.09415817260742188, 0.09838294982910156, 0.10260772705078125, 0.10683250427246094, 0.11105728149414062, 0.11528205871582031, 0.1195068359375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 1.0, 3.0, 4.0, 10.0, 15.0, 12.0, 22.0, 22.0, 29.0, 44.0, 41.0, 97.0, 107.0, 213.0, 441.0, 1249.0, 5551.0, 37811.0, 715767.0, 263285.0, 18900.0, 3208.0, 797.0, 357.0, 173.0, 107.0, 93.0, 53.0, 42.0, 24.0, 22.0, 16.0, 9.0, 4.0, 6.0, 5.0, 4.0, 2.0, 8.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.1610107421875, -0.1562519073486328, -0.15149307250976562, -0.14673423767089844, -0.14197540283203125, -0.13721656799316406, -0.13245773315429688, -0.1276988983154297, -0.1229400634765625, -0.11818122863769531, -0.11342239379882812, -0.10866355895996094, -0.10390472412109375, -0.09914588928222656, -0.09438705444335938, -0.08962821960449219, -0.084869384765625, -0.08011054992675781, -0.07535171508789062, -0.07059288024902344, -0.06583404541015625, -0.06107521057128906, -0.056316375732421875, -0.05155754089355469, -0.0467987060546875, -0.04203987121582031, -0.037281036376953125, -0.03252220153808594, -0.02776336669921875, -0.023004531860351562, -0.018245697021484375, -0.013486862182617188, -0.00872802734375, -0.0039691925048828125, 0.000789642333984375, 0.0055484771728515625, 0.01030731201171875, 0.015066146850585938, 0.019824981689453125, 0.024583816528320312, 0.0293426513671875, 0.03410148620605469, 0.038860321044921875, 0.04361915588378906, 0.04837799072265625, 0.05313682556152344, 0.057895660400390625, 0.06265449523925781, 0.067413330078125, 0.07217216491699219, 0.07693099975585938, 0.08168983459472656, 0.08644866943359375, 0.09120750427246094, 0.09596633911132812, 0.10072517395019531, 0.1054840087890625, 0.11024284362792969, 0.11500167846679688, 0.11976051330566406, 0.12451934814453125, 0.12927818298339844, 0.13403701782226562, 0.1387958526611328, 0.1435546875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 4.0, 7.0, 4.0, 6.0, 9.0, 8.0, 11.0, 15.0, 16.0, 19.0, 33.0, 24.0, 41.0, 32.0, 28.0, 42.0, 35.0, 40.0, 46.0, 55.0, 53.0, 56.0, 43.0, 49.0, 30.0, 44.0, 21.0, 29.0, 27.0, 30.0, 28.0, 23.0, 16.0, 13.0, 14.0, 9.0, 3.0, 9.0, 11.0, 6.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1373291015625, -0.1331806182861328, -0.12903213500976562, -0.12488365173339844, -0.12073516845703125, -0.11658668518066406, -0.11243820190429688, -0.10828971862792969, -0.1041412353515625, -0.09999275207519531, -0.09584426879882812, -0.09169578552246094, -0.08754730224609375, -0.08339881896972656, -0.07925033569335938, -0.07510185241699219, -0.070953369140625, -0.06680488586425781, -0.06265640258789062, -0.05850791931152344, -0.05435943603515625, -0.05021095275878906, -0.046062469482421875, -0.04191398620605469, -0.0377655029296875, -0.03361701965332031, -0.029468536376953125, -0.025320053100585938, -0.02117156982421875, -0.017023086547851562, -0.012874603271484375, -0.008726119995117188, -0.00457763671875, -0.0004291534423828125, 0.003719329833984375, 0.007867813110351562, 0.01201629638671875, 0.016164779663085938, 0.020313262939453125, 0.024461746215820312, 0.0286102294921875, 0.03275871276855469, 0.036907196044921875, 0.04105567932128906, 0.04520416259765625, 0.04935264587402344, 0.053501129150390625, 0.05764961242675781, 0.061798095703125, 0.06594657897949219, 0.07009506225585938, 0.07424354553222656, 0.07839202880859375, 0.08254051208496094, 0.08668899536132812, 0.09083747863769531, 0.0949859619140625, 0.09913444519042969, 0.10328292846679688, 0.10743141174316406, 0.11157989501953125, 0.11572837829589844, 0.11987686157226562, 0.12402534484863281, 0.128173828125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 4.0, 11.0, 12.0, 22.0, 23.0, 33.0, 54.0, 87.0, 228.0, 548.0, 2004.0, 14981.0, 418281.0, 589725.0, 19070.0, 2377.0, 591.0, 227.0, 102.0, 57.0, 43.0, 23.0, 16.0, 11.0, 8.0, 3.0, 6.0, 0.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0438232421875, -0.04236459732055664, -0.04090595245361328, -0.03944730758666992, -0.03798866271972656, -0.0365300178527832, -0.035071372985839844, -0.033612728118896484, -0.032154083251953125, -0.030695438385009766, -0.029236793518066406, -0.027778148651123047, -0.026319503784179688, -0.024860858917236328, -0.02340221405029297, -0.02194356918334961, -0.02048492431640625, -0.01902627944946289, -0.01756763458251953, -0.016108989715576172, -0.014650344848632812, -0.013191699981689453, -0.011733055114746094, -0.010274410247802734, -0.008815765380859375, -0.007357120513916016, -0.005898475646972656, -0.004439830780029297, -0.0029811859130859375, -0.0015225410461425781, -6.389617919921875e-05, 0.0013947486877441406, 0.0028533935546875, 0.004312038421630859, 0.005770683288574219, 0.007229328155517578, 0.008687973022460938, 0.010146617889404297, 0.011605262756347656, 0.013063907623291016, 0.014522552490234375, 0.015981197357177734, 0.017439842224121094, 0.018898487091064453, 0.020357131958007812, 0.021815776824951172, 0.02327442169189453, 0.02473306655883789, 0.02619171142578125, 0.02765035629272461, 0.02910900115966797, 0.030567646026611328, 0.03202629089355469, 0.03348493576049805, 0.034943580627441406, 0.036402225494384766, 0.037860870361328125, 0.039319515228271484, 0.040778160095214844, 0.0422368049621582, 0.04369544982910156, 0.04515409469604492, 0.04661273956298828, 0.04807138442993164, 0.049530029296875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 7.0, 9.0, 7.0, 13.0, 23.0, 9.0, 27.0, 44.0, 36.0, 50.0, 90.0, 79.0, 101.0, 119.0, 78.0, 101.0, 44.0, 41.0, 32.0, 27.0, 17.0, 15.0, 12.0, 8.0, 5.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.516674041748047e-06, -3.3760443329811096e-06, -3.2354146242141724e-06, -3.094784915447235e-06, -2.954155206680298e-06, -2.8135254979133606e-06, -2.6728957891464233e-06, -2.532266080379486e-06, -2.391636371612549e-06, -2.2510066628456116e-06, -2.1103769540786743e-06, -1.969747245311737e-06, -1.8291175365447998e-06, -1.6884878277778625e-06, -1.5478581190109253e-06, -1.407228410243988e-06, -1.2665987014770508e-06, -1.1259689927101135e-06, -9.853392839431763e-07, -8.44709575176239e-07, -7.040798664093018e-07, -5.634501576423645e-07, -4.2282044887542725e-07, -2.8219074010849e-07, -1.4156103134155273e-07, -9.313225746154785e-10, 1.3969838619232178e-07, 2.8032809495925903e-07, 4.209578037261963e-07, 5.615875124931335e-07, 7.022172212600708e-07, 8.428469300270081e-07, 9.834766387939453e-07, 1.1241063475608826e-06, 1.2647360563278198e-06, 1.405365765094757e-06, 1.5459954738616943e-06, 1.6866251826286316e-06, 1.8272548913955688e-06, 1.967884600162506e-06, 2.1085143089294434e-06, 2.2491440176963806e-06, 2.389773726463318e-06, 2.530403435230255e-06, 2.6710331439971924e-06, 2.8116628527641296e-06, 2.952292561531067e-06, 3.092922270298004e-06, 3.2335519790649414e-06, 3.3741816878318787e-06, 3.514811396598816e-06, 3.655441105365753e-06, 3.7960708141326904e-06, 3.936700522899628e-06, 4.077330231666565e-06, 4.217959940433502e-06, 4.3585896492004395e-06, 4.499219357967377e-06, 4.639849066734314e-06, 4.780478775501251e-06, 4.9211084842681885e-06, 5.061738193035126e-06, 5.202367901802063e-06, 5.342997610569e-06, 5.4836273193359375e-06]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 8.0, 6.0, 7.0, 4.0, 13.0, 19.0, 21.0, 17.0, 44.0, 128.0, 275.0, 872.0, 2779.0, 13770.0, 474735.0, 536802.0, 14894.0, 2765.0, 837.0, 297.0, 122.0, 48.0, 29.0, 14.0, 15.0, 10.0, 5.0, 4.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.057586669921875, -0.05572986602783203, -0.05387306213378906, -0.052016258239746094, -0.050159454345703125, -0.048302650451660156, -0.04644584655761719, -0.04458904266357422, -0.04273223876953125, -0.04087543487548828, -0.03901863098144531, -0.037161827087402344, -0.035305023193359375, -0.033448219299316406, -0.03159141540527344, -0.02973461151123047, -0.0278778076171875, -0.02602100372314453, -0.024164199829101562, -0.022307395935058594, -0.020450592041015625, -0.018593788146972656, -0.016736984252929688, -0.014880180358886719, -0.01302337646484375, -0.011166572570800781, -0.009309768676757812, -0.007452964782714844, -0.005596160888671875, -0.0037393569946289062, -0.0018825531005859375, -2.574920654296875e-05, 0.0018310546875, 0.0036878585815429688, 0.0055446624755859375, 0.007401466369628906, 0.009258270263671875, 0.011115074157714844, 0.012971878051757812, 0.014828681945800781, 0.01668548583984375, 0.01854228973388672, 0.020399093627929688, 0.022255897521972656, 0.024112701416015625, 0.025969505310058594, 0.027826309204101562, 0.02968311309814453, 0.0315399169921875, 0.03339672088623047, 0.03525352478027344, 0.037110328674316406, 0.038967132568359375, 0.040823936462402344, 0.04268074035644531, 0.04453754425048828, 0.04639434814453125, 0.04825115203857422, 0.05010795593261719, 0.051964759826660156, 0.053821563720703125, 0.055678367614746094, 0.05753517150878906, 0.05939197540283203, 0.061248779296875]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 6.0, 4.0, 5.0, 13.0, 15.0, 14.0, 27.0, 49.0, 60.0, 72.0, 118.0, 140.0, 143.0, 87.0, 79.0, 51.0, 39.0, 15.0, 17.0, 10.0, 2.0, 1.0, 3.0, 6.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0170440673828125, -0.01652050018310547, -0.015996932983398438, -0.015473365783691406, -0.014949798583984375, -0.014426231384277344, -0.013902664184570312, -0.013379096984863281, -0.01285552978515625, -0.012331962585449219, -0.011808395385742188, -0.011284828186035156, -0.010761260986328125, -0.010237693786621094, -0.009714126586914062, -0.009190559387207031, -0.0086669921875, -0.008143424987792969, -0.0076198577880859375, -0.007096290588378906, -0.006572723388671875, -0.006049156188964844, -0.0055255889892578125, -0.005002021789550781, -0.00447845458984375, -0.003954887390136719, -0.0034313201904296875, -0.0029077529907226562, -0.002384185791015625, -0.0018606185913085938, -0.0013370513916015625, -0.0008134841918945312, -0.0002899169921875, 0.00023365020751953125, 0.0007572174072265625, 0.0012807846069335938, 0.001804351806640625, 0.0023279190063476562, 0.0028514862060546875, 0.0033750534057617188, 0.00389862060546875, 0.004422187805175781, 0.0049457550048828125, 0.005469322204589844, 0.005992889404296875, 0.006516456604003906, 0.0070400238037109375, 0.007563591003417969, 0.008087158203125, 0.008610725402832031, 0.009134292602539062, 0.009657859802246094, 0.010181427001953125, 0.010704994201660156, 0.011228561401367188, 0.011752128601074219, 0.01227569580078125, 0.012799263000488281, 0.013322830200195312, 0.013846397399902344, 0.014369964599609375, 0.014893531799316406, 0.015417098999023438, 0.01594066619873047, 0.0164642333984375]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 27.0, 108.0, 352.0, 328.0, 146.0, 38.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2014520168304443, -1.1774336099624634, -1.1534150838851929, -1.129396677017212, -1.1053781509399414, -1.0813597440719604, -1.0573413372039795, -1.033322811126709, -1.009304404258728, -0.9852859377861023, -0.9612674713134766, -0.9372490644454956, -0.9132305979728699, -0.8892121315002441, -0.8651936650276184, -0.8411751985549927, -0.8171567916870117, -0.793138325214386, -0.7691198587417603, -0.7451014518737793, -0.7210829854011536, -0.6970645189285278, -0.6730460524559021, -0.6490275859832764, -0.6250091195106506, -0.6009906530380249, -0.5769721865653992, -0.5529537796974182, -0.5289353132247925, -0.5049168467521667, -0.480898380279541, -0.45687994360923767, -0.4328615367412567, -0.408843070268631, -0.38482463359832764, -0.3608061671257019, -0.33678773045539856, -0.3127692639827728, -0.2887508273124695, -0.26473236083984375, -0.2407139092683792, -0.21669545769691467, -0.19267700612545013, -0.1686585545539856, -0.14464008808135986, -0.12062164396047592, -0.09660318493843079, -0.07258473336696625, -0.04856628179550171, -0.02454782836139202, -0.0005293749272823334, 0.023489080369472504, 0.04750753194093704, 0.07152598351240158, 0.09554444253444672, 0.11956289410591125, 0.1435813456773758, 0.16759979724884033, 0.19161824882030487, 0.2156367003917694, 0.23965516686439514, 0.2636736035346985, 0.2876920700073242, 0.31171053647994995, 0.3357289731502533]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 5.0, 6.0, 4.0, 5.0, 15.0, 9.0, 14.0, 18.0, 29.0, 22.0, 27.0, 22.0, 30.0, 30.0, 41.0, 53.0, 41.0, 49.0, 42.0, 49.0, 54.0, 48.0, 44.0, 44.0, 42.0, 37.0, 33.0, 24.0, 29.0, 32.0, 27.0, 18.0, 18.0, 10.0, 12.0, 8.0, 7.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.23862014710903168, -0.23129092156887054, -0.2239616960287094, -0.21663247048854828, -0.20930324494838715, -0.20197400450706482, -0.1946447789669037, -0.18731555342674255, -0.17998632788658142, -0.1726571023464203, -0.16532787680625916, -0.15799865126609802, -0.1506694257259369, -0.14334020018577576, -0.13601097464561462, -0.1286817342042923, -0.12135251611471176, -0.11402329057455063, -0.1066940650343895, -0.09936483204364777, -0.09203560650348663, -0.0847063809633255, -0.07737715542316437, -0.07004792988300323, -0.0627187043428421, -0.05538947880268097, -0.04806024953722954, -0.040731023997068405, -0.033401794731616974, -0.02607256919145584, -0.018743343651294708, -0.011414114385843277, -0.004084885120391846, 0.003244341816753149, 0.010573568753898144, 0.01790279522538185, 0.025232022628188133, 0.032561250030994415, 0.03989047557115555, 0.04721970483660698, 0.05454893037676811, 0.061878155916929245, 0.06920738518238068, 0.07653661072254181, 0.08386583626270294, 0.09119506180286407, 0.09852428734302521, 0.10585352033376694, 0.11318274587392807, 0.1205119714140892, 0.12784120440483093, 0.13517042994499207, 0.1424996554851532, 0.14982888102531433, 0.15715810656547546, 0.1644873321056366, 0.17181655764579773, 0.17914578318595886, 0.18647500872612, 0.19380423426628113, 0.20113345980644226, 0.2084626853466034, 0.21579191088676453, 0.22312115132808685, 0.23045037686824799]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 11.0, 9.0, 13.0, 15.0, 23.0, 31.0, 27.0, 60.0, 93.0, 129.0, 245.0, 458.0, 932.0, 2012.0, 4507.0, 12198.0, 54653.0, 1149307.0, 2792097.0, 146474.0, 19365.0, 6480.0, 2542.0, 1209.0, 558.0, 298.0, 167.0, 108.0, 63.0, 49.0, 34.0, 23.0, 19.0, 16.0, 10.0, 8.0, 9.0, 4.0, 4.0, 4.0, 6.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1455078125, -0.1406879425048828, -0.13586807250976562, -0.13104820251464844, -0.12622833251953125, -0.12140846252441406, -0.11658859252929688, -0.11176872253417969, -0.1069488525390625, -0.10212898254394531, -0.09730911254882812, -0.09248924255371094, -0.08766937255859375, -0.08284950256347656, -0.07802963256835938, -0.07320976257324219, -0.068389892578125, -0.06357002258300781, -0.058750152587890625, -0.05393028259277344, -0.04911041259765625, -0.04429054260253906, -0.039470672607421875, -0.03465080261230469, -0.0298309326171875, -0.025011062622070312, -0.020191192626953125, -0.015371322631835938, -0.01055145263671875, -0.0057315826416015625, -0.000911712646484375, 0.0039081573486328125, 0.00872802734375, 0.013547897338867188, 0.018367767333984375, 0.023187637329101562, 0.02800750732421875, 0.03282737731933594, 0.037647247314453125, 0.04246711730957031, 0.0472869873046875, 0.05210685729980469, 0.056926727294921875, 0.06174659729003906, 0.06656646728515625, 0.07138633728027344, 0.07620620727539062, 0.08102607727050781, 0.085845947265625, 0.09066581726074219, 0.09548568725585938, 0.10030555725097656, 0.10512542724609375, 0.10994529724121094, 0.11476516723632812, 0.11958503723144531, 0.1244049072265625, 0.1292247772216797, 0.13404464721679688, 0.13886451721191406, 0.14368438720703125, 0.14850425720214844, 0.15332412719726562, 0.1581439971923828, 0.1629638671875]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 3.0, 7.0, 6.0, 8.0, 8.0, 4.0, 6.0, 14.0, 18.0, 21.0, 22.0, 28.0, 24.0, 20.0, 42.0, 48.0, 36.0, 55.0, 46.0, 52.0, 55.0, 56.0, 44.0, 40.0, 43.0, 43.0, 37.0, 24.0, 30.0, 31.0, 20.0, 23.0, 19.0, 24.0, 13.0, 8.0, 7.0, 9.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06585693359375, -0.06384086608886719, -0.061824798583984375, -0.05980873107910156, -0.05779266357421875, -0.05577659606933594, -0.053760528564453125, -0.05174446105957031, -0.0497283935546875, -0.04771232604980469, -0.045696258544921875, -0.04368019104003906, -0.04166412353515625, -0.03964805603027344, -0.037631988525390625, -0.03561592102050781, -0.033599853515625, -0.03158378601074219, -0.029567718505859375, -0.027551651000976562, -0.02553558349609375, -0.023519515991210938, -0.021503448486328125, -0.019487380981445312, -0.0174713134765625, -0.015455245971679688, -0.013439178466796875, -0.011423110961914062, -0.00940704345703125, -0.0073909759521484375, -0.005374908447265625, -0.0033588409423828125, -0.0013427734375, 0.0006732940673828125, 0.002689361572265625, 0.0047054290771484375, 0.00672149658203125, 0.008737564086914062, 0.010753631591796875, 0.012769699096679688, 0.0147857666015625, 0.016801834106445312, 0.018817901611328125, 0.020833969116210938, 0.02285003662109375, 0.024866104125976562, 0.026882171630859375, 0.028898239135742188, 0.030914306640625, 0.03293037414550781, 0.034946441650390625, 0.03696250915527344, 0.03897857666015625, 0.04099464416503906, 0.043010711669921875, 0.04502677917480469, 0.0470428466796875, 0.04905891418457031, 0.051074981689453125, 0.05309104919433594, 0.05510711669921875, 0.05712318420410156, 0.059139251708984375, 0.06115531921386719, 0.06317138671875]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 8.0, 7.0, 14.0, 18.0, 24.0, 50.0, 59.0, 111.0, 209.0, 498.0, 1689.0, 8866.0, 110193.0, 3951781.0, 109228.0, 8790.0, 1731.0, 505.0, 206.0, 94.0, 65.0, 46.0, 25.0, 21.0, 9.0, 10.0, 4.0, 9.0, 0.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.295166015625, -0.2854881286621094, -0.27581024169921875, -0.2661323547363281, -0.2564544677734375, -0.24677658081054688, -0.23709869384765625, -0.22742080688476562, -0.217742919921875, -0.20806503295898438, -0.19838714599609375, -0.18870925903320312, -0.1790313720703125, -0.16935348510742188, -0.15967559814453125, -0.14999771118164062, -0.14031982421875, -0.13064193725585938, -0.12096405029296875, -0.11128616333007812, -0.1016082763671875, -0.09193038940429688, -0.08225250244140625, -0.07257461547851562, -0.062896728515625, -0.053218841552734375, -0.04354095458984375, -0.033863067626953125, -0.0241851806640625, -0.014507293701171875, -0.00482940673828125, 0.004848480224609375, 0.0145263671875, 0.024204254150390625, 0.03388214111328125, 0.043560028076171875, 0.0532379150390625, 0.06291580200195312, 0.07259368896484375, 0.08227157592773438, 0.091949462890625, 0.10162734985351562, 0.11130523681640625, 0.12098312377929688, 0.1306610107421875, 0.14033889770507812, 0.15001678466796875, 0.15969467163085938, 0.16937255859375, 0.17905044555664062, 0.18872833251953125, 0.19840621948242188, 0.2080841064453125, 0.21776199340820312, 0.22743988037109375, 0.23711776733398438, 0.246795654296875, 0.2564735412597656, 0.26615142822265625, 0.2758293151855469, 0.2855072021484375, 0.2951850891113281, 0.30486297607421875, 0.3145408630371094, 0.32421875]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 6.0, 6.0, 7.0, 8.0, 14.0, 23.0, 15.0, 34.0, 39.0, 48.0, 84.0, 120.0, 198.0, 348.0, 526.0, 732.0, 648.0, 422.0, 275.0, 158.0, 81.0, 77.0, 55.0, 40.0, 27.0, 18.0, 13.0, 13.0, 7.0, 11.0, 7.0, 8.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.052947998046875, -0.05154561996459961, -0.05014324188232422, -0.04874086380004883, -0.04733848571777344, -0.04593610763549805, -0.044533729553222656, -0.043131351470947266, -0.041728973388671875, -0.040326595306396484, -0.038924217224121094, -0.0375218391418457, -0.03611946105957031, -0.03471708297729492, -0.03331470489501953, -0.03191232681274414, -0.03050994873046875, -0.02910757064819336, -0.02770519256591797, -0.026302814483642578, -0.024900436401367188, -0.023498058319091797, -0.022095680236816406, -0.020693302154541016, -0.019290924072265625, -0.017888545989990234, -0.016486167907714844, -0.015083789825439453, -0.013681411743164062, -0.012279033660888672, -0.010876655578613281, -0.00947427749633789, -0.0080718994140625, -0.006669521331787109, -0.005267143249511719, -0.003864765167236328, -0.0024623870849609375, -0.0010600090026855469, 0.00034236907958984375, 0.0017447471618652344, 0.003147125244140625, 0.004549503326416016, 0.005951881408691406, 0.007354259490966797, 0.008756637573242188, 0.010159015655517578, 0.011561393737792969, 0.01296377182006836, 0.01436614990234375, 0.01576852798461914, 0.01717090606689453, 0.018573284149169922, 0.019975662231445312, 0.021378040313720703, 0.022780418395996094, 0.024182796478271484, 0.025585174560546875, 0.026987552642822266, 0.028389930725097656, 0.029792308807373047, 0.031194686889648438, 0.03259706497192383, 0.03399944305419922, 0.03540182113647461, 0.03680419921875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 4.0, 1.0, 5.0, 10.0, 7.0, 9.0, 7.0, 13.0, 15.0, 22.0, 26.0, 32.0, 34.0, 41.0, 50.0, 55.0, 48.0, 56.0, 64.0, 69.0, 51.0, 54.0, 54.0, 43.0, 36.0, 49.0, 27.0, 19.0, 20.0, 17.0, 8.0, 10.0, 8.0, 5.0, 11.0, 5.0, 2.0, 4.0, 2.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.1027679517865181, -0.09981711208820343, -0.09686627238988876, -0.0939154252409935, -0.09096458554267883, -0.08801374584436417, -0.0850629061460495, -0.08211205899715424, -0.07916121929883957, -0.0762103796005249, -0.07325953990221024, -0.07030869275331497, -0.0673578530550003, -0.06440701335668564, -0.06145617365837097, -0.058505330234766006, -0.05555449053645134, -0.05260365083813667, -0.04965280741453171, -0.04670196771621704, -0.043751124292612076, -0.04080028459429741, -0.037849441170692444, -0.03489860147237778, -0.03194776177406311, -0.028996920213103294, -0.02604607865214348, -0.02309523895382881, -0.020144395530223846, -0.01719355583190918, -0.014242714270949364, -0.011291872709989548, -0.008341029286384583, -0.0053901877254247665, -0.002439346630126238, 0.0005114944651722908, 0.0034623360261321068, 0.006413177587091923, 0.009364018216729164, 0.01231485977768898, 0.015265701338648796, 0.018216542899608612, 0.021167384460568428, 0.024118226021528244, 0.02706906571984291, 0.030019909143447876, 0.03297074884176254, 0.03592158854007721, 0.038872431963682175, 0.04182327166199684, 0.04477411508560181, 0.04772495478391647, 0.05067579820752144, 0.053626637905836105, 0.05657748132944107, 0.05952832102775574, 0.062479160726070404, 0.06543000042438507, 0.06838084012269974, 0.071331687271595, 0.07428252696990967, 0.07723336666822433, 0.080184206366539, 0.08313505351543427, 0.08608589321374893]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 4.0, 3.0, 14.0, 7.0, 12.0, 7.0, 17.0, 20.0, 11.0, 26.0, 31.0, 22.0, 26.0, 33.0, 33.0, 38.0, 44.0, 44.0, 54.0, 54.0, 41.0, 44.0, 40.0, 46.0, 46.0, 35.0, 42.0, 27.0, 34.0, 19.0, 20.0, 14.0, 11.0, 19.0, 20.0, 12.0, 10.0, 10.0, 5.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.085527203977108, -0.08281069993972778, -0.08009420335292816, -0.07737770676612854, -0.07466120272874832, -0.0719446986913681, -0.06922820210456848, -0.06651170551776886, -0.06379520148038864, -0.06107870116829872, -0.0583622008562088, -0.05564570054411888, -0.05292920023202896, -0.05021269991993904, -0.04749619960784912, -0.0447796992957592, -0.04206319898366928, -0.03934669867157936, -0.03663019835948944, -0.03391369804739952, -0.0311971977353096, -0.02848069742321968, -0.02576419711112976, -0.02304769679903984, -0.02033119648694992, -0.01761469617486, -0.01489819586277008, -0.01218169555068016, -0.00946519523859024, -0.0067486949265003204, -0.0040321946144104, -0.0013156943023204803, 0.0014008134603500366, 0.004117313772439957, 0.006833814084529877, 0.009550314396619797, 0.012266814708709717, 0.014983315020799637, 0.017699815332889557, 0.020416315644979477, 0.023132815957069397, 0.025849316269159317, 0.028565816581249237, 0.03128231689333916, 0.03399881720542908, 0.036715317517519, 0.03943181782960892, 0.04214831814169884, 0.04486481845378876, 0.04758131876587868, 0.0502978190779686, 0.05301431939005852, 0.05573081970214844, 0.05844732001423836, 0.06116382032632828, 0.0638803243637085, 0.06659682095050812, 0.06931331753730774, 0.07202982157468796, 0.07474632561206818, 0.0774628221988678, 0.08017931878566742, 0.08289582282304764, 0.08561232686042786, 0.08832882344722748]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 10.0, 15.0, 10.0, 23.0, 34.0, 35.0, 61.0, 107.0, 153.0, 246.0, 392.0, 724.0, 1259.0, 2242.0, 4099.0, 8658.0, 23162.0, 127062.0, 655597.0, 176433.0, 28087.0, 9813.0, 4582.0, 2463.0, 1313.0, 757.0, 436.0, 303.0, 173.0, 103.0, 78.0, 43.0, 23.0, 30.0, 10.0, 8.0, 8.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03851318359375, -0.037210941314697266, -0.03590869903564453, -0.0346064567565918, -0.03330421447753906, -0.03200197219848633, -0.030699729919433594, -0.02939748764038086, -0.028095245361328125, -0.02679300308227539, -0.025490760803222656, -0.024188518524169922, -0.022886276245117188, -0.021584033966064453, -0.02028179168701172, -0.018979549407958984, -0.01767730712890625, -0.016375064849853516, -0.015072822570800781, -0.013770580291748047, -0.012468338012695312, -0.011166095733642578, -0.009863853454589844, -0.00856161117553711, -0.007259368896484375, -0.005957126617431641, -0.004654884338378906, -0.003352642059326172, -0.0020503997802734375, -0.0007481575012207031, 0.0005540847778320312, 0.0018563270568847656, 0.0031585693359375, 0.004460811614990234, 0.005763053894042969, 0.007065296173095703, 0.008367538452148438, 0.009669780731201172, 0.010972023010253906, 0.01227426528930664, 0.013576507568359375, 0.01487874984741211, 0.016180992126464844, 0.017483234405517578, 0.018785476684570312, 0.020087718963623047, 0.02138996124267578, 0.022692203521728516, 0.02399444580078125, 0.025296688079833984, 0.02659893035888672, 0.027901172637939453, 0.029203414916992188, 0.030505657196044922, 0.031807899475097656, 0.03311014175415039, 0.034412384033203125, 0.03571462631225586, 0.037016868591308594, 0.03831911087036133, 0.03962135314941406, 0.0409235954284668, 0.04222583770751953, 0.043528079986572266, 0.044830322265625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 6.0, 3.0, 8.0, 2.0, 11.0, 9.0, 17.0, 14.0, 21.0, 29.0, 26.0, 29.0, 40.0, 33.0, 39.0, 54.0, 39.0, 45.0, 62.0, 52.0, 63.0, 45.0, 40.0, 49.0, 41.0, 39.0, 26.0, 23.0, 31.0, 26.0, 13.0, 15.0, 11.0, 16.0, 11.0, 9.0, 6.0, 6.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06646728515625, -0.0644845962524414, -0.06250190734863281, -0.06051921844482422, -0.058536529541015625, -0.05655384063720703, -0.05457115173339844, -0.052588462829589844, -0.05060577392578125, -0.048623085021972656, -0.04664039611816406, -0.04465770721435547, -0.042675018310546875, -0.04069232940673828, -0.03870964050292969, -0.036726951599121094, -0.0347442626953125, -0.032761573791503906, -0.030778884887695312, -0.02879619598388672, -0.026813507080078125, -0.02483081817626953, -0.022848129272460938, -0.020865440368652344, -0.01888275146484375, -0.016900062561035156, -0.014917373657226562, -0.012934684753417969, -0.010951995849609375, -0.008969306945800781, -0.0069866180419921875, -0.005003929138183594, -0.003021240234375, -0.0010385513305664062, 0.0009441375732421875, 0.0029268264770507812, 0.004909515380859375, 0.006892204284667969, 0.008874893188476562, 0.010857582092285156, 0.01284027099609375, 0.014822959899902344, 0.016805648803710938, 0.01878833770751953, 0.020771026611328125, 0.02275371551513672, 0.024736404418945312, 0.026719093322753906, 0.0287017822265625, 0.030684471130371094, 0.03266716003417969, 0.03464984893798828, 0.036632537841796875, 0.03861522674560547, 0.04059791564941406, 0.042580604553222656, 0.04456329345703125, 0.046545982360839844, 0.04852867126464844, 0.05051136016845703, 0.052494049072265625, 0.05447673797607422, 0.05645942687988281, 0.058442115783691406, 0.0604248046875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 4.0, 2.0, 7.0, 7.0, 10.0, 11.0, 14.0, 18.0, 28.0, 33.0, 56.0, 99.0, 198.0, 379.0, 821.0, 2308.0, 7341.0, 33551.0, 333778.0, 594582.0, 59167.0, 10872.0, 3152.0, 1111.0, 464.0, 228.0, 92.0, 74.0, 49.0, 26.0, 20.0, 16.0, 7.0, 7.0, 8.0, 5.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037200927734375, -0.035924434661865234, -0.03464794158935547, -0.0333714485168457, -0.03209495544433594, -0.030818462371826172, -0.029541969299316406, -0.02826547622680664, -0.026988983154296875, -0.02571249008178711, -0.024435997009277344, -0.023159503936767578, -0.021883010864257812, -0.020606517791748047, -0.01933002471923828, -0.018053531646728516, -0.01677703857421875, -0.015500545501708984, -0.014224052429199219, -0.012947559356689453, -0.011671066284179688, -0.010394573211669922, -0.009118080139160156, -0.00784158706665039, -0.006565093994140625, -0.005288600921630859, -0.004012107849121094, -0.002735614776611328, -0.0014591217041015625, -0.00018262863159179688, 0.0010938644409179688, 0.0023703575134277344, 0.0036468505859375, 0.004923343658447266, 0.006199836730957031, 0.007476329803466797, 0.008752822875976562, 0.010029315948486328, 0.011305809020996094, 0.01258230209350586, 0.013858795166015625, 0.01513528823852539, 0.016411781311035156, 0.017688274383544922, 0.018964767456054688, 0.020241260528564453, 0.02151775360107422, 0.022794246673583984, 0.02407073974609375, 0.025347232818603516, 0.02662372589111328, 0.027900218963623047, 0.029176712036132812, 0.030453205108642578, 0.031729698181152344, 0.03300619125366211, 0.034282684326171875, 0.03555917739868164, 0.036835670471191406, 0.03811216354370117, 0.03938865661621094, 0.0406651496887207, 0.04194164276123047, 0.043218135833740234, 0.04449462890625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 3.0, 5.0, 10.0, 7.0, 15.0, 23.0, 15.0, 21.0, 26.0, 26.0, 32.0, 31.0, 39.0, 34.0, 28.0, 47.0, 54.0, 37.0, 45.0, 52.0, 34.0, 50.0, 41.0, 62.0, 31.0, 26.0, 28.0, 28.0, 19.0, 14.0, 27.0, 21.0, 15.0, 9.0, 8.0, 8.0, 4.0, 5.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.137451171875, -0.13332176208496094, -0.12919235229492188, -0.1250629425048828, -0.12093353271484375, -0.11680412292480469, -0.11267471313476562, -0.10854530334472656, -0.1044158935546875, -0.10028648376464844, -0.09615707397460938, -0.09202766418457031, -0.08789825439453125, -0.08376884460449219, -0.07963943481445312, -0.07551002502441406, -0.071380615234375, -0.06725120544433594, -0.06312179565429688, -0.05899238586425781, -0.05486297607421875, -0.05073356628417969, -0.046604156494140625, -0.04247474670410156, -0.0383453369140625, -0.03421592712402344, -0.030086517333984375, -0.025957107543945312, -0.02182769775390625, -0.017698287963867188, -0.013568878173828125, -0.009439468383789062, -0.00531005859375, -0.0011806488037109375, 0.002948760986328125, 0.0070781707763671875, 0.01120758056640625, 0.015336990356445312, 0.019466400146484375, 0.023595809936523438, 0.0277252197265625, 0.03185462951660156, 0.035984039306640625, 0.04011344909667969, 0.04424285888671875, 0.04837226867675781, 0.052501678466796875, 0.05663108825683594, 0.060760498046875, 0.06488990783691406, 0.06901931762695312, 0.07314872741699219, 0.07727813720703125, 0.08140754699707031, 0.08553695678710938, 0.08966636657714844, 0.0937957763671875, 0.09792518615722656, 0.10205459594726562, 0.10618400573730469, 0.11031341552734375, 0.11444282531738281, 0.11857223510742188, 0.12270164489746094, 0.1268310546875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 7.0, 6.0, 7.0, 22.0, 40.0, 50.0, 85.0, 143.0, 368.0, 873.0, 2530.0, 11345.0, 136673.0, 811649.0, 73422.0, 8055.0, 1962.0, 688.0, 295.0, 149.0, 71.0, 45.0, 20.0, 16.0, 9.0, 7.0, 6.0, 2.0, 3.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0173187255859375, -0.01663684844970703, -0.015954971313476562, -0.015273094177246094, -0.014591217041015625, -0.013909339904785156, -0.013227462768554688, -0.012545585632324219, -0.01186370849609375, -0.011181831359863281, -0.010499954223632812, -0.009818077087402344, -0.009136199951171875, -0.008454322814941406, -0.0077724456787109375, -0.007090568542480469, -0.00640869140625, -0.005726814270019531, -0.0050449371337890625, -0.004363059997558594, -0.003681182861328125, -0.0029993057250976562, -0.0023174285888671875, -0.0016355514526367188, -0.00095367431640625, -0.00027179718017578125, 0.0004100799560546875, 0.0010919570922851562, 0.001773834228515625, 0.0024557113647460938, 0.0031375885009765625, 0.0038194656372070312, 0.0045013427734375, 0.005183219909667969, 0.0058650970458984375, 0.006546974182128906, 0.007228851318359375, 0.007910728454589844, 0.008592605590820312, 0.009274482727050781, 0.00995635986328125, 0.010638236999511719, 0.011320114135742188, 0.012001991271972656, 0.012683868408203125, 0.013365745544433594, 0.014047622680664062, 0.014729499816894531, 0.015411376953125, 0.01609325408935547, 0.016775131225585938, 0.017457008361816406, 0.018138885498046875, 0.018820762634277344, 0.019502639770507812, 0.02018451690673828, 0.02086639404296875, 0.02154827117919922, 0.022230148315429688, 0.022912025451660156, 0.023593902587890625, 0.024275779724121094, 0.024957656860351562, 0.02563953399658203, 0.0263214111328125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 6.0, 8.0, 18.0, 22.0, 37.0, 51.0, 71.0, 118.0, 135.0, 145.0, 110.0, 112.0, 67.0, 43.0, 18.0, 14.0, 11.0, 2.0, 5.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.59634780883789e-06, -9.299255907535553e-06, -9.002164006233215e-06, -8.705072104930878e-06, -8.40798020362854e-06, -8.110888302326202e-06, -7.813796401023865e-06, -7.516704499721527e-06, -7.2196125984191895e-06, -6.922520697116852e-06, -6.625428795814514e-06, -6.3283368945121765e-06, -6.031244993209839e-06, -5.734153091907501e-06, -5.4370611906051636e-06, -5.139969289302826e-06, -4.842877388000488e-06, -4.545785486698151e-06, -4.248693585395813e-06, -3.951601684093475e-06, -3.6545097827911377e-06, -3.3574178814888e-06, -3.0603259801864624e-06, -2.7632340788841248e-06, -2.466142177581787e-06, -2.1690502762794495e-06, -1.8719583749771118e-06, -1.5748664736747742e-06, -1.2777745723724365e-06, -9.806826710700989e-07, -6.835907697677612e-07, -3.864988684654236e-07, -8.940696716308594e-08, 2.076849341392517e-07, 5.047768354415894e-07, 8.01868736743927e-07, 1.0989606380462646e-06, 1.3960525393486023e-06, 1.69314444065094e-06, 1.9902363419532776e-06, 2.2873282432556152e-06, 2.584420144557953e-06, 2.8815120458602905e-06, 3.178603947162628e-06, 3.475695848464966e-06, 3.7727877497673035e-06, 4.069879651069641e-06, 4.366971552371979e-06, 4.664063453674316e-06, 4.961155354976654e-06, 5.258247256278992e-06, 5.555339157581329e-06, 5.852431058883667e-06, 6.149522960186005e-06, 6.446614861488342e-06, 6.74370676279068e-06, 7.040798664093018e-06, 7.337890565395355e-06, 7.634982466697693e-06, 7.93207436800003e-06, 8.229166269302368e-06, 8.526258170604706e-06, 8.823350071907043e-06, 9.120441973209381e-06, 9.417533874511719e-06]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 6.0, 3.0, 7.0, 5.0, 13.0, 7.0, 27.0, 26.0, 36.0, 49.0, 68.0, 95.0, 132.0, 197.0, 288.0, 444.0, 621.0, 1023.0, 1838.0, 3003.0, 5599.0, 11208.0, 23930.0, 55666.0, 134985.0, 275806.0, 281411.0, 141066.0, 59268.0, 25609.0, 11906.0, 5947.0, 3194.0, 1860.0, 1099.0, 667.0, 456.0, 296.0, 182.0, 137.0, 102.0, 73.0, 54.0, 40.0, 32.0, 17.0, 20.0, 17.0, 12.0, 6.0, 4.0, 2.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.00681304931640625, -0.0066002607345581055, -0.006387472152709961, -0.006174683570861816, -0.005961894989013672, -0.005749106407165527, -0.005536317825317383, -0.005323529243469238, -0.005110740661621094, -0.004897952079772949, -0.004685163497924805, -0.00447237491607666, -0.004259586334228516, -0.004046797752380371, -0.0038340091705322266, -0.003621220588684082, -0.0034084320068359375, -0.003195643424987793, -0.0029828548431396484, -0.002770066261291504, -0.0025572776794433594, -0.002344489097595215, -0.0021317005157470703, -0.0019189119338989258, -0.0017061233520507812, -0.0014933347702026367, -0.0012805461883544922, -0.0010677576065063477, -0.0008549690246582031, -0.0006421804428100586, -0.00042939186096191406, -0.00021660327911376953, -3.814697265625e-06, 0.00020897388458251953, 0.00042176246643066406, 0.0006345510482788086, 0.0008473396301269531, 0.0010601282119750977, 0.0012729167938232422, 0.0014857053756713867, 0.0016984939575195312, 0.0019112825393676758, 0.0021240711212158203, 0.002336859703063965, 0.0025496482849121094, 0.002762436866760254, 0.0029752254486083984, 0.003188014030456543, 0.0034008026123046875, 0.003613591194152832, 0.0038263797760009766, 0.004039168357849121, 0.004251956939697266, 0.00446474552154541, 0.004677534103393555, 0.004890322685241699, 0.005103111267089844, 0.005315899848937988, 0.005528688430786133, 0.005741477012634277, 0.005954265594482422, 0.006167054176330566, 0.006379842758178711, 0.0065926313400268555, 0.006805419921875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 1.0, 4.0, 1.0, 4.0, 2.0, 2.0, 3.0, 15.0, 6.0, 11.0, 13.0, 16.0, 23.0, 18.0, 27.0, 36.0, 51.0, 58.0, 57.0, 65.0, 50.0, 56.0, 57.0, 60.0, 61.0, 44.0, 43.0, 52.0, 30.0, 19.0, 24.0, 19.0, 16.0, 12.0, 6.0, 12.0, 6.0, 6.0, 8.0, 0.0, 4.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.002399444580078125, -0.002327144145965576, -0.0022548437118530273, -0.0021825432777404785, -0.0021102428436279297, -0.002037942409515381, -0.001965641975402832, -0.0018933415412902832, -0.0018210411071777344, -0.0017487406730651855, -0.0016764402389526367, -0.0016041398048400879, -0.001531839370727539, -0.0014595389366149902, -0.0013872385025024414, -0.0013149380683898926, -0.0012426376342773438, -0.001170337200164795, -0.001098036766052246, -0.0010257363319396973, -0.0009534358978271484, -0.0008811354637145996, -0.0008088350296020508, -0.000736534595489502, -0.0006642341613769531, -0.0005919337272644043, -0.0005196332931518555, -0.00044733285903930664, -0.0003750324249267578, -0.000302731990814209, -0.00023043155670166016, -0.00015813112258911133, -8.58306884765625e-05, -1.3530254364013672e-05, 5.8770179748535156e-05, 0.00013107061386108398, 0.0002033710479736328, 0.00027567148208618164, 0.00034797191619873047, 0.0004202723503112793, 0.0004925727844238281, 0.000564873218536377, 0.0006371736526489258, 0.0007094740867614746, 0.0007817745208740234, 0.0008540749549865723, 0.0009263753890991211, 0.00099867582321167, 0.0010709762573242188, 0.0011432766914367676, 0.0012155771255493164, 0.0012878775596618652, 0.001360177993774414, 0.0014324784278869629, 0.0015047788619995117, 0.0015770792961120605, 0.0016493797302246094, 0.0017216801643371582, 0.001793980598449707, 0.0018662810325622559, 0.0019385814666748047, 0.0020108819007873535, 0.0020831823348999023, 0.002155482769012451, 0.002227783203125]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 3.0, 1.0, 4.0, 5.0, 2.0, 2.0, 5.0, 6.0, 7.0, 5.0, 19.0, 18.0, 23.0, 22.0, 35.0, 29.0, 31.0, 43.0, 56.0, 50.0, 49.0, 63.0, 52.0, 59.0, 50.0, 41.0, 39.0, 46.0, 40.0, 30.0, 33.0, 17.0, 21.0, 13.0, 15.0, 7.0, 4.0, 13.0, 8.0, 8.0, 5.0, 7.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.05102512985467911, -0.04939844086766243, -0.04777175560593605, -0.04614506661891937, -0.044518377631902695, -0.042891692370176315, -0.04126500338315964, -0.03963831812143326, -0.03801162913441658, -0.0363849401473999, -0.03475825488567352, -0.033131565898656845, -0.03150487691164017, -0.029878191649913788, -0.02825150266289711, -0.02662481553852558, -0.024998126551508904, -0.023371439427137375, -0.021744750440120697, -0.02011806331574917, -0.01849137619137764, -0.016864687204360962, -0.015238000079989433, -0.013611312955617905, -0.011984624899923801, -0.010357936844229698, -0.00873124971985817, -0.007104561664164066, -0.00547787407413125, -0.0038511864840984344, -0.002224498428404331, -0.0005978113040328026, 0.0010288767516613007, 0.0026555643416941166, 0.0042822519317269325, 0.005908939987421036, 0.007535627577453852, 0.009162315167486668, 0.010789003223180771, 0.0124156903475523, 0.014042378403246403, 0.015669066458940506, 0.017295753583312035, 0.018922440707683563, 0.02054912969470024, 0.02217581681907177, 0.0238025039434433, 0.025429192930459976, 0.027055880054831505, 0.028682567179203033, 0.03030925616621971, 0.03193594515323639, 0.03356263041496277, 0.035189319401979446, 0.036816008388996124, 0.038442693650722504, 0.04006938263773918, 0.04169607162475586, 0.04332275688648224, 0.04494944587349892, 0.046576134860515594, 0.048202820122241974, 0.04982950910925865, 0.05145619809627533, 0.05308288335800171]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 8.0, 8.0, 6.0, 6.0, 18.0, 11.0, 19.0, 15.0, 30.0, 22.0, 22.0, 37.0, 29.0, 40.0, 45.0, 53.0, 41.0, 61.0, 52.0, 45.0, 42.0, 46.0, 46.0, 45.0, 34.0, 34.0, 36.0, 20.0, 15.0, 19.0, 23.0, 17.0, 13.0, 16.0, 12.0, 6.0, 7.0, 1.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05878680944442749, -0.0570182241499424, -0.055249642580747604, -0.05348105728626251, -0.05171247199177742, -0.04994388669729233, -0.048175305128097534, -0.04640671983361244, -0.04463813453912735, -0.04286954924464226, -0.041100967675447464, -0.03933238238096237, -0.03756379708647728, -0.03579521179199219, -0.034026630222797394, -0.0322580449283123, -0.030489463359117508, -0.028720879927277565, -0.026952294632792473, -0.02518371120095253, -0.023415125906467438, -0.021646542474627495, -0.019877959042787552, -0.01810937374830246, -0.016340790316462517, -0.0145722059533, -0.012803621590137482, -0.011035038158297539, -0.009266453795135021, -0.007497869431972504, -0.005729286000132561, -0.003960701636970043, -0.0021921172738075256, -0.00042353314347565174, 0.0013450509868562222, 0.0031136348843574524, 0.00488221924751997, 0.0066508036106824875, 0.00841938704252243, 0.010187971405684948, 0.011956555768847466, 0.013725140132009983, 0.0154937244951725, 0.017262307927012444, 0.019030891358852386, 0.02079947665333748, 0.02256806008517742, 0.024336643517017365, 0.026105228811502457, 0.0278738122433424, 0.029642397537827492, 0.031410980969667435, 0.03317956626415253, 0.03494814783334732, 0.03671673312783241, 0.038485318422317505, 0.0402538999915123, 0.04202248528599739, 0.043791066855192184, 0.04555965214967728, 0.04732823744416237, 0.04909682273864746, 0.050865404307842255, 0.05263398960232735, 0.05440257489681244]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 8.0, 6.0, 11.0, 12.0, 23.0, 35.0, 61.0, 78.0, 109.0, 227.0, 404.0, 620.0, 1148.0, 2323.0, 4282.0, 8485.0, 19840.0, 54875.0, 206434.0, 473940.0, 188463.0, 51387.0, 18733.0, 8186.0, 4183.0, 1999.0, 1127.0, 644.0, 369.0, 203.0, 126.0, 73.0, 48.0, 31.0, 19.0, 21.0, 12.0, 5.0, 6.0, 1.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09771728515625, -0.09451007843017578, -0.09130287170410156, -0.08809566497802734, -0.08488845825195312, -0.0816812515258789, -0.07847404479980469, -0.07526683807373047, -0.07205963134765625, -0.06885242462158203, -0.06564521789550781, -0.062438011169433594, -0.059230804443359375, -0.056023597717285156, -0.05281639099121094, -0.04960918426513672, -0.0464019775390625, -0.04319477081298828, -0.03998756408691406, -0.036780357360839844, -0.033573150634765625, -0.030365943908691406, -0.027158737182617188, -0.02395153045654297, -0.02074432373046875, -0.01753711700439453, -0.014329910278320312, -0.011122703552246094, -0.007915496826171875, -0.004708290100097656, -0.0015010833740234375, 0.0017061233520507812, 0.004913330078125, 0.008120536804199219, 0.011327743530273438, 0.014534950256347656, 0.017742156982421875, 0.020949363708496094, 0.024156570434570312, 0.02736377716064453, 0.03057098388671875, 0.03377819061279297, 0.03698539733886719, 0.040192604064941406, 0.043399810791015625, 0.046607017517089844, 0.04981422424316406, 0.05302143096923828, 0.0562286376953125, 0.05943584442138672, 0.06264305114746094, 0.06585025787353516, 0.06905746459960938, 0.0722646713256836, 0.07547187805175781, 0.07867908477783203, 0.08188629150390625, 0.08509349822998047, 0.08830070495605469, 0.0915079116821289, 0.09471511840820312, 0.09792232513427734, 0.10112953186035156, 0.10433673858642578, 0.1075439453125]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 5.0, 5.0, 4.0, 3.0, 9.0, 16.0, 14.0, 22.0, 18.0, 28.0, 20.0, 29.0, 33.0, 40.0, 49.0, 38.0, 58.0, 55.0, 63.0, 53.0, 55.0, 48.0, 39.0, 45.0, 34.0, 41.0, 31.0, 27.0, 27.0, 19.0, 11.0, 16.0, 14.0, 13.0, 6.0, 8.0, 5.0, 0.0, 4.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.117431640625, -0.11417102813720703, -0.11091041564941406, -0.1076498031616211, -0.10438919067382812, -0.10112857818603516, -0.09786796569824219, -0.09460735321044922, -0.09134674072265625, -0.08808612823486328, -0.08482551574707031, -0.08156490325927734, -0.07830429077148438, -0.0750436782836914, -0.07178306579589844, -0.06852245330810547, -0.0652618408203125, -0.06200122833251953, -0.05874061584472656, -0.055480003356933594, -0.052219390869140625, -0.048958778381347656, -0.04569816589355469, -0.04243755340576172, -0.03917694091796875, -0.03591632843017578, -0.03265571594238281, -0.029395103454589844, -0.026134490966796875, -0.022873878479003906, -0.019613265991210938, -0.01635265350341797, -0.013092041015625, -0.009831428527832031, -0.0065708160400390625, -0.0033102035522460938, -4.9591064453125e-05, 0.0032110214233398438, 0.0064716339111328125, 0.009732246398925781, 0.01299285888671875, 0.01625347137451172, 0.019514083862304688, 0.022774696350097656, 0.026035308837890625, 0.029295921325683594, 0.03255653381347656, 0.03581714630126953, 0.0390777587890625, 0.04233837127685547, 0.04559898376464844, 0.048859596252441406, 0.052120208740234375, 0.055380821228027344, 0.05864143371582031, 0.06190204620361328, 0.06516265869140625, 0.06842327117919922, 0.07168388366699219, 0.07494449615478516, 0.07820510864257812, 0.0814657211303711, 0.08472633361816406, 0.08798694610595703, 0.09124755859375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 2.0, 6.0, 4.0, 11.0, 15.0, 22.0, 25.0, 37.0, 57.0, 84.0, 120.0, 202.0, 318.0, 634.0, 1332.0, 3177.0, 8166.0, 24798.0, 94689.0, 428919.0, 371525.0, 79452.0, 21892.0, 7447.0, 2932.0, 1221.0, 598.0, 317.0, 186.0, 139.0, 82.0, 39.0, 28.0, 17.0, 21.0, 18.0, 8.0, 8.0, 3.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1328125, -0.12865447998046875, -0.1244964599609375, -0.12033843994140625, -0.116180419921875, -0.11202239990234375, -0.1078643798828125, -0.10370635986328125, -0.09954833984375, -0.09539031982421875, -0.0912322998046875, -0.08707427978515625, -0.082916259765625, -0.07875823974609375, -0.0746002197265625, -0.07044219970703125, -0.0662841796875, -0.06212615966796875, -0.0579681396484375, -0.05381011962890625, -0.049652099609375, -0.04549407958984375, -0.0413360595703125, -0.03717803955078125, -0.03302001953125, -0.02886199951171875, -0.0247039794921875, -0.02054595947265625, -0.016387939453125, -0.01222991943359375, -0.0080718994140625, -0.00391387939453125, 0.000244140625, 0.00440216064453125, 0.0085601806640625, 0.01271820068359375, 0.016876220703125, 0.02103424072265625, 0.0251922607421875, 0.02935028076171875, 0.03350830078125, 0.03766632080078125, 0.0418243408203125, 0.04598236083984375, 0.050140380859375, 0.05429840087890625, 0.0584564208984375, 0.06261444091796875, 0.0667724609375, 0.07093048095703125, 0.0750885009765625, 0.07924652099609375, 0.083404541015625, 0.08756256103515625, 0.0917205810546875, 0.09587860107421875, 0.10003662109375, 0.10419464111328125, 0.1083526611328125, 0.11251068115234375, 0.116668701171875, 0.12082672119140625, 0.1249847412109375, 0.12914276123046875, 0.13330078125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 3.0, 3.0, 5.0, 8.0, 10.0, 21.0, 27.0, 12.0, 16.0, 36.0, 30.0, 30.0, 58.0, 45.0, 49.0, 56.0, 54.0, 67.0, 48.0, 66.0, 58.0, 46.0, 42.0, 42.0, 32.0, 41.0, 21.0, 17.0, 14.0, 3.0, 7.0, 5.0, 9.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1131591796875, -0.10931205749511719, -0.10546493530273438, -0.10161781311035156, -0.09777069091796875, -0.09392356872558594, -0.09007644653320312, -0.08622932434082031, -0.0823822021484375, -0.07853507995605469, -0.07468795776367188, -0.07084083557128906, -0.06699371337890625, -0.06314659118652344, -0.059299468994140625, -0.05545234680175781, -0.051605224609375, -0.04775810241699219, -0.043910980224609375, -0.04006385803222656, -0.03621673583984375, -0.03236961364746094, -0.028522491455078125, -0.024675369262695312, -0.0208282470703125, -0.016981124877929688, -0.013134002685546875, -0.009286880493164062, -0.00543975830078125, -0.0015926361083984375, 0.002254486083984375, 0.0061016082763671875, 0.00994873046875, 0.013795852661132812, 0.017642974853515625, 0.021490097045898438, 0.02533721923828125, 0.029184341430664062, 0.033031463623046875, 0.03687858581542969, 0.0407257080078125, 0.04457283020019531, 0.048419952392578125, 0.05226707458496094, 0.05611419677734375, 0.05996131896972656, 0.06380844116210938, 0.06765556335449219, 0.071502685546875, 0.07534980773925781, 0.07919692993164062, 0.08304405212402344, 0.08689117431640625, 0.09073829650878906, 0.09458541870117188, 0.09843254089355469, 0.1022796630859375, 0.10612678527832031, 0.10997390747070312, 0.11382102966308594, 0.11766815185546875, 0.12151527404785156, 0.12536239624023438, 0.1292095184326172, 0.133056640625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 5.0, 5.0, 5.0, 2.0, 7.0, 7.0, 21.0, 26.0, 33.0, 60.0, 116.0, 165.0, 300.0, 528.0, 887.0, 1702.0, 3426.0, 7415.0, 18074.0, 53113.0, 177722.0, 450940.0, 225855.0, 68437.0, 22479.0, 8723.0, 4045.0, 1962.0, 1071.0, 569.0, 318.0, 201.0, 141.0, 67.0, 49.0, 25.0, 15.0, 15.0, 10.0, 5.0, 7.0, 5.0, 1.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.018463134765625, -0.01789689064025879, -0.017330646514892578, -0.016764402389526367, -0.016198158264160156, -0.015631914138793945, -0.015065670013427734, -0.014499425888061523, -0.013933181762695312, -0.013366937637329102, -0.01280069351196289, -0.01223444938659668, -0.011668205261230469, -0.011101961135864258, -0.010535717010498047, -0.009969472885131836, -0.009403228759765625, -0.008836984634399414, -0.008270740509033203, -0.007704496383666992, -0.007138252258300781, -0.00657200813293457, -0.006005764007568359, -0.0054395198822021484, -0.0048732757568359375, -0.0043070316314697266, -0.0037407875061035156, -0.0031745433807373047, -0.0026082992553710938, -0.002042055130004883, -0.0014758110046386719, -0.0009095668792724609, -0.00034332275390625, 0.00022292137145996094, 0.0007891654968261719, 0.0013554096221923828, 0.0019216537475585938, 0.0024878978729248047, 0.0030541419982910156, 0.0036203861236572266, 0.0041866302490234375, 0.0047528743743896484, 0.005319118499755859, 0.00588536262512207, 0.006451606750488281, 0.007017850875854492, 0.007584095001220703, 0.008150339126586914, 0.008716583251953125, 0.009282827377319336, 0.009849071502685547, 0.010415315628051758, 0.010981559753417969, 0.01154780387878418, 0.01211404800415039, 0.012680292129516602, 0.013246536254882812, 0.013812780380249023, 0.014379024505615234, 0.014945268630981445, 0.015511512756347656, 0.016077756881713867, 0.016644001007080078, 0.01721024513244629, 0.0177764892578125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 7.0, 5.0, 6.0, 9.0, 5.0, 18.0, 19.0, 19.0, 36.0, 46.0, 54.0, 66.0, 76.0, 78.0, 95.0, 100.0, 61.0, 50.0, 57.0, 34.0, 30.0, 29.0, 23.0, 18.0, 17.0, 6.0, 7.0, 10.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6954879760742188e-06, -3.579072654247284e-06, -3.462657332420349e-06, -3.3462420105934143e-06, -3.2298266887664795e-06, -3.1134113669395447e-06, -2.99699604511261e-06, -2.880580723285675e-06, -2.7641654014587402e-06, -2.6477500796318054e-06, -2.5313347578048706e-06, -2.414919435977936e-06, -2.298504114151001e-06, -2.182088792324066e-06, -2.0656734704971313e-06, -1.9492581486701965e-06, -1.8328428268432617e-06, -1.716427505016327e-06, -1.600012183189392e-06, -1.4835968613624573e-06, -1.3671815395355225e-06, -1.2507662177085876e-06, -1.1343508958816528e-06, -1.017935574054718e-06, -9.015202522277832e-07, -7.851049304008484e-07, -6.686896085739136e-07, -5.522742867469788e-07, -4.3585896492004395e-07, -3.1944364309310913e-07, -2.0302832126617432e-07, -8.66129994392395e-08, 2.9802322387695312e-08, 1.4621764421463013e-07, 2.6263296604156494e-07, 3.7904828786849976e-07, 4.954636096954346e-07, 6.118789315223694e-07, 7.282942533493042e-07, 8.44709575176239e-07, 9.611248970031738e-07, 1.0775402188301086e-06, 1.1939555406570435e-06, 1.3103708624839783e-06, 1.426786184310913e-06, 1.543201506137848e-06, 1.6596168279647827e-06, 1.7760321497917175e-06, 1.8924474716186523e-06, 2.008862793445587e-06, 2.125278115272522e-06, 2.2416934370994568e-06, 2.3581087589263916e-06, 2.4745240807533264e-06, 2.5909394025802612e-06, 2.707354724407196e-06, 2.823770046234131e-06, 2.9401853680610657e-06, 3.0566006898880005e-06, 3.1730160117149353e-06, 3.28943133354187e-06, 3.405846655368805e-06, 3.5222619771957397e-06, 3.6386772990226746e-06, 3.7550926208496094e-06]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 9.0, 6.0, 10.0, 16.0, 12.0, 30.0, 46.0, 55.0, 66.0, 113.0, 173.0, 245.0, 355.0, 583.0, 830.0, 1291.0, 2104.0, 3457.0, 5889.0, 10642.0, 21665.0, 48487.0, 127491.0, 373708.0, 267867.0, 102218.0, 40126.0, 18191.0, 9284.0, 5222.0, 2958.0, 1880.0, 1200.0, 807.0, 470.0, 313.0, 227.0, 144.0, 119.0, 61.0, 47.0, 37.0, 28.0, 18.0, 12.0, 6.0, 13.0, 6.0, 10.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.0181732177734375, -0.017603397369384766, -0.01703357696533203, -0.016463756561279297, -0.015893936157226562, -0.015324115753173828, -0.014754295349121094, -0.01418447494506836, -0.013614654541015625, -0.01304483413696289, -0.012475013732910156, -0.011905193328857422, -0.011335372924804688, -0.010765552520751953, -0.010195732116699219, -0.009625911712646484, -0.00905609130859375, -0.008486270904541016, -0.007916450500488281, -0.007346630096435547, -0.0067768096923828125, -0.006206989288330078, -0.005637168884277344, -0.005067348480224609, -0.004497528076171875, -0.003927707672119141, -0.0033578872680664062, -0.002788066864013672, -0.0022182464599609375, -0.0016484260559082031, -0.0010786056518554688, -0.0005087852478027344, 6.103515625e-05, 0.0006308555603027344, 0.0012006759643554688, 0.0017704963684082031, 0.0023403167724609375, 0.002910137176513672, 0.0034799575805664062, 0.004049777984619141, 0.004619598388671875, 0.005189418792724609, 0.005759239196777344, 0.006329059600830078, 0.0068988800048828125, 0.007468700408935547, 0.008038520812988281, 0.008608341217041016, 0.00917816162109375, 0.009747982025146484, 0.010317802429199219, 0.010887622833251953, 0.011457443237304688, 0.012027263641357422, 0.012597084045410156, 0.01316690444946289, 0.013736724853515625, 0.01430654525756836, 0.014876365661621094, 0.015446186065673828, 0.016016006469726562, 0.016585826873779297, 0.01715564727783203, 0.017725467681884766, 0.0182952880859375]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 9.0, 6.0, 11.0, 13.0, 12.0, 22.0, 29.0, 53.0, 56.0, 82.0, 101.0, 206.0, 102.0, 85.0, 64.0, 42.0, 37.0, 25.0, 11.0, 8.0, 6.0, 3.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014404296875, -0.013816356658935547, -0.013228416442871094, -0.01264047622680664, -0.012052536010742188, -0.011464595794677734, -0.010876655578613281, -0.010288715362548828, -0.009700775146484375, -0.009112834930419922, -0.008524894714355469, -0.007936954498291016, -0.0073490142822265625, -0.006761074066162109, -0.006173133850097656, -0.005585193634033203, -0.00499725341796875, -0.004409313201904297, -0.0038213729858398438, -0.0032334327697753906, -0.0026454925537109375, -0.0020575523376464844, -0.0014696121215820312, -0.0008816719055175781, -0.000293731689453125, 0.0002942085266113281, 0.0008821487426757812, 0.0014700889587402344, 0.0020580291748046875, 0.0026459693908691406, 0.0032339096069335938, 0.003821849822998047, 0.0044097900390625, 0.004997730255126953, 0.005585670471191406, 0.006173610687255859, 0.0067615509033203125, 0.007349491119384766, 0.007937431335449219, 0.008525371551513672, 0.009113311767578125, 0.009701251983642578, 0.010289192199707031, 0.010877132415771484, 0.011465072631835938, 0.01205301284790039, 0.012640953063964844, 0.013228893280029297, 0.01381683349609375, 0.014404773712158203, 0.014992713928222656, 0.01558065414428711, 0.016168594360351562, 0.016756534576416016, 0.01734447479248047, 0.017932415008544922, 0.018520355224609375, 0.019108295440673828, 0.01969623565673828, 0.020284175872802734, 0.020872116088867188, 0.02146005630493164, 0.022047996520996094, 0.022635936737060547, 0.023223876953125]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 3.0, 7.0, 9.0, 8.0, 24.0, 33.0, 50.0, 62.0, 119.0, 136.0, 141.0, 119.0, 104.0, 61.0, 53.0, 32.0, 16.0, 7.0, 13.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.36785775423049927, -0.359567791223526, -0.35127779841423035, -0.3429878354072571, -0.3346978425979614, -0.32640787959098816, -0.3181179165840149, -0.30982792377471924, -0.30153796076774597, -0.2932479977607727, -0.28495800495147705, -0.2766680419445038, -0.2683780789375305, -0.26008808612823486, -0.2517981231212616, -0.24350814521312714, -0.23521816730499268, -0.22692818939685822, -0.21863821148872375, -0.2103482484817505, -0.20205827057361603, -0.19376829266548157, -0.1854783296585083, -0.17718835175037384, -0.16889837384223938, -0.16060839593410492, -0.15231841802597046, -0.1440284550189972, -0.13573847711086273, -0.12744849920272827, -0.11915852874517441, -0.11086855828762054, -0.10257861018180847, -0.09428863227367401, -0.08599866181612015, -0.07770869135856628, -0.06941871345043182, -0.06112873926758766, -0.0528387650847435, -0.04454879090189934, -0.036258816719055176, -0.027968842536211014, -0.019678868353366852, -0.01138889417052269, -0.003098919987678528, 0.005191054195165634, 0.013481028378009796, 0.021771002560853958, 0.03006097674369812, 0.03835095092654228, 0.046640925109386444, 0.054930899292230606, 0.06322087347507477, 0.07151085138320923, 0.07980082184076309, 0.08809079229831696, 0.09638077020645142, 0.10467074811458588, 0.11296071857213974, 0.1212506890296936, 0.12954066693782806, 0.13783064484596252, 0.1461206078529358, 0.15441058576107025, 0.1627005636692047]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 5.0, 3.0, 5.0, 9.0, 9.0, 11.0, 15.0, 8.0, 20.0, 27.0, 13.0, 23.0, 37.0, 29.0, 40.0, 38.0, 33.0, 46.0, 47.0, 36.0, 49.0, 39.0, 43.0, 43.0, 64.0, 48.0, 24.0, 42.0, 22.0, 23.0, 28.0, 18.0, 17.0, 17.0, 11.0, 13.0, 14.0, 7.0, 6.0, 4.0, 4.0, 5.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17499539256095886, -0.16934356093406677, -0.16369174420833588, -0.1580399125814438, -0.1523880958557129, -0.1467362642288208, -0.1410844326019287, -0.13543261587619781, -0.12978079915046692, -0.12412897497415543, -0.11847715079784393, -0.11282531917095184, -0.10717350244522095, -0.10152167081832886, -0.09586984664201736, -0.09021802246570587, -0.08456619083881378, -0.07891436666250229, -0.0732625424861908, -0.0676107108592987, -0.06195889040827751, -0.05630706623196602, -0.05065523833036423, -0.045003414154052734, -0.03935158997774124, -0.03369976580142975, -0.028047939762473106, -0.022396113723516464, -0.01674428954720497, -0.011092465370893478, -0.005440637469291687, 0.0002111867070198059, 0.005863025784492493, 0.01151485089212656, 0.017166675999760628, 0.02281850203871727, 0.028470326215028763, 0.034122150391340256, 0.03977397829294205, 0.04542580246925354, 0.05107762664556503, 0.056729450821876526, 0.06238127499818802, 0.06803309917449951, 0.0736849308013916, 0.0793367475271225, 0.08498857915401459, 0.09064040333032608, 0.09629222750663757, 0.10194405168294907, 0.10759587585926056, 0.11324770748615265, 0.11889952421188354, 0.12455135583877563, 0.13020318746566772, 0.13585500419139862, 0.14150682091712952, 0.1471586525440216, 0.1528104692697525, 0.1584623008966446, 0.1641141176223755, 0.16976594924926758, 0.17541778087615967, 0.18106959760189056, 0.18672142922878265]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 2.0, 10.0, 3.0, 6.0, 16.0, 23.0, 23.0, 41.0, 46.0, 65.0, 74.0, 97.0, 135.0, 177.0, 219.0, 327.0, 366.0, 636.0, 946.0, 1544.0, 5191.0, 1035301.0, 1867.0, 960.0, 709.0, 434.0, 356.0, 252.0, 192.0, 160.0, 99.0, 86.0, 55.0, 52.0, 36.0, 22.0, 20.0, 10.0, 15.0, 8.0, 9.0, 2.0, 2.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.23735788464546204, -0.23019158840179443, -0.22302527725696564, -0.21585898101329803, -0.20869266986846924, -0.20152637362480164, -0.19436007738113403, -0.18719376623630524, -0.18002746999263763, -0.17286117374897003, -0.16569486260414124, -0.15852856636047363, -0.15136225521564484, -0.14419595897197723, -0.13702964782714844, -0.12986335158348083, -0.12269704788923264, -0.11553074419498444, -0.10836444050073624, -0.10119813680648804, -0.09403184056282043, -0.08686553686857224, -0.07969923317432404, -0.07253293693065643, -0.06536662578582764, -0.05820032209157944, -0.051034022122621536, -0.04386771842837334, -0.036701418459415436, -0.029535114765167236, -0.022368811070919037, -0.015202511101961136, -0.008036211133003235, -0.0008699088357388973, 0.00629639346152544, 0.013462696224451065, 0.020628998056054115, 0.027795299887657166, 0.034961603581905365, 0.042127903550863266, 0.049294207245111465, 0.056460510939359665, 0.06362681090831757, 0.07079311460256577, 0.07795941829681396, 0.08512571454048157, 0.09229202568531036, 0.09945832192897797, 0.10662462562322617, 0.11379092931747437, 0.12095723301172256, 0.12812353670597076, 0.13528983294963837, 0.14245614409446716, 0.14962244033813477, 0.15678873658180237, 0.16395504772663116, 0.17112134397029877, 0.17828765511512756, 0.18545395135879517, 0.19262026250362396, 0.19978655874729156, 0.20695286989212036, 0.21411916613578796, 0.22128546237945557]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 11.0, 35.0, 81.0, 164.0, 351.0, 715.0, 2182.0, 51463196.0, 2178.0, 719.0, 375.0, 181.0, 77.0, 36.0, 10.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.037178039550781, -14.60129451751709, -14.165410995483398, -13.729527473449707, -13.293643951416016, -12.857759475708008, -12.421875953674316, -11.985992431640625, -11.550108909606934, -11.114225387573242, -10.67834186553955, -10.24245834350586, -9.806573867797852, -9.370691299438477, -8.934806823730469, -8.498923301696777, -8.063039779663086, -7.6271562576293945, -7.191272735595703, -6.7553887367248535, -6.319505214691162, -5.883621692657471, -5.447737693786621, -5.01185417175293, -4.575970649719238, -4.140087127685547, -3.7042033672332764, -3.268319606781006, -2.8324360847473145, -2.396552562713623, -1.9606688022613525, -1.524785041809082, -1.0889015197753906, -0.6530178785324097, -0.2171342372894287, 0.21874940395355225, 0.6546330451965332, 1.0905165672302246, 1.5264003276824951, 1.9622840881347656, 2.398167610168457, 2.8340511322021484, 3.269934892654419, 3.7058186531066895, 4.141702175140381, 4.577585697174072, 5.013469696044922, 5.449353218078613, 5.885236740112305, 6.321120262145996, 6.7570037841796875, 7.192887783050537, 7.6287713050842285, 8.064655303955078, 8.50053882598877, 8.936422348022461, 9.372305870056152, 9.808189392089844, 10.244072914123535, 10.679956436157227, 11.115840911865234, 11.55172348022461, 11.987607955932617, 12.423491477966309, 12.859375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 6.0, 11.0, 17.0, 15.0, 28.0, 23.0, 67.0, 86.0, 124.0, 189.0, 339.0, 450.0, 812.0, 1119.0, 1941.0, 3300.0, 5780.0, 10671.0, 20078.0, 39358.0, 77760.0, 152343.0, 293168.0, 526494.0, 3530526.0, 820511.0, 382079.0, 205652.0, 105403.0, 53032.0, 27279.0, 14125.0, 7610.0, 4362.0, 2522.0, 1457.0, 967.0, 629.0, 357.0, 273.0, 166.0, 95.0, 63.0, 48.0, 29.0, 26.0, 20.0, 11.0, 4.0, 3.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3759765625, -0.3644866943359375, -0.352996826171875, -0.3415069580078125, -0.33001708984375, -0.3185272216796875, -0.307037353515625, -0.2955474853515625, -0.2840576171875, -0.2725677490234375, -0.261077880859375, -0.2495880126953125, -0.23809814453125, -0.2266082763671875, -0.215118408203125, -0.2036285400390625, -0.192138671875, -0.1806488037109375, -0.169158935546875, -0.1576690673828125, -0.14617919921875, -0.1346893310546875, -0.123199462890625, -0.1117095947265625, -0.1002197265625, -0.0887298583984375, -0.077239990234375, -0.0657501220703125, -0.05426025390625, -0.0427703857421875, -0.031280517578125, -0.0197906494140625, -0.00830078125, 0.0031890869140625, 0.014678955078125, 0.0261688232421875, 0.03765869140625, 0.0491485595703125, 0.060638427734375, 0.0721282958984375, 0.0836181640625, 0.0951080322265625, 0.106597900390625, 0.1180877685546875, 0.12957763671875, 0.1410675048828125, 0.152557373046875, 0.1640472412109375, 0.175537109375, 0.1870269775390625, 0.198516845703125, 0.2100067138671875, 0.22149658203125, 0.2329864501953125, 0.244476318359375, 0.2559661865234375, 0.2674560546875, 0.2789459228515625, 0.290435791015625, 0.3019256591796875, 0.31341552734375, 0.3249053955078125, 0.336395263671875, 0.3478851318359375, 0.359375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 4.0, 7.0, 5.0, 12.0, 15.0, 19.0, 17.0, 15.0, 23.0, 22.0, 26.0, 35.0, 33.0, 29.0, 33.0, 33.0, 45.0, 55.0, 142.0, 681.0, 298.0, 55.0, 64.0, 39.0, 46.0, 38.0, 50.0, 23.0, 30.0, 30.0, 11.0, 20.0, 19.0, 7.0, 14.0, 6.0, 7.0, 3.0, 2.0, 5.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.091796875, -2.0279693603515625, -1.964141845703125, -1.9003143310546875, -1.83648681640625, -1.7726593017578125, -1.708831787109375, -1.6450042724609375, -1.5811767578125, -1.5173492431640625, -1.453521728515625, -1.3896942138671875, -1.32586669921875, -1.2620391845703125, -1.198211669921875, -1.1343841552734375, -1.070556640625, -1.0067291259765625, -0.942901611328125, -0.8790740966796875, -0.81524658203125, -0.7514190673828125, -0.687591552734375, -0.6237640380859375, -0.5599365234375, -0.4961090087890625, -0.432281494140625, -0.3684539794921875, -0.30462646484375, -0.2407989501953125, -0.176971435546875, -0.1131439208984375, -0.04931640625, 0.0145111083984375, 0.078338623046875, 0.1421661376953125, 0.20599365234375, 0.2698211669921875, 0.333648681640625, 0.3974761962890625, 0.4613037109375, 0.5251312255859375, 0.588958740234375, 0.6527862548828125, 0.71661376953125, 0.7804412841796875, 0.844268798828125, 0.9080963134765625, 0.971923828125, 1.0357513427734375, 1.099578857421875, 1.1634063720703125, 1.22723388671875, 1.2910614013671875, 1.354888916015625, 1.4187164306640625, 1.4825439453125, 1.5463714599609375, 1.610198974609375, 1.6740264892578125, 1.73785400390625, 1.8016815185546875, 1.865509033203125, 1.9293365478515625, 1.9931640625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 8.0, 5.0, 8.0, 9.0, 24.0, 33.0, 62.0, 94.0, 152.0, 220.0, 407.0, 553.0, 937.0, 1504.0, 2424.0, 3930.0, 6448.0, 10332.0, 17564.0, 29004.0, 48549.0, 78882.0, 125231.0, 195277.0, 285537.0, 386234.0, 2747942.0, 1255965.0, 361722.0, 264218.0, 177348.0, 113117.0, 69998.0, 42484.0, 26041.0, 15348.0, 9438.0, 5562.0, 3427.0, 2020.0, 1271.0, 780.0, 486.0, 310.0, 201.0, 118.0, 92.0, 52.0, 30.0, 15.0, 11.0, 13.0, 6.0, 4.0], "bins": [-0.230224609375, -0.2239837646484375, -0.217742919921875, -0.2115020751953125, -0.20526123046875, -0.1990203857421875, -0.192779541015625, -0.1865386962890625, -0.1802978515625, -0.1740570068359375, -0.167816162109375, -0.1615753173828125, -0.15533447265625, -0.1490936279296875, -0.142852783203125, -0.1366119384765625, -0.13037109375, -0.1241302490234375, -0.117889404296875, -0.1116485595703125, -0.10540771484375, -0.0991668701171875, -0.092926025390625, -0.0866851806640625, -0.0804443359375, -0.0742034912109375, -0.067962646484375, -0.0617218017578125, -0.05548095703125, -0.0492401123046875, -0.042999267578125, -0.0367584228515625, -0.030517578125, -0.0242767333984375, -0.018035888671875, -0.0117950439453125, -0.00555419921875, 0.0006866455078125, 0.006927490234375, 0.0131683349609375, 0.0194091796875, 0.0256500244140625, 0.031890869140625, 0.0381317138671875, 0.04437255859375, 0.0506134033203125, 0.056854248046875, 0.0630950927734375, 0.0693359375, 0.0755767822265625, 0.081817626953125, 0.0880584716796875, 0.09429931640625, 0.1005401611328125, 0.106781005859375, 0.1130218505859375, 0.1192626953125, 0.1255035400390625, 0.131744384765625, 0.1379852294921875, 0.14422607421875, 0.1504669189453125, 0.156707763671875, 0.1629486083984375, 0.169189453125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 6.0, 3.0, 1.0, 1.0, 5.0, 7.0, 10.0, 8.0, 10.0, 11.0, 11.0, 16.0, 13.0, 14.0, 18.0, 16.0, 22.0, 21.0, 20.0, 28.0, 18.0, 31.0, 30.0, 45.0, 33.0, 40.0, 386.0, 635.0, 113.0, 30.0, 42.0, 30.0, 34.0, 33.0, 30.0, 39.0, 24.0, 20.0, 22.0, 22.0, 21.0, 19.0, 15.0, 11.0, 14.0, 10.0, 5.0, 9.0, 10.0, 3.0, 4.0, 5.0, 5.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0], "bins": [-1.5595703125, -1.511199951171875, -1.46282958984375, -1.414459228515625, -1.3660888671875, -1.317718505859375, -1.26934814453125, -1.220977783203125, -1.172607421875, -1.124237060546875, -1.07586669921875, -1.027496337890625, -0.9791259765625, -0.930755615234375, -0.88238525390625, -0.834014892578125, -0.78564453125, -0.737274169921875, -0.68890380859375, -0.640533447265625, -0.5921630859375, -0.543792724609375, -0.49542236328125, -0.447052001953125, -0.398681640625, -0.350311279296875, -0.30194091796875, -0.253570556640625, -0.2052001953125, -0.156829833984375, -0.10845947265625, -0.060089111328125, -0.01171875, 0.036651611328125, 0.08502197265625, 0.133392333984375, 0.1817626953125, 0.230133056640625, 0.27850341796875, 0.326873779296875, 0.375244140625, 0.423614501953125, 0.47198486328125, 0.520355224609375, 0.5687255859375, 0.617095947265625, 0.66546630859375, 0.713836669921875, 0.76220703125, 0.810577392578125, 0.85894775390625, 0.907318115234375, 0.9556884765625, 1.004058837890625, 1.05242919921875, 1.100799560546875, 1.149169921875, 1.197540283203125, 1.24591064453125, 1.294281005859375, 1.3426513671875, 1.391021728515625, 1.43939208984375, 1.487762451171875, 1.5361328125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 4.0, 6.0, 2.0, 4.0, 9.0, 14.0, 14.0, 15.0, 18.0, 29.0, 30.0, 38.0, 45.0, 77.0, 72.0, 115.0, 163.0, 183.0, 263.0, 338.0, 514.0, 726.0, 992.0, 1683.0, 3165.0, 6413.0, 15056.0, 37747.0, 100554.0, 5125828.0, 840043.0, 94186.0, 34932.0, 13846.0, 6075.0, 3041.0, 1633.0, 1030.0, 688.0, 500.0, 361.0, 257.0, 183.0, 118.0, 126.0, 64.0, 48.0, 43.0, 31.0, 27.0, 17.0, 15.0, 25.0, 13.0, 10.0, 8.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0], "bins": [-0.7294921875, -0.7059326171875, -0.682373046875, -0.6588134765625, -0.63525390625, -0.6116943359375, -0.588134765625, -0.5645751953125, -0.541015625, -0.5174560546875, -0.493896484375, -0.4703369140625, -0.44677734375, -0.4232177734375, -0.399658203125, -0.3760986328125, -0.3525390625, -0.3289794921875, -0.305419921875, -0.2818603515625, -0.25830078125, -0.2347412109375, -0.211181640625, -0.1876220703125, -0.1640625, -0.1405029296875, -0.116943359375, -0.0933837890625, -0.06982421875, -0.0462646484375, -0.022705078125, 0.0008544921875, 0.0244140625, 0.0479736328125, 0.071533203125, 0.0950927734375, 0.11865234375, 0.1422119140625, 0.165771484375, 0.1893310546875, 0.212890625, 0.2364501953125, 0.260009765625, 0.2835693359375, 0.30712890625, 0.3306884765625, 0.354248046875, 0.3778076171875, 0.4013671875, 0.4249267578125, 0.448486328125, 0.4720458984375, 0.49560546875, 0.5191650390625, 0.542724609375, 0.5662841796875, 0.58984375, 0.6134033203125, 0.636962890625, 0.6605224609375, 0.68408203125, 0.7076416015625, 0.731201171875, 0.7547607421875, 0.7783203125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 8.0, 5.0, 7.0, 11.0, 11.0, 11.0, 16.0, 23.0, 23.0, 22.0, 27.0, 45.0, 29.0, 38.0, 50.0, 29.0, 47.0, 51.0, 349.0, 737.0, 80.0, 41.0, 34.0, 36.0, 43.0, 32.0, 30.0, 36.0, 34.0, 17.0, 20.0, 17.0, 15.0, 13.0, 4.0, 7.0, 6.0, 10.0, 2.0, 2.0, 6.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.126953125, -2.0609130859375, -1.994873046875, -1.9288330078125, -1.86279296875, -1.7967529296875, -1.730712890625, -1.6646728515625, -1.5986328125, -1.5325927734375, -1.466552734375, -1.4005126953125, -1.33447265625, -1.2684326171875, -1.202392578125, -1.1363525390625, -1.0703125, -1.0042724609375, -0.938232421875, -0.8721923828125, -0.80615234375, -0.7401123046875, -0.674072265625, -0.6080322265625, -0.5419921875, -0.4759521484375, -0.409912109375, -0.3438720703125, -0.27783203125, -0.2117919921875, -0.145751953125, -0.0797119140625, -0.013671875, 0.0523681640625, 0.118408203125, 0.1844482421875, 0.25048828125, 0.3165283203125, 0.382568359375, 0.4486083984375, 0.5146484375, 0.5806884765625, 0.646728515625, 0.7127685546875, 0.77880859375, 0.8448486328125, 0.910888671875, 0.9769287109375, 1.04296875, 1.1090087890625, 1.175048828125, 1.2410888671875, 1.30712890625, 1.3731689453125, 1.439208984375, 1.5052490234375, 1.5712890625, 1.6373291015625, 1.703369140625, 1.7694091796875, 1.83544921875, 1.9014892578125, 1.967529296875, 2.0335693359375, 2.099609375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 1.0, 4.0, 3.0, 5.0, 9.0, 13.0, 14.0, 29.0, 33.0, 38.0, 54.0, 79.0, 158.0, 243.0, 92.0, 69.0, 34.0, 29.0, 27.0, 17.0, 18.0, 10.0, 7.0, 4.0, 1.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.225685119628906, -18.520082473754883, -17.814477920532227, -17.108875274658203, -16.403270721435547, -15.697668075561523, -14.9920654296875, -14.28646183013916, -13.58085823059082, -12.87525463104248, -12.16965103149414, -11.464048385620117, -10.758444786071777, -10.052841186523438, -9.347238540649414, -8.641634941101074, -7.936031341552734, -7.2304277420043945, -6.524824619293213, -5.819221496582031, -5.113617897033691, -4.408014297485352, -3.70241117477417, -2.9968080520629883, -2.2912044525146484, -1.5856010913848877, -0.879997730255127, -0.1743943691253662, 0.5312089920043945, 1.2368123531341553, 1.942415714263916, 2.6480188369750977, 3.3536205291748047, 4.0592241287231445, 4.764827251434326, 5.470430374145508, 6.176033973693848, 6.8816375732421875, 7.587240695953369, 8.29284381866455, 8.99844741821289, 9.70405101776123, 10.40965461730957, 11.115257263183594, 11.820860862731934, 12.526464462280273, 13.232067108154297, 13.937670707702637, 14.643274307250977, 15.348877906799316, 16.054481506347656, 16.76008415222168, 17.465686798095703, 18.17129135131836, 18.876893997192383, 19.582496643066406, 20.288101196289062, 20.993703842163086, 21.699308395385742, 22.404911041259766, 23.110515594482422, 23.816118240356445, 24.52172088623047, 25.227325439453125, 25.93292808532715]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 2.0, 5.0, 6.0, 6.0, 11.0, 8.0, 11.0, 10.0, 22.0, 15.0, 20.0, 22.0, 31.0, 34.0, 42.0, 74.0, 123.0, 155.0, 87.0, 54.0, 37.0, 31.0, 34.0, 28.0, 15.0, 24.0, 15.0, 12.0, 8.0, 13.0, 5.0, 7.0, 5.0, 8.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-44.22477722167969, -42.76165008544922, -41.29852294921875, -39.83539581298828, -38.37226867675781, -36.909141540527344, -35.446014404296875, -33.982887268066406, -32.51976013183594, -31.05663299560547, -29.593505859375, -28.13037872314453, -26.667251586914062, -25.204124450683594, -23.740997314453125, -22.277870178222656, -20.814741134643555, -19.351613998413086, -17.888486862182617, -16.42535972595215, -14.96223258972168, -13.499105453491211, -12.035977363586426, -10.572850227355957, -9.109723091125488, -7.6465959548950195, -6.183468818664551, -4.720341205596924, -3.257214069366455, -1.7940869331359863, -0.3309593200683594, 1.1321678161621094, 2.595294952392578, 4.058422088623047, 5.521549224853516, 6.984676837921143, 8.447803497314453, 9.910930633544922, 11.374058723449707, 12.837185859680176, 14.300312995910645, 15.763440132141113, 17.2265682220459, 18.689695358276367, 20.152822494506836, 21.615949630737305, 23.079076766967773, 24.542203903198242, 26.00533103942871, 27.46845817565918, 28.93158531188965, 30.394712448120117, 31.857839584350586, 33.32096862792969, 34.784095764160156, 36.247222900390625, 37.710350036621094, 39.17347717285156, 40.63660430908203, 42.0997314453125, 43.56285858154297, 45.02598571777344, 46.489112854003906, 47.952239990234375, 49.415367126464844]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 9.0, 8.0, 16.0, 15.0, 18.0, 34.0, 50.0, 61.0, 110.0, 163.0, 269.0, 366.0, 661.0, 1119.0, 2171.0, 4570.0, 11810.0, 46200.0, 3299952.0, 769936.0, 36147.0, 10864.0, 4482.0, 2202.0, 1171.0, 651.0, 425.0, 262.0, 165.0, 111.0, 79.0, 55.0, 42.0, 30.0, 13.0, 20.0, 11.0, 7.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038787841796875, -0.03749227523803711, -0.03619670867919922, -0.03490114212036133, -0.03360557556152344, -0.03231000900268555, -0.031014442443847656, -0.029718875885009766, -0.028423309326171875, -0.027127742767333984, -0.025832176208496094, -0.024536609649658203, -0.023241043090820312, -0.021945476531982422, -0.02064990997314453, -0.01935434341430664, -0.01805877685546875, -0.01676321029663086, -0.015467643737792969, -0.014172077178955078, -0.012876510620117188, -0.011580944061279297, -0.010285377502441406, -0.008989810943603516, -0.007694244384765625, -0.006398677825927734, -0.005103111267089844, -0.003807544708251953, -0.0025119781494140625, -0.0012164115905761719, 7.915496826171875e-05, 0.0013747215270996094, 0.0026702880859375, 0.003965854644775391, 0.005261421203613281, 0.006556987762451172, 0.007852554321289062, 0.009148120880126953, 0.010443687438964844, 0.011739253997802734, 0.013034820556640625, 0.014330387115478516, 0.015625953674316406, 0.016921520233154297, 0.018217086791992188, 0.019512653350830078, 0.02080821990966797, 0.02210378646850586, 0.02339935302734375, 0.02469491958618164, 0.02599048614501953, 0.027286052703857422, 0.028581619262695312, 0.029877185821533203, 0.031172752380371094, 0.032468318939208984, 0.033763885498046875, 0.035059452056884766, 0.036355018615722656, 0.03765058517456055, 0.03894615173339844, 0.04024171829223633, 0.04153728485107422, 0.04283285140991211, 0.04412841796875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 1.0, 4.0, 4.0, 5.0, 6.0, 10.0, 11.0, 15.0, 19.0, 27.0, 32.0, 29.0, 40.0, 57.0, 394.0, 87.0, 55.0, 45.0, 27.0, 19.0, 22.0, 15.0, 15.0, 15.0, 6.0, 8.0, 7.0, 6.0, 2.0, 2.0, 5.0, 3.0, 5.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0204620361328125, -0.019802093505859375, -0.01914215087890625, -0.018482208251953125, -0.017822265625, -0.017162322998046875, -0.01650238037109375, -0.015842437744140625, -0.0151824951171875, -0.014522552490234375, -0.01386260986328125, -0.013202667236328125, -0.012542724609375, -0.011882781982421875, -0.01122283935546875, -0.010562896728515625, -0.0099029541015625, -0.009243011474609375, -0.00858306884765625, -0.007923126220703125, -0.00726318359375, -0.006603240966796875, -0.00594329833984375, -0.005283355712890625, -0.0046234130859375, -0.003963470458984375, -0.00330352783203125, -0.002643585205078125, -0.001983642578125, -0.001323699951171875, -0.00066375732421875, -3.814697265625e-06, 0.0006561279296875, 0.001316070556640625, 0.00197601318359375, 0.002635955810546875, 0.0032958984375, 0.003955841064453125, 0.00461578369140625, 0.005275726318359375, 0.0059356689453125, 0.006595611572265625, 0.00725555419921875, 0.007915496826171875, 0.008575439453125, 0.009235382080078125, 0.00989532470703125, 0.010555267333984375, 0.0112152099609375, 0.011875152587890625, 0.01253509521484375, 0.013195037841796875, 0.01385498046875, 0.014514923095703125, 0.01517486572265625, 0.015834808349609375, 0.0164947509765625, 0.017154693603515625, 0.01781463623046875, 0.018474578857421875, 0.019134521484375, 0.019794464111328125, 0.02045440673828125, 0.021114349365234375, 0.0217742919921875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 7.0, 5.0, 5.0, 10.0, 19.0, 31.0, 48.0, 80.0, 120.0, 214.0, 571.0, 1459.0, 4465.0, 18442.0, 125084.0, 3660554.0, 334354.0, 36554.0, 8262.0, 2415.0, 832.0, 314.0, 174.0, 72.0, 60.0, 36.0, 32.0, 29.0, 12.0, 11.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0594482421875, -0.05773353576660156, -0.056018829345703125, -0.05430412292480469, -0.05258941650390625, -0.05087471008300781, -0.049160003662109375, -0.04744529724121094, -0.0457305908203125, -0.04401588439941406, -0.042301177978515625, -0.04058647155761719, -0.03887176513671875, -0.03715705871582031, -0.035442352294921875, -0.03372764587402344, -0.032012939453125, -0.030298233032226562, -0.028583526611328125, -0.026868820190429688, -0.02515411376953125, -0.023439407348632812, -0.021724700927734375, -0.020009994506835938, -0.0182952880859375, -0.016580581665039062, -0.014865875244140625, -0.013151168823242188, -0.01143646240234375, -0.009721755981445312, -0.008007049560546875, -0.0062923431396484375, -0.00457763671875, -0.0028629302978515625, -0.001148223876953125, 0.0005664825439453125, 0.00228118896484375, 0.0039958953857421875, 0.005710601806640625, 0.0074253082275390625, 0.0091400146484375, 0.010854721069335938, 0.012569427490234375, 0.014284133911132812, 0.01599884033203125, 0.017713546752929688, 0.019428253173828125, 0.021142959594726562, 0.022857666015625, 0.024572372436523438, 0.026287078857421875, 0.028001785278320312, 0.02971649169921875, 0.03143119812011719, 0.033145904541015625, 0.03486061096191406, 0.0365753173828125, 0.03829002380371094, 0.040004730224609375, 0.04171943664550781, 0.04343414306640625, 0.04514884948730469, 0.046863555908203125, 0.04857826232910156, 0.05029296875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 4.0, 3.0, 7.0, 9.0, 7.0, 10.0, 17.0, 25.0, 27.0, 39.0, 68.0, 61.0, 119.0, 216.0, 537.0, 1313.0, 746.0, 312.0, 149.0, 108.0, 61.0, 49.0, 35.0, 20.0, 24.0, 27.0, 13.0, 14.0, 9.0, 15.0, 8.0, 5.0, 4.0, 10.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0191802978515625, -0.018611431121826172, -0.018042564392089844, -0.017473697662353516, -0.016904830932617188, -0.01633596420288086, -0.01576709747314453, -0.015198230743408203, -0.014629364013671875, -0.014060497283935547, -0.013491630554199219, -0.01292276382446289, -0.012353897094726562, -0.011785030364990234, -0.011216163635253906, -0.010647296905517578, -0.01007843017578125, -0.009509563446044922, -0.008940696716308594, -0.008371829986572266, -0.0078029632568359375, -0.007234096527099609, -0.006665229797363281, -0.006096363067626953, -0.005527496337890625, -0.004958629608154297, -0.004389762878417969, -0.0038208961486816406, -0.0032520294189453125, -0.0026831626892089844, -0.0021142959594726562, -0.0015454292297363281, -0.0009765625, -0.0004076957702636719, 0.00016117095947265625, 0.0007300376892089844, 0.0012989044189453125, 0.0018677711486816406, 0.0024366378784179688, 0.003005504608154297, 0.003574371337890625, 0.004143238067626953, 0.004712104797363281, 0.005280971527099609, 0.0058498382568359375, 0.006418704986572266, 0.006987571716308594, 0.007556438446044922, 0.00812530517578125, 0.008694171905517578, 0.009263038635253906, 0.009831905364990234, 0.010400772094726562, 0.01096963882446289, 0.011538505554199219, 0.012107372283935547, 0.012676239013671875, 0.013245105743408203, 0.013813972473144531, 0.01438283920288086, 0.014951705932617188, 0.015520572662353516, 0.016089439392089844, 0.016658306121826172, 0.0172271728515625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 5.0, 40.0, 402.0, 481.0, 61.0, 10.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06465546041727066, -0.05390220135450363, -0.0431489422917366, -0.032395679503679276, -0.021642420440912247, -0.010889161378145218, -0.00013589859008789062, 0.010617360472679138, 0.021370619535446167, 0.032123878598213196, 0.042877137660980225, 0.05363040044903755, 0.06438365578651428, 0.07513691484928131, 0.08589018136262894, 0.09664344042539597, 0.107396699488163, 0.11814995855093002, 0.12890322506427765, 0.13965648412704468, 0.1504097431898117, 0.16116300225257874, 0.17191626131534576, 0.1826695203781128, 0.19342277944087982, 0.20417603850364685, 0.21492929756641388, 0.2256825566291809, 0.23643581569194794, 0.24718907475471497, 0.2579423487186432, 0.268695592880249, 0.27944883704185486, 0.2902021110057831, 0.3009553551673889, 0.31170862913131714, 0.322461873292923, 0.3332151472568512, 0.34396839141845703, 0.35472166538238525, 0.3654749095439911, 0.3762281835079193, 0.38698142766952515, 0.39773470163345337, 0.4084879457950592, 0.4192412197589874, 0.42999446392059326, 0.4407477378845215, 0.4515010118484497, 0.46225428581237793, 0.47300752997398376, 0.483760803937912, 0.4945140480995178, 0.505267322063446, 0.5160205960273743, 0.5267738103866577, 0.5375270843505859, 0.5482803583145142, 0.5590336322784424, 0.5697868466377258, 0.580540120601654, 0.5912933945655823, 0.6020466685295105, 0.612799882888794, 0.6235531568527222]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 0.0, 1.0, 4.0, 11.0, 3.0, 3.0, 9.0, 13.0, 15.0, 12.0, 19.0, 21.0, 30.0, 25.0, 38.0, 41.0, 73.0, 52.0, 55.0, 52.0, 59.0, 51.0, 50.0, 48.0, 50.0, 51.0, 49.0, 31.0, 32.0, 25.0, 22.0, 19.0, 20.0, 5.0, 8.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.09513932466506958, -0.0924723893404007, -0.08980545401573181, -0.08713851869106293, -0.08447158336639404, -0.08180464804172516, -0.07913771271705627, -0.07647077739238739, -0.0738038420677185, -0.07113690674304962, -0.06846997141838074, -0.06580303609371185, -0.06313610076904297, -0.060469165444374084, -0.0578022301197052, -0.055135294795036316, -0.05246835947036743, -0.04980142414569855, -0.04713448882102966, -0.04446755349636078, -0.041800618171691895, -0.03913368284702301, -0.036466747522354126, -0.03379981219768524, -0.031132876873016357, -0.028465941548347473, -0.02579900622367859, -0.023132070899009705, -0.02046513557434082, -0.017798200249671936, -0.015131264925003052, -0.012464329600334167, -0.009797394275665283, -0.007130458950996399, -0.004463523626327515, -0.0017965883016586304, 0.0008703470230102539, 0.003537282347679138, 0.0062042176723480225, 0.008871152997016907, 0.011538088321685791, 0.014205023646354675, 0.01687195897102356, 0.019538894295692444, 0.022205829620361328, 0.024872764945030212, 0.027539700269699097, 0.03020663559436798, 0.032873570919036865, 0.03554050624370575, 0.038207441568374634, 0.04087437689304352, 0.0435413122177124, 0.04620824754238129, 0.04887518286705017, 0.051542118191719055, 0.05420905351638794, 0.056875988841056824, 0.05954292416572571, 0.06220985949039459, 0.06487679481506348, 0.06754373013973236, 0.07021066546440125, 0.07287760078907013, 0.07554453611373901]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 12.0, 13.0, 9.0, 14.0, 27.0, 46.0, 45.0, 75.0, 121.0, 153.0, 244.0, 383.0, 519.0, 765.0, 1279.0, 2027.0, 3212.0, 5691.0, 9989.0, 19980.0, 44920.0, 144195.0, 661855.0, 85401.0, 32294.0, 15261.0, 7942.0, 4417.0, 2774.0, 1731.0, 1101.0, 656.0, 455.0, 349.0, 199.0, 131.0, 86.0, 66.0, 34.0, 26.0, 19.0, 9.0, 8.0, 8.0, 7.0, 1.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0438232421875, -0.04250764846801758, -0.041192054748535156, -0.039876461029052734, -0.03856086730957031, -0.03724527359008789, -0.03592967987060547, -0.03461408615112305, -0.033298492431640625, -0.0319828987121582, -0.03066730499267578, -0.02935171127319336, -0.028036117553710938, -0.026720523834228516, -0.025404930114746094, -0.024089336395263672, -0.02277374267578125, -0.021458148956298828, -0.020142555236816406, -0.018826961517333984, -0.017511367797851562, -0.01619577407836914, -0.014880180358886719, -0.013564586639404297, -0.012248992919921875, -0.010933399200439453, -0.009617805480957031, -0.00830221176147461, -0.0069866180419921875, -0.005671024322509766, -0.004355430603027344, -0.003039836883544922, -0.0017242431640625, -0.0004086494445800781, 0.0009069442749023438, 0.0022225379943847656, 0.0035381317138671875, 0.004853725433349609, 0.006169319152832031, 0.007484912872314453, 0.008800506591796875, 0.010116100311279297, 0.011431694030761719, 0.01274728775024414, 0.014062881469726562, 0.015378475189208984, 0.016694068908691406, 0.018009662628173828, 0.01932525634765625, 0.020640850067138672, 0.021956443786621094, 0.023272037506103516, 0.024587631225585938, 0.02590322494506836, 0.02721881866455078, 0.028534412384033203, 0.029850006103515625, 0.031165599822998047, 0.03248119354248047, 0.03379678726196289, 0.03511238098144531, 0.036427974700927734, 0.037743568420410156, 0.03905916213989258, 0.040374755859375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 4.0, 4.0, 3.0, 2.0, 6.0, 6.0, 6.0, 12.0, 15.0, 22.0, 27.0, 22.0, 33.0, 42.0, 55.0, 252.0, 220.0, 67.0, 41.0, 29.0, 24.0, 18.0, 24.0, 9.0, 19.0, 7.0, 5.0, 9.0, 1.0, 5.0, 3.0, 3.0, 7.0, 4.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020751953125, -0.020085811614990234, -0.01941967010498047, -0.018753528594970703, -0.018087387084960938, -0.017421245574951172, -0.016755104064941406, -0.01608896255493164, -0.015422821044921875, -0.01475667953491211, -0.014090538024902344, -0.013424396514892578, -0.012758255004882812, -0.012092113494873047, -0.011425971984863281, -0.010759830474853516, -0.01009368896484375, -0.009427547454833984, -0.008761405944824219, -0.008095264434814453, -0.0074291229248046875, -0.006762981414794922, -0.006096839904785156, -0.005430698394775391, -0.004764556884765625, -0.004098415374755859, -0.0034322738647460938, -0.002766132354736328, -0.0020999908447265625, -0.0014338493347167969, -0.0007677078247070312, -0.00010156631469726562, 0.0005645751953125, 0.0012307167053222656, 0.0018968582153320312, 0.002562999725341797, 0.0032291412353515625, 0.003895282745361328, 0.004561424255371094, 0.005227565765380859, 0.005893707275390625, 0.006559848785400391, 0.007225990295410156, 0.007892131805419922, 0.008558273315429688, 0.009224414825439453, 0.009890556335449219, 0.010556697845458984, 0.01122283935546875, 0.011888980865478516, 0.012555122375488281, 0.013221263885498047, 0.013887405395507812, 0.014553546905517578, 0.015219688415527344, 0.01588582992553711, 0.016551971435546875, 0.01721811294555664, 0.017884254455566406, 0.018550395965576172, 0.019216537475585938, 0.019882678985595703, 0.02054882049560547, 0.021214962005615234, 0.021881103515625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 1.0, 7.0, 9.0, 12.0, 16.0, 16.0, 24.0, 36.0, 59.0, 89.0, 97.0, 139.0, 231.0, 418.0, 776.0, 1721.0, 5350.0, 22662.0, 150600.0, 694923.0, 141035.0, 21619.0, 5060.0, 1751.0, 759.0, 397.0, 242.0, 137.0, 103.0, 77.0, 49.0, 38.0, 35.0, 21.0, 12.0, 16.0, 9.0, 6.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.057464599609375, -0.05574846267700195, -0.054032325744628906, -0.05231618881225586, -0.05060005187988281, -0.048883914947509766, -0.04716777801513672, -0.04545164108276367, -0.043735504150390625, -0.04201936721801758, -0.04030323028564453, -0.038587093353271484, -0.03687095642089844, -0.03515481948852539, -0.033438682556152344, -0.0317225456237793, -0.03000640869140625, -0.028290271759033203, -0.026574134826660156, -0.02485799789428711, -0.023141860961914062, -0.021425724029541016, -0.01970958709716797, -0.017993450164794922, -0.016277313232421875, -0.014561176300048828, -0.012845039367675781, -0.011128902435302734, -0.009412765502929688, -0.007696628570556641, -0.005980491638183594, -0.004264354705810547, -0.0025482177734375, -0.0008320808410644531, 0.0008840560913085938, 0.0026001930236816406, 0.0043163299560546875, 0.006032466888427734, 0.007748603820800781, 0.009464740753173828, 0.011180877685546875, 0.012897014617919922, 0.014613151550292969, 0.016329288482666016, 0.018045425415039062, 0.01976156234741211, 0.021477699279785156, 0.023193836212158203, 0.02490997314453125, 0.026626110076904297, 0.028342247009277344, 0.03005838394165039, 0.03177452087402344, 0.033490657806396484, 0.03520679473876953, 0.03692293167114258, 0.038639068603515625, 0.04035520553588867, 0.04207134246826172, 0.043787479400634766, 0.04550361633300781, 0.04721975326538086, 0.048935890197753906, 0.05065202713012695, 0.0523681640625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 9.0, 6.0, 10.0, 12.0, 8.0, 16.0, 15.0, 26.0, 25.0, 35.0, 23.0, 41.0, 40.0, 40.0, 48.0, 36.0, 50.0, 56.0, 42.0, 41.0, 57.0, 45.0, 33.0, 32.0, 33.0, 28.0, 29.0, 21.0, 31.0, 21.0, 21.0, 19.0, 13.0, 17.0, 6.0, 8.0, 5.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.08544921875, -0.08315610885620117, -0.08086299896240234, -0.07856988906860352, -0.07627677917480469, -0.07398366928100586, -0.07169055938720703, -0.0693974494934082, -0.06710433959960938, -0.06481122970581055, -0.06251811981201172, -0.06022500991821289, -0.05793190002441406, -0.055638790130615234, -0.053345680236816406, -0.05105257034301758, -0.04875946044921875, -0.04646635055541992, -0.044173240661621094, -0.041880130767822266, -0.03958702087402344, -0.03729391098022461, -0.03500080108642578, -0.03270769119262695, -0.030414581298828125, -0.028121471405029297, -0.02582836151123047, -0.02353525161743164, -0.021242141723632812, -0.018949031829833984, -0.016655921936035156, -0.014362812042236328, -0.0120697021484375, -0.009776592254638672, -0.007483482360839844, -0.005190372467041016, -0.0028972625732421875, -0.0006041526794433594, 0.0016889572143554688, 0.003982067108154297, 0.006275177001953125, 0.008568286895751953, 0.010861396789550781, 0.01315450668334961, 0.015447616577148438, 0.017740726470947266, 0.020033836364746094, 0.022326946258544922, 0.02462005615234375, 0.026913166046142578, 0.029206275939941406, 0.031499385833740234, 0.03379249572753906, 0.03608560562133789, 0.03837871551513672, 0.04067182540893555, 0.042964935302734375, 0.0452580451965332, 0.04755115509033203, 0.04984426498413086, 0.05213737487792969, 0.054430484771728516, 0.056723594665527344, 0.05901670455932617, 0.061309814453125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 9.0, 20.0, 21.0, 25.0, 79.0, 129.0, 239.0, 556.0, 1603.0, 7862.0, 197388.0, 819547.0, 17024.0, 2608.0, 762.0, 308.0, 170.0, 79.0, 46.0, 26.0, 11.0, 13.0, 8.0, 6.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0316162109375, -0.030601978302001953, -0.029587745666503906, -0.02857351303100586, -0.027559280395507812, -0.026545047760009766, -0.02553081512451172, -0.024516582489013672, -0.023502349853515625, -0.022488117218017578, -0.02147388458251953, -0.020459651947021484, -0.019445419311523438, -0.01843118667602539, -0.017416954040527344, -0.016402721405029297, -0.01538848876953125, -0.014374256134033203, -0.013360023498535156, -0.01234579086303711, -0.011331558227539062, -0.010317325592041016, -0.009303092956542969, -0.008288860321044922, -0.007274627685546875, -0.006260395050048828, -0.005246162414550781, -0.004231929779052734, -0.0032176971435546875, -0.0022034645080566406, -0.0011892318725585938, -0.00017499923706054688, 0.0008392333984375, 0.0018534660339355469, 0.0028676986694335938, 0.0038819313049316406, 0.0048961639404296875, 0.005910396575927734, 0.006924629211425781, 0.007938861846923828, 0.008953094482421875, 0.009967327117919922, 0.010981559753417969, 0.011995792388916016, 0.013010025024414062, 0.01402425765991211, 0.015038490295410156, 0.016052722930908203, 0.01706695556640625, 0.018081188201904297, 0.019095420837402344, 0.02010965347290039, 0.021123886108398438, 0.022138118743896484, 0.02315235137939453, 0.024166584014892578, 0.025180816650390625, 0.026195049285888672, 0.02720928192138672, 0.028223514556884766, 0.029237747192382812, 0.03025197982788086, 0.031266212463378906, 0.03228044509887695, 0.033294677734375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 6.0, 8.0, 13.0, 9.0, 13.0, 21.0, 24.0, 25.0, 30.0, 39.0, 55.0, 60.0, 66.0, 45.0, 71.0, 69.0, 66.0, 63.0, 41.0, 53.0, 48.0, 27.0, 28.0, 30.0, 28.0, 32.0, 10.0, 7.0, 6.0, 9.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1563301086425781e-05, -1.1213123798370361e-05, -1.0862946510314941e-05, -1.0512769222259521e-05, -1.0162591934204102e-05, -9.812414646148682e-06, -9.462237358093262e-06, -9.112060070037842e-06, -8.761882781982422e-06, -8.411705493927002e-06, -8.061528205871582e-06, -7.711350917816162e-06, -7.361173629760742e-06, -7.010996341705322e-06, -6.660819053649902e-06, -6.310641765594482e-06, -5.9604644775390625e-06, -5.610287189483643e-06, -5.260109901428223e-06, -4.909932613372803e-06, -4.559755325317383e-06, -4.209578037261963e-06, -3.859400749206543e-06, -3.509223461151123e-06, -3.159046173095703e-06, -2.808868885040283e-06, -2.4586915969848633e-06, -2.1085143089294434e-06, -1.7583370208740234e-06, -1.4081597328186035e-06, -1.0579824447631836e-06, -7.078051567077637e-07, -3.5762786865234375e-07, -7.450580596923828e-09, 3.427267074584961e-07, 6.92903995513916e-07, 1.043081283569336e-06, 1.3932585716247559e-06, 1.7434358596801758e-06, 2.0936131477355957e-06, 2.4437904357910156e-06, 2.7939677238464355e-06, 3.1441450119018555e-06, 3.4943222999572754e-06, 3.844499588012695e-06, 4.194676876068115e-06, 4.544854164123535e-06, 4.895031452178955e-06, 5.245208740234375e-06, 5.595386028289795e-06, 5.945563316345215e-06, 6.295740604400635e-06, 6.645917892456055e-06, 6.996095180511475e-06, 7.3462724685668945e-06, 7.696449756622314e-06, 8.046627044677734e-06, 8.396804332733154e-06, 8.746981620788574e-06, 9.097158908843994e-06, 9.447336196899414e-06, 9.797513484954834e-06, 1.0147690773010254e-05, 1.0497868061065674e-05, 1.0848045349121094e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 3.0, 6.0, 5.0, 6.0, 7.0, 18.0, 26.0, 40.0, 49.0, 89.0, 167.0, 366.0, 780.0, 2370.0, 9471.0, 75666.0, 756400.0, 181316.0, 16377.0, 3431.0, 1056.0, 417.0, 209.0, 113.0, 59.0, 38.0, 24.0, 16.0, 10.0, 6.0, 4.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.02227783203125, -0.021635055541992188, -0.020992279052734375, -0.020349502563476562, -0.01970672607421875, -0.019063949584960938, -0.018421173095703125, -0.017778396606445312, -0.0171356201171875, -0.016492843627929688, -0.015850067138671875, -0.015207290649414062, -0.01456451416015625, -0.013921737670898438, -0.013278961181640625, -0.012636184692382812, -0.011993408203125, -0.011350631713867188, -0.010707855224609375, -0.010065078735351562, -0.00942230224609375, -0.008779525756835938, -0.008136749267578125, -0.0074939727783203125, -0.0068511962890625, -0.0062084197998046875, -0.005565643310546875, -0.0049228668212890625, -0.00428009033203125, -0.0036373138427734375, -0.002994537353515625, -0.0023517608642578125, -0.001708984375, -0.0010662078857421875, -0.000423431396484375, 0.0002193450927734375, 0.00086212158203125, 0.0015048980712890625, 0.002147674560546875, 0.0027904510498046875, 0.0034332275390625, 0.0040760040283203125, 0.004718780517578125, 0.0053615570068359375, 0.00600433349609375, 0.0066471099853515625, 0.007289886474609375, 0.007932662963867188, 0.008575439453125, 0.009218215942382812, 0.009860992431640625, 0.010503768920898438, 0.01114654541015625, 0.011789321899414062, 0.012432098388671875, 0.013074874877929688, 0.0137176513671875, 0.014360427856445312, 0.015003204345703125, 0.015645980834960938, 0.01628875732421875, 0.016931533813476562, 0.017574310302734375, 0.018217086791992188, 0.01885986328125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 3.0, 11.0, 12.0, 11.0, 15.0, 17.0, 34.0, 41.0, 78.0, 73.0, 108.0, 106.0, 97.0, 87.0, 73.0, 66.0, 48.0, 38.0, 30.0, 18.0, 13.0, 6.0, 8.0, 2.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.024169921875, -0.0234830379486084, -0.022796154022216797, -0.022109270095825195, -0.021422386169433594, -0.020735502243041992, -0.02004861831665039, -0.01936173439025879, -0.018674850463867188, -0.017987966537475586, -0.017301082611083984, -0.016614198684692383, -0.01592731475830078, -0.01524043083190918, -0.014553546905517578, -0.013866662979125977, -0.013179779052734375, -0.012492895126342773, -0.011806011199951172, -0.01111912727355957, -0.010432243347167969, -0.009745359420776367, -0.009058475494384766, -0.008371591567993164, -0.0076847076416015625, -0.006997823715209961, -0.006310939788818359, -0.005624055862426758, -0.004937171936035156, -0.004250288009643555, -0.003563404083251953, -0.0028765201568603516, -0.00218963623046875, -0.0015027523040771484, -0.0008158683776855469, -0.0001289844512939453, 0.0005578994750976562, 0.0012447834014892578, 0.0019316673278808594, 0.002618551254272461, 0.0033054351806640625, 0.003992319107055664, 0.004679203033447266, 0.005366086959838867, 0.006052970886230469, 0.00673985481262207, 0.007426738739013672, 0.008113622665405273, 0.008800506591796875, 0.009487390518188477, 0.010174274444580078, 0.01086115837097168, 0.011548042297363281, 0.012234926223754883, 0.012921810150146484, 0.013608694076538086, 0.014295578002929688, 0.014982461929321289, 0.01566934585571289, 0.016356229782104492, 0.017043113708496094, 0.017729997634887695, 0.018416881561279297, 0.0191037654876709, 0.0197906494140625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [2.0, 13.0, 31.0, 395.0, 538.0, 31.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20775380730628967, -0.15670248866081238, -0.10565116256475449, -0.054599836468696594, -0.0035485178232192993, 0.04750281572341919, 0.09855413436889648, 0.14960545301437378, 0.20065677165985107, 0.25170809030532837, 0.30275940895080566, 0.35381072759628296, 0.40486204624176025, 0.45591339468955994, 0.5069646835327148, 0.5580160617828369, 0.6090673208236694, 0.6601186394691467, 0.711169958114624, 0.7622212767601013, 0.8132725954055786, 0.8643239736557007, 0.9153752326965332, 0.9664266109466553, 1.0174779891967773, 1.0685293674468994, 1.119580626487732, 1.170632004737854, 1.2216832637786865, 1.2727346420288086, 1.3237859010696411, 1.3748372793197632, 1.4258884191513062, 1.4769397974014282, 1.5279910564422607, 1.5790424346923828, 1.6300936937332153, 1.6811450719833374, 1.73219633102417, 1.783247709274292, 1.8342989683151245, 1.8853503465652466, 1.936401605606079, 1.9874529838562012, 2.0385043621063232, 2.089555501937866, 2.1406068801879883, 2.1916582584381104, 2.2427096366882324, 2.2937610149383545, 2.3448123931884766, 2.3958635330200195, 2.4469149112701416, 2.4979662895202637, 2.5490176677703857, 2.6000688076019287, 2.651120185852051, 2.702171564102173, 2.753222942352295, 2.804274082183838, 2.85532546043396, 2.906376838684082, 2.957428216934204, 3.008479356765747, 3.059530735015869]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 8.0, 1.0, 4.0, 3.0, 7.0, 9.0, 9.0, 7.0, 8.0, 9.0, 14.0, 32.0, 48.0, 102.0, 110.0, 167.0, 153.0, 127.0, 69.0, 36.0, 18.0, 19.0, 6.0, 5.0, 2.0, 4.0, 3.0, 4.0, 3.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4588866233825684, -1.418999433517456, -1.3791122436523438, -1.3392250537872314, -1.2993378639221191, -1.2594506740570068, -1.2195634841918945, -1.1796762943267822, -1.13978910446167, -1.0999019145965576, -1.0600147247314453, -1.020127534866333, -0.9802403450012207, -0.9403531551361084, -0.9004659652709961, -0.8605787754058838, -0.8206915855407715, -0.7808043956756592, -0.7409172058105469, -0.7010300159454346, -0.6611428260803223, -0.62125563621521, -0.5813684463500977, -0.5414812564849854, -0.501594066619873, -0.46170687675476074, -0.42181968688964844, -0.38193249702453613, -0.34204530715942383, -0.3021581172943115, -0.2622709274291992, -0.22238373756408691, -0.1824965476989746, -0.1426093578338623, -0.10272216796875, -0.0628349781036377, -0.02294778823852539, 0.016939401626586914, 0.05682659149169922, 0.09671378135681152, 0.13660097122192383, 0.17648816108703613, 0.21637535095214844, 0.25626254081726074, 0.29614973068237305, 0.33603692054748535, 0.37592411041259766, 0.41581130027770996, 0.45569849014282227, 0.49558568000793457, 0.5354728698730469, 0.5753600597381592, 0.6152472496032715, 0.6551344394683838, 0.6950216293334961, 0.7349088191986084, 0.7747960090637207, 0.814683198928833, 0.8545703887939453, 0.8944575786590576, 0.9343447685241699, 0.9742319583892822, 1.0141191482543945, 1.0540063381195068, 1.0938935279846191]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 8.0, 9.0, 19.0, 21.0, 25.0, 40.0, 46.0, 85.0, 103.0, 184.0, 236.0, 368.0, 568.0, 887.0, 1470.0, 2372.0, 4193.0, 7981.0, 16318.0, 43379.0, 255070.0, 3706340.0, 100439.0, 27748.0, 11918.0, 6051.0, 3261.0, 1913.0, 1148.0, 662.0, 508.0, 324.0, 195.0, 125.0, 67.0, 64.0, 40.0, 32.0, 25.0, 13.0, 10.0, 7.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.098388671875, -0.09534263610839844, -0.09229660034179688, -0.08925056457519531, -0.08620452880859375, -0.08315849304199219, -0.08011245727539062, -0.07706642150878906, -0.0740203857421875, -0.07097434997558594, -0.06792831420898438, -0.06488227844238281, -0.06183624267578125, -0.05879020690917969, -0.055744171142578125, -0.05269813537597656, -0.049652099609375, -0.04660606384277344, -0.043560028076171875, -0.04051399230957031, -0.03746795654296875, -0.03442192077636719, -0.031375885009765625, -0.028329849243164062, -0.0252838134765625, -0.022237777709960938, -0.019191741943359375, -0.016145706176757812, -0.01309967041015625, -0.010053634643554688, -0.007007598876953125, -0.0039615631103515625, -0.00091552734375, 0.0021305084228515625, 0.005176544189453125, 0.008222579956054688, 0.01126861572265625, 0.014314651489257812, 0.017360687255859375, 0.020406723022460938, 0.0234527587890625, 0.026498794555664062, 0.029544830322265625, 0.03259086608886719, 0.03563690185546875, 0.03868293762207031, 0.041728973388671875, 0.04477500915527344, 0.047821044921875, 0.05086708068847656, 0.053913116455078125, 0.05695915222167969, 0.06000518798828125, 0.06305122375488281, 0.06609725952148438, 0.06914329528808594, 0.0721893310546875, 0.07523536682128906, 0.07828140258789062, 0.08132743835449219, 0.08437347412109375, 0.08741950988769531, 0.09046554565429688, 0.09351158142089844, 0.0965576171875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 7.0, 5.0, 6.0, 7.0, 15.0, 13.0, 15.0, 27.0, 22.0, 25.0, 36.0, 43.0, 81.0, 182.0, 191.0, 96.0, 41.0, 34.0, 33.0, 17.0, 18.0, 17.0, 12.0, 17.0, 5.0, 8.0, 6.0, 8.0, 4.0, 2.0, 1.0, 2.0, 0.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0208587646484375, -0.0203096866607666, -0.019760608673095703, -0.019211530685424805, -0.018662452697753906, -0.018113374710083008, -0.01756429672241211, -0.01701521873474121, -0.016466140747070312, -0.015917062759399414, -0.015367984771728516, -0.014818906784057617, -0.014269828796386719, -0.01372075080871582, -0.013171672821044922, -0.012622594833374023, -0.012073516845703125, -0.011524438858032227, -0.010975360870361328, -0.01042628288269043, -0.009877204895019531, -0.009328126907348633, -0.008779048919677734, -0.008229970932006836, -0.0076808929443359375, -0.007131814956665039, -0.006582736968994141, -0.006033658981323242, -0.005484580993652344, -0.004935503005981445, -0.004386425018310547, -0.0038373470306396484, -0.00328826904296875, -0.0027391910552978516, -0.002190113067626953, -0.0016410350799560547, -0.0010919570922851562, -0.0005428791046142578, 6.198883056640625e-06, 0.0005552768707275391, 0.0011043548583984375, 0.001653432846069336, 0.0022025108337402344, 0.002751588821411133, 0.0033006668090820312, 0.0038497447967529297, 0.004398822784423828, 0.0049479007720947266, 0.005496978759765625, 0.0060460567474365234, 0.006595134735107422, 0.00714421272277832, 0.007693290710449219, 0.008242368698120117, 0.008791446685791016, 0.009340524673461914, 0.009889602661132812, 0.010438680648803711, 0.01098775863647461, 0.011536836624145508, 0.012085914611816406, 0.012634992599487305, 0.013184070587158203, 0.013733148574829102, 0.0142822265625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 5.0, 1.0, 3.0, 4.0, 5.0, 8.0, 16.0, 13.0, 13.0, 22.0, 40.0, 48.0, 78.0, 125.0, 220.0, 389.0, 668.0, 1433.0, 3366.0, 8682.0, 26489.0, 111000.0, 3259480.0, 680511.0, 70604.0, 19197.0, 6634.0, 2682.0, 1128.0, 593.0, 290.0, 204.0, 115.0, 65.0, 51.0, 33.0, 22.0, 12.0, 10.0, 7.0, 3.0, 8.0, 4.0, 0.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09619140625, -0.09317207336425781, -0.09015274047851562, -0.08713340759277344, -0.08411407470703125, -0.08109474182128906, -0.07807540893554688, -0.07505607604980469, -0.0720367431640625, -0.06901741027832031, -0.06599807739257812, -0.06297874450683594, -0.05995941162109375, -0.05694007873535156, -0.053920745849609375, -0.05090141296386719, -0.047882080078125, -0.04486274719238281, -0.041843414306640625, -0.03882408142089844, -0.03580474853515625, -0.03278541564941406, -0.029766082763671875, -0.026746749877929688, -0.0237274169921875, -0.020708084106445312, -0.017688751220703125, -0.014669418334960938, -0.01165008544921875, -0.008630752563476562, -0.005611419677734375, -0.0025920867919921875, 0.00042724609375, 0.0034465789794921875, 0.006465911865234375, 0.009485244750976562, 0.01250457763671875, 0.015523910522460938, 0.018543243408203125, 0.021562576293945312, 0.0245819091796875, 0.027601242065429688, 0.030620574951171875, 0.03363990783691406, 0.03665924072265625, 0.03967857360839844, 0.042697906494140625, 0.04571723937988281, 0.048736572265625, 0.05175590515136719, 0.054775238037109375, 0.05779457092285156, 0.06081390380859375, 0.06383323669433594, 0.06685256958007812, 0.06987190246582031, 0.0728912353515625, 0.07591056823730469, 0.07892990112304688, 0.08194923400878906, 0.08496856689453125, 0.08798789978027344, 0.09100723266601562, 0.09402656555175781, 0.0970458984375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 5.0, 2.0, 14.0, 9.0, 13.0, 15.0, 16.0, 28.0, 53.0, 58.0, 82.0, 136.0, 251.0, 629.0, 1837.0, 365.0, 172.0, 107.0, 65.0, 52.0, 37.0, 25.0, 21.0, 17.0, 14.0, 10.0, 8.0, 4.0, 3.0, 6.0, 7.0, 2.0, 0.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0224151611328125, -0.021828889846801758, -0.021242618560791016, -0.020656347274780273, -0.02007007598876953, -0.01948380470275879, -0.018897533416748047, -0.018311262130737305, -0.017724990844726562, -0.01713871955871582, -0.016552448272705078, -0.015966176986694336, -0.015379905700683594, -0.014793634414672852, -0.01420736312866211, -0.013621091842651367, -0.013034820556640625, -0.012448549270629883, -0.01186227798461914, -0.011276006698608398, -0.010689735412597656, -0.010103464126586914, -0.009517192840576172, -0.00893092155456543, -0.008344650268554688, -0.007758378982543945, -0.007172107696533203, -0.006585836410522461, -0.005999565124511719, -0.0054132938385009766, -0.004827022552490234, -0.004240751266479492, -0.00365447998046875, -0.003068208694458008, -0.0024819374084472656, -0.0018956661224365234, -0.0013093948364257812, -0.0007231235504150391, -0.00013685226440429688, 0.0004494190216064453, 0.0010356903076171875, 0.0016219615936279297, 0.002208232879638672, 0.002794504165649414, 0.0033807754516601562, 0.0039670467376708984, 0.004553318023681641, 0.005139589309692383, 0.005725860595703125, 0.006312131881713867, 0.006898403167724609, 0.0074846744537353516, 0.008070945739746094, 0.008657217025756836, 0.009243488311767578, 0.00982975959777832, 0.010416030883789062, 0.011002302169799805, 0.011588573455810547, 0.012174844741821289, 0.012761116027832031, 0.013347387313842773, 0.013933658599853516, 0.014519929885864258, 0.015106201171875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 32.0, 142.0, 435.0, 303.0, 68.0, 19.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08249970525503159, -0.07544651627540588, -0.06839332729578018, -0.06134013831615448, -0.05428694933652878, -0.047233764082193375, -0.04018057510256767, -0.03312738612294197, -0.02607419714331627, -0.019021008163690567, -0.01196782011538744, -0.0049146320670843124, 0.0021385569125413895, 0.009191744029521942, 0.016244933009147644, 0.023298121988773346, 0.030351310968399048, 0.03740449994802475, 0.04445768892765045, 0.051510877907276154, 0.058564066886901855, 0.06561724841594696, 0.07267044484615326, 0.07972362637519836, 0.08677682280540466, 0.09383001178503036, 0.10088320076465607, 0.10793638974428177, 0.11498957872390747, 0.12204276025295258, 0.12909595668315887, 0.13614913821220398, 0.14320231974124908, 0.1502555012702942, 0.1573086977005005, 0.1643618792295456, 0.1714150756597519, 0.178468257188797, 0.1855214536190033, 0.1925746351480484, 0.1996278315782547, 0.2066810131072998, 0.2137342095375061, 0.2207873910665512, 0.2278405874967575, 0.2348937690258026, 0.2419469654560089, 0.24900014698505402, 0.2560533285140991, 0.2631065249443054, 0.27015969157218933, 0.27721288800239563, 0.28426608443260193, 0.2913192808628082, 0.29837244749069214, 0.30542564392089844, 0.31247884035110474, 0.31953203678131104, 0.32658520340919495, 0.33363839983940125, 0.34069159626960754, 0.34774479269981384, 0.35479795932769775, 0.36185115575790405, 0.36890435218811035]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 10.0, 6.0, 9.0, 16.0, 13.0, 19.0, 25.0, 35.0, 51.0, 49.0, 75.0, 57.0, 77.0, 86.0, 77.0, 76.0, 59.0, 53.0, 33.0, 35.0, 28.0, 25.0, 10.0, 21.0, 11.0, 4.0, 8.0, 6.0, 5.0, 4.0, 4.0, 2.0, 0.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.08272719383239746, -0.08022410422563553, -0.0777210146188736, -0.07521792501211166, -0.07271483540534973, -0.0702117532491684, -0.06770866364240646, -0.06520557403564453, -0.0627024844288826, -0.060199394822120667, -0.057696305215358734, -0.0551932193338871, -0.05269012972712517, -0.050187040120363235, -0.0476839542388916, -0.04518086463212967, -0.04267777502536774, -0.040174685418605804, -0.03767159581184387, -0.03516850993037224, -0.032665420323610306, -0.030162330716848373, -0.02765924297273159, -0.025156155228614807, -0.022653065621852875, -0.020149976015090942, -0.01764688827097416, -0.015143799595534801, -0.012640710920095444, -0.010137622244656086, -0.007634533569216728, -0.005131445825099945, -0.0026283562183380127, -0.00012526754289865494, 0.002377821132540703, 0.004880909807980061, 0.007383998483419418, 0.009887087158858776, 0.012390175834298134, 0.014893263578414917, 0.01739635318517685, 0.019899442791938782, 0.022402530536055565, 0.024905618280172348, 0.02740870788693428, 0.029911797493696213, 0.03241488337516785, 0.03491797298192978, 0.03742106258869171, 0.039924152195453644, 0.042427241802215576, 0.04493032768368721, 0.04743341729044914, 0.049936506897211075, 0.05243959277868271, 0.05494268238544464, 0.057445771992206573, 0.059948861598968506, 0.06245195120573044, 0.06495504081249237, 0.0674581229686737, 0.06996121257543564, 0.07246430218219757, 0.0749673917889595, 0.07747048139572144]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 5.0, 2.0, 3.0, 10.0, 8.0, 17.0, 13.0, 24.0, 43.0, 44.0, 78.0, 126.0, 204.0, 336.0, 537.0, 997.0, 1892.0, 3656.0, 8401.0, 21395.0, 73443.0, 622629.0, 240371.0, 46349.0, 15355.0, 6187.0, 2935.0, 1409.0, 781.0, 499.0, 287.0, 186.0, 108.0, 70.0, 48.0, 40.0, 13.0, 13.0, 16.0, 14.0, 9.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11676025390625, -0.11350154876708984, -0.11024284362792969, -0.10698413848876953, -0.10372543334960938, -0.10046672821044922, -0.09720802307128906, -0.0939493179321289, -0.09069061279296875, -0.0874319076538086, -0.08417320251464844, -0.08091449737548828, -0.07765579223632812, -0.07439708709716797, -0.07113838195800781, -0.06787967681884766, -0.0646209716796875, -0.061362266540527344, -0.05810356140136719, -0.05484485626220703, -0.051586151123046875, -0.04832744598388672, -0.04506874084472656, -0.041810035705566406, -0.03855133056640625, -0.035292625427246094, -0.03203392028808594, -0.02877521514892578, -0.025516510009765625, -0.02225780487060547, -0.018999099731445312, -0.015740394592285156, -0.012481689453125, -0.009222984313964844, -0.0059642791748046875, -0.0027055740356445312, 0.000553131103515625, 0.0038118362426757812, 0.0070705413818359375, 0.010329246520996094, 0.01358795166015625, 0.016846656799316406, 0.020105361938476562, 0.02336406707763672, 0.026622772216796875, 0.02988147735595703, 0.03314018249511719, 0.036398887634277344, 0.0396575927734375, 0.042916297912597656, 0.04617500305175781, 0.04943370819091797, 0.052692413330078125, 0.05595111846923828, 0.05920982360839844, 0.062468528747558594, 0.06572723388671875, 0.0689859390258789, 0.07224464416503906, 0.07550334930419922, 0.07876205444335938, 0.08202075958251953, 0.08527946472167969, 0.08853816986083984, 0.091796875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 2.0, 4.0, 7.0, 5.0, 7.0, 14.0, 17.0, 11.0, 24.0, 26.0, 39.0, 26.0, 55.0, 113.0, 176.0, 151.0, 84.0, 44.0, 36.0, 32.0, 26.0, 13.0, 19.0, 8.0, 18.0, 12.0, 2.0, 9.0, 3.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.0210418701171875, -0.020514369010925293, -0.019986867904663086, -0.01945936679840088, -0.018931865692138672, -0.018404364585876465, -0.017876863479614258, -0.01734936237335205, -0.016821861267089844, -0.016294360160827637, -0.01576685905456543, -0.015239357948303223, -0.014711856842041016, -0.014184355735778809, -0.013656854629516602, -0.013129353523254395, -0.012601852416992188, -0.01207435131072998, -0.011546850204467773, -0.011019349098205566, -0.01049184799194336, -0.009964346885681152, -0.009436845779418945, -0.008909344673156738, -0.008381843566894531, -0.007854342460632324, -0.007326841354370117, -0.00679934024810791, -0.006271839141845703, -0.005744338035583496, -0.005216836929321289, -0.004689335823059082, -0.004161834716796875, -0.003634333610534668, -0.003106832504272461, -0.002579331398010254, -0.002051830291748047, -0.0015243291854858398, -0.0009968280792236328, -0.0004693269729614258, 5.817413330078125e-05, 0.0005856752395629883, 0.0011131763458251953, 0.0016406774520874023, 0.0021681785583496094, 0.0026956796646118164, 0.0032231807708740234, 0.0037506818771362305, 0.0042781829833984375, 0.0048056840896606445, 0.0053331851959228516, 0.005860686302185059, 0.006388187408447266, 0.006915688514709473, 0.00744318962097168, 0.007970690727233887, 0.008498191833496094, 0.0090256929397583, 0.009553194046020508, 0.010080695152282715, 0.010608196258544922, 0.011135697364807129, 0.011663198471069336, 0.012190699577331543, 0.01271820068359375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 9.0, 2.0, 7.0, 13.0, 22.0, 21.0, 36.0, 66.0, 88.0, 196.0, 501.0, 2216.0, 15803.0, 485391.0, 525182.0, 15805.0, 2199.0, 526.0, 197.0, 82.0, 64.0, 28.0, 28.0, 16.0, 5.0, 8.0, 8.0, 3.0, 2.0, 5.0, 4.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.1575927734375, -0.1530914306640625, -0.148590087890625, -0.1440887451171875, -0.13958740234375, -0.1350860595703125, -0.130584716796875, -0.1260833740234375, -0.12158203125, -0.1170806884765625, -0.112579345703125, -0.1080780029296875, -0.10357666015625, -0.0990753173828125, -0.094573974609375, -0.0900726318359375, -0.0855712890625, -0.0810699462890625, -0.076568603515625, -0.0720672607421875, -0.06756591796875, -0.0630645751953125, -0.058563232421875, -0.0540618896484375, -0.049560546875, -0.0450592041015625, -0.040557861328125, -0.0360565185546875, -0.03155517578125, -0.0270538330078125, -0.022552490234375, -0.0180511474609375, -0.0135498046875, -0.0090484619140625, -0.004547119140625, -4.57763671875e-05, 0.00445556640625, 0.0089569091796875, 0.013458251953125, 0.0179595947265625, 0.0224609375, 0.0269622802734375, 0.031463623046875, 0.0359649658203125, 0.04046630859375, 0.0449676513671875, 0.049468994140625, 0.0539703369140625, 0.0584716796875, 0.0629730224609375, 0.067474365234375, 0.0719757080078125, 0.07647705078125, 0.0809783935546875, 0.085479736328125, 0.0899810791015625, 0.094482421875, 0.0989837646484375, 0.103485107421875, 0.1079864501953125, 0.11248779296875, 0.1169891357421875, 0.121490478515625, 0.1259918212890625, 0.1304931640625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 10.0, 6.0, 7.0, 5.0, 8.0, 18.0, 19.0, 14.0, 23.0, 21.0, 28.0, 32.0, 40.0, 42.0, 56.0, 46.0, 49.0, 46.0, 55.0, 44.0, 35.0, 49.0, 57.0, 38.0, 34.0, 42.0, 25.0, 31.0, 25.0, 16.0, 19.0, 12.0, 10.0, 12.0, 4.0, 7.0, 7.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.05364990234375, -0.052046775817871094, -0.05044364929199219, -0.04884052276611328, -0.047237396240234375, -0.04563426971435547, -0.04403114318847656, -0.042428016662597656, -0.04082489013671875, -0.039221763610839844, -0.03761863708496094, -0.03601551055908203, -0.034412384033203125, -0.03280925750732422, -0.031206130981445312, -0.029603004455566406, -0.0279998779296875, -0.026396751403808594, -0.024793624877929688, -0.02319049835205078, -0.021587371826171875, -0.01998424530029297, -0.018381118774414062, -0.016777992248535156, -0.01517486572265625, -0.013571739196777344, -0.011968612670898438, -0.010365486145019531, -0.008762359619140625, -0.007159233093261719, -0.0055561065673828125, -0.003952980041503906, -0.002349853515625, -0.0007467269897460938, 0.0008563995361328125, 0.0024595260620117188, 0.004062652587890625, 0.005665779113769531, 0.0072689056396484375, 0.008872032165527344, 0.01047515869140625, 0.012078285217285156, 0.013681411743164062, 0.015284538269042969, 0.016887664794921875, 0.01849079132080078, 0.020093917846679688, 0.021697044372558594, 0.0233001708984375, 0.024903297424316406, 0.026506423950195312, 0.02810955047607422, 0.029712677001953125, 0.03131580352783203, 0.03291893005371094, 0.034522056579589844, 0.03612518310546875, 0.037728309631347656, 0.03933143615722656, 0.04093456268310547, 0.042537689208984375, 0.04414081573486328, 0.04574394226074219, 0.047347068786621094, 0.0489501953125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 7.0, 13.0, 25.0, 78.0, 554.0, 616227.0, 430949.0, 562.0, 82.0, 33.0, 15.0, 3.0, 3.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4658203125, -0.4538726806640625, -0.441925048828125, -0.4299774169921875, -0.41802978515625, -0.4060821533203125, -0.394134521484375, -0.3821868896484375, -0.3702392578125, -0.3582916259765625, -0.346343994140625, -0.3343963623046875, -0.32244873046875, -0.3105010986328125, -0.298553466796875, -0.2866058349609375, -0.274658203125, -0.2627105712890625, -0.250762939453125, -0.2388153076171875, -0.22686767578125, -0.2149200439453125, -0.202972412109375, -0.1910247802734375, -0.1790771484375, -0.1671295166015625, -0.155181884765625, -0.1432342529296875, -0.13128662109375, -0.1193389892578125, -0.107391357421875, -0.0954437255859375, -0.08349609375, -0.0715484619140625, -0.059600830078125, -0.0476531982421875, -0.03570556640625, -0.0237579345703125, -0.011810302734375, 0.0001373291015625, 0.0120849609375, 0.0240325927734375, 0.035980224609375, 0.0479278564453125, 0.05987548828125, 0.0718231201171875, 0.083770751953125, 0.0957183837890625, 0.107666015625, 0.1196136474609375, 0.131561279296875, 0.1435089111328125, 0.15545654296875, 0.1674041748046875, 0.179351806640625, 0.1912994384765625, 0.2032470703125, 0.2151947021484375, 0.227142333984375, 0.2390899658203125, 0.25103759765625, 0.2629852294921875, 0.274932861328125, 0.2868804931640625, 0.298828125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 2.0, 5.0, 5.0, 9.0, 17.0, 14.0, 23.0, 34.0, 45.0, 62.0, 70.0, 99.0, 106.0, 121.0, 83.0, 79.0, 57.0, 34.0, 29.0, 25.0, 9.0, 7.0, 10.0, 7.0, 9.0, 6.0, 8.0, 3.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.9981136322021484e-05, -2.8857029974460602e-05, -2.773292362689972e-05, -2.6608817279338837e-05, -2.5484710931777954e-05, -2.436060458421707e-05, -2.323649823665619e-05, -2.2112391889095306e-05, -2.0988285541534424e-05, -1.986417919397354e-05, -1.874007284641266e-05, -1.7615966498851776e-05, -1.6491860151290894e-05, -1.536775380373001e-05, -1.4243647456169128e-05, -1.3119541108608246e-05, -1.1995434761047363e-05, -1.087132841348648e-05, -9.747222065925598e-06, -8.623115718364716e-06, -7.499009370803833e-06, -6.3749030232429504e-06, -5.250796675682068e-06, -4.126690328121185e-06, -3.0025839805603027e-06, -1.8784776329994202e-06, -7.543712854385376e-07, 3.6973506212234497e-07, 1.4938414096832275e-06, 2.61794775724411e-06, 3.7420541048049927e-06, 4.866160452365875e-06, 5.990266799926758e-06, 7.11437314748764e-06, 8.238479495048523e-06, 9.362585842609406e-06, 1.0486692190170288e-05, 1.161079853773117e-05, 1.2734904885292053e-05, 1.3859011232852936e-05, 1.4983117580413818e-05, 1.61072239279747e-05, 1.7231330275535583e-05, 1.8355436623096466e-05, 1.947954297065735e-05, 2.060364931821823e-05, 2.1727755665779114e-05, 2.2851862013339996e-05, 2.397596836090088e-05, 2.510007470846176e-05, 2.6224181056022644e-05, 2.7348287403583527e-05, 2.847239375114441e-05, 2.9596500098705292e-05, 3.0720606446266174e-05, 3.184471279382706e-05, 3.296881914138794e-05, 3.409292548894882e-05, 3.5217031836509705e-05, 3.634113818407059e-05, 3.746524453163147e-05, 3.858935087919235e-05, 3.9713457226753235e-05, 4.083756357431412e-05, 4.1961669921875e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 10.0, 12.0, 28.0, 34.0, 50.0, 107.0, 208.0, 500.0, 1401.0, 5130.0, 38540.0, 842549.0, 145093.0, 10940.0, 2487.0, 795.0, 344.0, 126.0, 69.0, 42.0, 16.0, 15.0, 14.0, 8.0, 9.0, 5.0, 6.0, 2.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09271240234375, -0.08987712860107422, -0.08704185485839844, -0.08420658111572266, -0.08137130737304688, -0.0785360336303711, -0.07570075988769531, -0.07286548614501953, -0.07003021240234375, -0.06719493865966797, -0.06435966491699219, -0.061524391174316406, -0.058689117431640625, -0.055853843688964844, -0.05301856994628906, -0.05018329620361328, -0.0473480224609375, -0.04451274871826172, -0.04167747497558594, -0.038842201232910156, -0.036006927490234375, -0.033171653747558594, -0.030336380004882812, -0.02750110626220703, -0.02466583251953125, -0.02183055877685547, -0.018995285034179688, -0.016160011291503906, -0.013324737548828125, -0.010489463806152344, -0.0076541900634765625, -0.004818916320800781, -0.001983642578125, 0.0008516311645507812, 0.0036869049072265625, 0.006522178649902344, 0.009357452392578125, 0.012192726135253906, 0.015027999877929688, 0.01786327362060547, 0.02069854736328125, 0.02353382110595703, 0.026369094848632812, 0.029204368591308594, 0.032039642333984375, 0.034874916076660156, 0.03771018981933594, 0.04054546356201172, 0.0433807373046875, 0.04621601104736328, 0.04905128479003906, 0.051886558532714844, 0.054721832275390625, 0.057557106018066406, 0.06039237976074219, 0.06322765350341797, 0.06606292724609375, 0.06889820098876953, 0.07173347473144531, 0.0745687484741211, 0.07740402221679688, 0.08023929595947266, 0.08307456970214844, 0.08590984344482422, 0.0887451171875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 8.0, 6.0, 10.0, 16.0, 25.0, 41.0, 67.0, 124.0, 133.0, 173.0, 160.0, 93.0, 51.0, 26.0, 16.0, 12.0, 8.0, 8.0, 4.0, 1.0, 2.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.057373046875, -0.05559873580932617, -0.053824424743652344, -0.052050113677978516, -0.05027580261230469, -0.04850149154663086, -0.04672718048095703, -0.0449528694152832, -0.043178558349609375, -0.04140424728393555, -0.03962993621826172, -0.03785562515258789, -0.03608131408691406, -0.034307003021240234, -0.032532691955566406, -0.030758380889892578, -0.02898406982421875, -0.027209758758544922, -0.025435447692871094, -0.023661136627197266, -0.021886825561523438, -0.02011251449584961, -0.01833820343017578, -0.016563892364501953, -0.014789581298828125, -0.013015270233154297, -0.011240959167480469, -0.00946664810180664, -0.0076923370361328125, -0.005918025970458984, -0.004143714904785156, -0.002369403839111328, -0.0005950927734375, 0.0011792182922363281, 0.0029535293579101562, 0.004727840423583984, 0.0065021514892578125, 0.00827646255493164, 0.010050773620605469, 0.011825084686279297, 0.013599395751953125, 0.015373706817626953, 0.01714801788330078, 0.01892232894897461, 0.020696640014648438, 0.022470951080322266, 0.024245262145996094, 0.026019573211669922, 0.02779388427734375, 0.029568195343017578, 0.031342506408691406, 0.033116817474365234, 0.03489112854003906, 0.03666543960571289, 0.03843975067138672, 0.04021406173706055, 0.041988372802734375, 0.0437626838684082, 0.04553699493408203, 0.04731130599975586, 0.04908561706542969, 0.050859928131103516, 0.052634239196777344, 0.05440855026245117, 0.056182861328125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 7.0, 16.0, 218.0, 732.0, 32.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35238611698150635, -0.2851608991622925, -0.21793566644191742, -0.15071043372154236, -0.08348521590232849, -0.016259998083114624, 0.05096524953842163, 0.1181904673576355, 0.18541568517684937, 0.25264090299606323, 0.3198661208152771, 0.38709136843681335, 0.4543165862560272, 0.5215418338775635, 0.5887670516967773, 0.6559922695159912, 0.7232174873352051, 0.790442705154419, 0.8576679229736328, 0.9248931407928467, 0.9921183586120605, 1.0593435764312744, 1.1265687942504883, 1.1937940120697021, 1.261019229888916, 1.3282444477081299, 1.3954696655273438, 1.4626948833465576, 1.5299201011657715, 1.5971453189849854, 1.6643705368041992, 1.731595754623413, 1.798821210861206, 1.86604642868042, 1.9332716464996338, 2.0004968643188477, 2.0677220821380615, 2.1349472999572754, 2.2021725177764893, 2.269397735595703, 2.336622953414917, 2.403848171234131, 2.4710733890533447, 2.5382986068725586, 2.6055238246917725, 2.6727490425109863, 2.7399742603302, 2.807199478149414, 2.874424934387207, 2.941650152206421, 3.0088753700256348, 3.0761005878448486, 3.1433258056640625, 3.2105510234832764, 3.2777762413024902, 3.345001459121704, 3.412226676940918, 3.479451894760132, 3.5466771125793457, 3.6139023303985596, 3.6811275482177734, 3.7483527660369873, 3.815577983856201, 3.882803201675415, 3.950028419494629]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 1.0, 8.0, 10.0, 12.0, 8.0, 8.0, 9.0, 14.0, 15.0, 27.0, 33.0, 42.0, 52.0, 51.0, 66.0, 54.0, 72.0, 65.0, 71.0, 65.0, 46.0, 46.0, 40.0, 26.0, 38.0, 22.0, 18.0, 15.0, 20.0, 8.0, 4.0, 8.0, 4.0, 3.0, 3.0, 6.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4513883590698242, -0.4379616677761078, -0.42453497648239136, -0.41110825538635254, -0.3976815640926361, -0.3842548727989197, -0.37082818150520325, -0.3574014902114868, -0.343974769115448, -0.33054807782173157, -0.31712138652801514, -0.3036946654319763, -0.2902679741382599, -0.27684128284454346, -0.263414591550827, -0.2499879002571106, -0.23656120896339417, -0.22313451766967773, -0.2097078114748001, -0.19628112018108368, -0.18285441398620605, -0.16942772269248962, -0.1560010313987732, -0.14257434010505676, -0.12914763391017914, -0.11572093516588211, -0.10229423642158508, -0.08886754512786865, -0.07544084638357162, -0.0620141476392746, -0.048587456345558167, -0.03516075760126114, -0.02173405885696411, -0.008307361975312233, 0.005119334906339645, 0.018546029925346375, 0.0319727286696434, 0.04539942741394043, 0.05882611870765686, 0.07225281745195389, 0.08567951619625092, 0.09910621494054794, 0.11253291368484497, 0.1259596049785614, 0.13938629627227783, 0.15281300246715546, 0.1662396937608719, 0.1796663999557495, 0.19309309124946594, 0.20651978254318237, 0.21994648873806, 0.23337318003177643, 0.24679988622665405, 0.2602265775203705, 0.2736532688140869, 0.28707996010780334, 0.3005066514015198, 0.3139333426952362, 0.32736003398895264, 0.34078675508499146, 0.3542134463787079, 0.3676401376724243, 0.38106682896614075, 0.3944935202598572, 0.407920241355896]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 4.0, 7.0, 3.0, 5.0, 16.0, 8.0, 10.0, 21.0, 20.0, 32.0, 27.0, 32.0, 54.0, 68.0, 98.0, 127.0, 183.0, 271.0, 384.0, 625.0, 812.0, 1244.0, 1796.0, 2898.0, 4701.0, 9240.0, 24348.0, 138289.0, 3877231.0, 90253.0, 20420.0, 8250.0, 4348.0, 2699.0, 1789.0, 1113.0, 819.0, 584.0, 411.0, 331.0, 211.0, 144.0, 113.0, 72.0, 63.0, 37.0, 29.0, 20.0, 13.0, 6.0, 6.0, 2.0, 2.0, 1.0], "bins": [-0.177734375, -0.17310714721679688, -0.16847991943359375, -0.16385269165039062, -0.1592254638671875, -0.15459823608398438, -0.14997100830078125, -0.14534378051757812, -0.140716552734375, -0.13608932495117188, -0.13146209716796875, -0.12683486938476562, -0.1222076416015625, -0.11758041381835938, -0.11295318603515625, -0.10832595825195312, -0.10369873046875, -0.09907150268554688, -0.09444427490234375, -0.08981704711914062, -0.0851898193359375, -0.08056259155273438, -0.07593536376953125, -0.07130813598632812, -0.066680908203125, -0.062053680419921875, -0.05742645263671875, -0.052799224853515625, -0.0481719970703125, -0.043544769287109375, -0.03891754150390625, -0.034290313720703125, -0.0296630859375, -0.025035858154296875, -0.02040863037109375, -0.015781402587890625, -0.0111541748046875, -0.006526947021484375, -0.00189971923828125, 0.002727508544921875, 0.007354736328125, 0.011981964111328125, 0.01660919189453125, 0.021236419677734375, 0.0258636474609375, 0.030490875244140625, 0.03511810302734375, 0.039745330810546875, 0.04437255859375, 0.048999786376953125, 0.05362701416015625, 0.058254241943359375, 0.0628814697265625, 0.06750869750976562, 0.07213592529296875, 0.07676315307617188, 0.081390380859375, 0.08601760864257812, 0.09064483642578125, 0.09527206420898438, 0.0998992919921875, 0.10452651977539062, 0.10915374755859375, 0.11378097534179688, 0.118408203125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 3.0, 6.0, 12.0, 11.0, 17.0, 19.0, 13.0, 18.0, 32.0, 39.0, 66.0, 82.0, 137.0, 142.0, 121.0, 63.0, 51.0, 42.0, 15.0, 20.0, 17.0, 13.0, 19.0, 5.0, 8.0, 5.0, 6.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0], "bins": [-0.0209197998046875, -0.020386576652526855, -0.01985335350036621, -0.019320130348205566, -0.018786907196044922, -0.018253684043884277, -0.017720460891723633, -0.01718723773956299, -0.016654014587402344, -0.0161207914352417, -0.015587568283081055, -0.01505434513092041, -0.014521121978759766, -0.013987898826599121, -0.013454675674438477, -0.012921452522277832, -0.012388229370117188, -0.011855006217956543, -0.011321783065795898, -0.010788559913635254, -0.01025533676147461, -0.009722113609313965, -0.00918889045715332, -0.008655667304992676, -0.008122444152832031, -0.007589221000671387, -0.007055997848510742, -0.006522774696350098, -0.005989551544189453, -0.005456328392028809, -0.004923105239868164, -0.0043898820877075195, -0.003856658935546875, -0.0033234357833862305, -0.002790212631225586, -0.0022569894790649414, -0.0017237663269042969, -0.0011905431747436523, -0.0006573200225830078, -0.00012409687042236328, 0.00040912628173828125, 0.0009423494338989258, 0.0014755725860595703, 0.002008795738220215, 0.0025420188903808594, 0.003075242042541504, 0.0036084651947021484, 0.004141688346862793, 0.0046749114990234375, 0.005208134651184082, 0.0057413578033447266, 0.006274580955505371, 0.006807804107666016, 0.00734102725982666, 0.007874250411987305, 0.00840747356414795, 0.008940696716308594, 0.009473919868469238, 0.010007143020629883, 0.010540366172790527, 0.011073589324951172, 0.011606812477111816, 0.012140035629272461, 0.012673258781433105, 0.01320648193359375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 5.0, 12.0, 12.0, 14.0, 15.0, 40.0, 53.0, 90.0, 164.0, 324.0, 812.0, 2214.0, 6765.0, 23959.0, 154203.0, 3821972.0, 149177.0, 23828.0, 6628.0, 2308.0, 871.0, 334.0, 181.0, 85.0, 62.0, 40.0, 27.0, 20.0, 14.0, 12.0, 11.0, 5.0, 10.0, 2.0, 5.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1544189453125, -0.1493549346923828, -0.14429092407226562, -0.13922691345214844, -0.13416290283203125, -0.12909889221191406, -0.12403488159179688, -0.11897087097167969, -0.1139068603515625, -0.10884284973144531, -0.10377883911132812, -0.09871482849121094, -0.09365081787109375, -0.08858680725097656, -0.08352279663085938, -0.07845878601074219, -0.073394775390625, -0.06833076477050781, -0.06326675415039062, -0.05820274353027344, -0.05313873291015625, -0.04807472229003906, -0.043010711669921875, -0.03794670104980469, -0.0328826904296875, -0.027818679809570312, -0.022754669189453125, -0.017690658569335938, -0.01262664794921875, -0.0075626373291015625, -0.002498626708984375, 0.0025653839111328125, 0.00762939453125, 0.012693405151367188, 0.017757415771484375, 0.022821426391601562, 0.02788543701171875, 0.03294944763183594, 0.038013458251953125, 0.04307746887207031, 0.0481414794921875, 0.05320549011230469, 0.058269500732421875, 0.06333351135253906, 0.06839752197265625, 0.07346153259277344, 0.07852554321289062, 0.08358955383300781, 0.088653564453125, 0.09371757507324219, 0.09878158569335938, 0.10384559631347656, 0.10890960693359375, 0.11397361755371094, 0.11903762817382812, 0.12410163879394531, 0.1291656494140625, 0.1342296600341797, 0.13929367065429688, 0.14435768127441406, 0.14942169189453125, 0.15448570251464844, 0.15954971313476562, 0.1646137237548828, 0.169677734375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 4.0, 4.0, 3.0, 6.0, 7.0, 4.0, 9.0, 14.0, 10.0, 19.0, 33.0, 33.0, 45.0, 71.0, 105.0, 177.0, 409.0, 1784.0, 655.0, 231.0, 126.0, 98.0, 52.0, 33.0, 28.0, 24.0, 15.0, 19.0, 12.0, 7.0, 8.0, 4.0, 8.0, 2.0, 0.0, 3.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0160675048828125, -0.015443563461303711, -0.014819622039794922, -0.014195680618286133, -0.013571739196777344, -0.012947797775268555, -0.012323856353759766, -0.011699914932250977, -0.011075973510742188, -0.010452032089233398, -0.00982809066772461, -0.00920414924621582, -0.008580207824707031, -0.007956266403198242, -0.007332324981689453, -0.006708383560180664, -0.006084442138671875, -0.005460500717163086, -0.004836559295654297, -0.004212617874145508, -0.0035886764526367188, -0.0029647350311279297, -0.0023407936096191406, -0.0017168521881103516, -0.0010929107666015625, -0.00046896934509277344, 0.00015497207641601562, 0.0007789134979248047, 0.0014028549194335938, 0.002026796340942383, 0.002650737762451172, 0.003274679183959961, 0.00389862060546875, 0.004522562026977539, 0.005146503448486328, 0.005770444869995117, 0.006394386291503906, 0.007018327713012695, 0.007642269134521484, 0.008266210556030273, 0.008890151977539062, 0.009514093399047852, 0.01013803482055664, 0.01076197624206543, 0.011385917663574219, 0.012009859085083008, 0.012633800506591797, 0.013257741928100586, 0.013881683349609375, 0.014505624771118164, 0.015129566192626953, 0.015753507614135742, 0.01637744903564453, 0.01700139045715332, 0.01762533187866211, 0.0182492733001709, 0.018873214721679688, 0.019497156143188477, 0.020121097564697266, 0.020745038986206055, 0.021368980407714844, 0.021992921829223633, 0.022616863250732422, 0.02324080467224121, 0.02386474609375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 10.0, 34.0, 172.0, 427.0, 293.0, 55.0, 15.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16836299002170563, -0.1582910716533661, -0.14821913838386536, -0.13814722001552582, -0.12807530164718628, -0.11800337582826614, -0.10793145000934601, -0.09785953164100647, -0.08778760582208633, -0.0777156800031662, -0.06764376163482666, -0.057571835815906525, -0.04749991372227669, -0.03742799162864685, -0.027356065809726715, -0.017284147441387177, -0.007212221622467041, 0.0028597014024853706, 0.012931624427437782, 0.02300354838371277, 0.033075470477342606, 0.04314739257097244, 0.05321931838989258, 0.06329123675823212, 0.07336316257715225, 0.08343508839607239, 0.09350700676441193, 0.10357893258333206, 0.1136508584022522, 0.12372277677059174, 0.13379469513893127, 0.143866628408432, 0.15393856167793274, 0.16401048004627228, 0.174082413315773, 0.18415433168411255, 0.1942262500524521, 0.20429816842079163, 0.21437010169029236, 0.2244420200586319, 0.23451393842697144, 0.24458585679531097, 0.2546577751636505, 0.26472970843315125, 0.274801641702652, 0.2848735451698303, 0.29494547843933105, 0.3050174117088318, 0.3150893449783325, 0.32516127824783325, 0.3352331817150116, 0.34530511498451233, 0.35537704825401306, 0.3654489517211914, 0.37552088499069214, 0.38559281826019287, 0.3956647217273712, 0.40573665499687195, 0.4158085584640503, 0.425880491733551, 0.43595242500305176, 0.4460243284702301, 0.45609626173973083, 0.4661681652069092, 0.4762400984764099]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 4.0, 3.0, 7.0, 7.0, 13.0, 18.0, 21.0, 22.0, 31.0, 39.0, 51.0, 63.0, 65.0, 58.0, 73.0, 63.0, 56.0, 56.0, 49.0, 64.0, 50.0, 46.0, 32.0, 34.0, 20.0, 18.0, 14.0, 7.0, 7.0, 6.0, 7.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09539002180099487, -0.0922093614935875, -0.08902870118618011, -0.08584803342819214, -0.08266737312078476, -0.07948671281337738, -0.0763060450553894, -0.07312538474798203, -0.06994472444057465, -0.06676406413316727, -0.06358340382575989, -0.06040273606777191, -0.05722207576036453, -0.05404141545295715, -0.050860751420259476, -0.0476800873875618, -0.04449942708015442, -0.04131876677274704, -0.03813810274004936, -0.034957438707351685, -0.031776778399944305, -0.028596116229891777, -0.02541545405983925, -0.02223479188978672, -0.019054129719734192, -0.015873467549681664, -0.012692805379629135, -0.009512143209576607, -0.006331481039524078, -0.00315081886947155, 2.9843300580978394e-05, 0.0032105054706335068, 0.006391167640686035, 0.009571829810738564, 0.012752491980791092, 0.01593315415084362, 0.01911381632089615, 0.022294478490948677, 0.025475140661001205, 0.028655802831053734, 0.03183646500110626, 0.03501712530851364, 0.03819778934121132, 0.041378453373909, 0.044559113681316376, 0.047739773988723755, 0.05092043802142143, 0.05410110205411911, 0.05728176236152649, 0.06046242266893387, 0.06364308297634125, 0.06682375073432922, 0.0700044110417366, 0.07318507134914398, 0.07636573910713196, 0.07954639941453934, 0.08272705972194672, 0.0859077200293541, 0.08908838033676147, 0.09226904809474945, 0.09544970840215683, 0.09863036870956421, 0.10181103646755219, 0.10499169677495956, 0.10817235708236694]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 10.0, 7.0, 14.0, 10.0, 24.0, 31.0, 44.0, 100.0, 136.0, 260.0, 431.0, 825.0, 1566.0, 3212.0, 7147.0, 16761.0, 49290.0, 237241.0, 586675.0, 96747.0, 27796.0, 10757.0, 4669.0, 2228.0, 1197.0, 585.0, 298.0, 184.0, 101.0, 78.0, 46.0, 22.0, 23.0, 18.0, 10.0, 4.0, 7.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1180419921875, -0.11413955688476562, -0.11023712158203125, -0.10633468627929688, -0.1024322509765625, -0.09852981567382812, -0.09462738037109375, -0.09072494506835938, -0.086822509765625, -0.08292007446289062, -0.07901763916015625, -0.07511520385742188, -0.0712127685546875, -0.06731033325195312, -0.06340789794921875, -0.059505462646484375, -0.05560302734375, -0.051700592041015625, -0.04779815673828125, -0.043895721435546875, -0.0399932861328125, -0.036090850830078125, -0.03218841552734375, -0.028285980224609375, -0.024383544921875, -0.020481109619140625, -0.01657867431640625, -0.012676239013671875, -0.0087738037109375, -0.004871368408203125, -0.00096893310546875, 0.002933502197265625, 0.0068359375, 0.010738372802734375, 0.01464080810546875, 0.018543243408203125, 0.0224456787109375, 0.026348114013671875, 0.03025054931640625, 0.034152984619140625, 0.038055419921875, 0.041957855224609375, 0.04586029052734375, 0.049762725830078125, 0.0536651611328125, 0.057567596435546875, 0.06147003173828125, 0.06537246704101562, 0.06927490234375, 0.07317733764648438, 0.07707977294921875, 0.08098220825195312, 0.0848846435546875, 0.08878707885742188, 0.09268951416015625, 0.09659194946289062, 0.100494384765625, 0.10439682006835938, 0.10829925537109375, 0.11220169067382812, 0.1161041259765625, 0.12000656127929688, 0.12390899658203125, 0.12781143188476562, 0.1317138671875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 3.0, 0.0, 10.0, 9.0, 3.0, 13.0, 14.0, 20.0, 15.0, 27.0, 23.0, 50.0, 71.0, 94.0, 134.0, 139.0, 105.0, 61.0, 55.0, 35.0, 25.0, 17.0, 16.0, 15.0, 9.0, 8.0, 5.0, 1.0, 7.0, 6.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 1.0], "bins": [-0.020599365234375, -0.02008509635925293, -0.01957082748413086, -0.01905655860900879, -0.01854228973388672, -0.01802802085876465, -0.017513751983642578, -0.016999483108520508, -0.016485214233398438, -0.015970945358276367, -0.015456676483154297, -0.014942407608032227, -0.014428138732910156, -0.013913869857788086, -0.013399600982666016, -0.012885332107543945, -0.012371063232421875, -0.011856794357299805, -0.011342525482177734, -0.010828256607055664, -0.010313987731933594, -0.009799718856811523, -0.009285449981689453, -0.008771181106567383, -0.008256912231445312, -0.007742643356323242, -0.007228374481201172, -0.0067141056060791016, -0.006199836730957031, -0.005685567855834961, -0.005171298980712891, -0.00465703010559082, -0.00414276123046875, -0.0036284923553466797, -0.0031142234802246094, -0.002599954605102539, -0.0020856857299804688, -0.0015714168548583984, -0.0010571479797363281, -0.0005428791046142578, -2.86102294921875e-05, 0.0004856586456298828, 0.0009999275207519531, 0.0015141963958740234, 0.0020284652709960938, 0.002542734146118164, 0.0030570030212402344, 0.0035712718963623047, 0.004085540771484375, 0.004599809646606445, 0.005114078521728516, 0.005628347396850586, 0.006142616271972656, 0.0066568851470947266, 0.007171154022216797, 0.007685422897338867, 0.008199691772460938, 0.008713960647583008, 0.009228229522705078, 0.009742498397827148, 0.010256767272949219, 0.010771036148071289, 0.01128530502319336, 0.01179957389831543, 0.0123138427734375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 4.0, 5.0, 9.0, 8.0, 14.0, 16.0, 27.0, 32.0, 40.0, 62.0, 93.0, 131.0, 194.0, 302.0, 507.0, 1090.0, 2809.0, 10933.0, 65724.0, 488951.0, 411494.0, 52188.0, 9158.0, 2410.0, 992.0, 501.0, 289.0, 177.0, 118.0, 82.0, 54.0, 36.0, 31.0, 23.0, 16.0, 6.0, 8.0, 6.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.15234375, -0.1478557586669922, -0.14336776733398438, -0.13887977600097656, -0.13439178466796875, -0.12990379333496094, -0.12541580200195312, -0.12092781066894531, -0.1164398193359375, -0.11195182800292969, -0.10746383666992188, -0.10297584533691406, -0.09848785400390625, -0.09399986267089844, -0.08951187133789062, -0.08502388000488281, -0.080535888671875, -0.07604789733886719, -0.07155990600585938, -0.06707191467285156, -0.06258392333984375, -0.05809593200683594, -0.053607940673828125, -0.04911994934082031, -0.0446319580078125, -0.04014396667480469, -0.035655975341796875, -0.031167984008789062, -0.02667999267578125, -0.022192001342773438, -0.017704010009765625, -0.013216018676757812, -0.00872802734375, -0.0042400360107421875, 0.000247955322265625, 0.0047359466552734375, 0.00922393798828125, 0.013711929321289062, 0.018199920654296875, 0.022687911987304688, 0.0271759033203125, 0.03166389465332031, 0.036151885986328125, 0.04063987731933594, 0.04512786865234375, 0.04961585998535156, 0.054103851318359375, 0.05859184265136719, 0.063079833984375, 0.06756782531738281, 0.07205581665039062, 0.07654380798339844, 0.08103179931640625, 0.08551979064941406, 0.09000778198242188, 0.09449577331542969, 0.0989837646484375, 0.10347175598144531, 0.10795974731445312, 0.11244773864746094, 0.11693572998046875, 0.12142372131347656, 0.12591171264648438, 0.1303997039794922, 0.1348876953125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 3.0, 6.0, 5.0, 11.0, 8.0, 22.0, 19.0, 14.0, 20.0, 23.0, 23.0, 30.0, 24.0, 36.0, 33.0, 32.0, 49.0, 42.0, 52.0, 54.0, 46.0, 46.0, 51.0, 42.0, 37.0, 40.0, 38.0, 28.0, 23.0, 20.0, 30.0, 13.0, 15.0, 16.0, 13.0, 11.0, 8.0, 2.0, 6.0, 3.0, 4.0, 1.0, 4.0, 2.0, 0.0, 2.0, 3.0], "bins": [-0.07135009765625, -0.06942319869995117, -0.06749629974365234, -0.06556940078735352, -0.06364250183105469, -0.06171560287475586, -0.05978870391845703, -0.0578618049621582, -0.055934906005859375, -0.05400800704956055, -0.05208110809326172, -0.05015420913696289, -0.04822731018066406, -0.046300411224365234, -0.044373512268066406, -0.04244661331176758, -0.04051971435546875, -0.03859281539916992, -0.036665916442871094, -0.034739017486572266, -0.03281211853027344, -0.03088521957397461, -0.02895832061767578, -0.027031421661376953, -0.025104522705078125, -0.023177623748779297, -0.02125072479248047, -0.01932382583618164, -0.017396926879882812, -0.015470027923583984, -0.013543128967285156, -0.011616230010986328, -0.0096893310546875, -0.007762432098388672, -0.005835533142089844, -0.003908634185791016, -0.0019817352294921875, -5.4836273193359375e-05, 0.0018720626831054688, 0.003798961639404297, 0.005725860595703125, 0.007652759552001953, 0.009579658508300781, 0.01150655746459961, 0.013433456420898438, 0.015360355377197266, 0.017287254333496094, 0.019214153289794922, 0.02114105224609375, 0.023067951202392578, 0.024994850158691406, 0.026921749114990234, 0.028848648071289062, 0.03077554702758789, 0.03270244598388672, 0.03462934494018555, 0.036556243896484375, 0.0384831428527832, 0.04041004180908203, 0.04233694076538086, 0.04426383972167969, 0.046190738677978516, 0.048117637634277344, 0.05004453659057617, 0.051971435546875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 7.0, 7.0, 11.0, 16.0, 17.0, 47.0, 58.0, 105.0, 189.0, 293.0, 572.0, 1078.0, 2560.0, 6471.0, 19806.0, 83520.0, 416245.0, 405727.0, 81352.0, 19358.0, 6170.0, 2419.0, 1159.0, 622.0, 289.0, 172.0, 103.0, 67.0, 40.0, 34.0, 16.0, 13.0, 7.0, 3.0, 5.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.053375244140625, -0.05165290832519531, -0.049930572509765625, -0.04820823669433594, -0.04648590087890625, -0.04476356506347656, -0.043041229248046875, -0.04131889343261719, -0.0395965576171875, -0.03787422180175781, -0.036151885986328125, -0.03442955017089844, -0.03270721435546875, -0.030984878540039062, -0.029262542724609375, -0.027540206909179688, -0.02581787109375, -0.024095535278320312, -0.022373199462890625, -0.020650863647460938, -0.01892852783203125, -0.017206192016601562, -0.015483856201171875, -0.013761520385742188, -0.0120391845703125, -0.010316848754882812, -0.008594512939453125, -0.0068721771240234375, -0.00514984130859375, -0.0034275054931640625, -0.001705169677734375, 1.71661376953125e-05, 0.001739501953125, 0.0034618377685546875, 0.005184173583984375, 0.0069065093994140625, 0.00862884521484375, 0.010351181030273438, 0.012073516845703125, 0.013795852661132812, 0.0155181884765625, 0.017240524291992188, 0.018962860107421875, 0.020685195922851562, 0.02240753173828125, 0.024129867553710938, 0.025852203369140625, 0.027574539184570312, 0.029296875, 0.031019210815429688, 0.032741546630859375, 0.03446388244628906, 0.03618621826171875, 0.03790855407714844, 0.039630889892578125, 0.04135322570800781, 0.0430755615234375, 0.04479789733886719, 0.046520233154296875, 0.04824256896972656, 0.04996490478515625, 0.05168724060058594, 0.053409576416015625, 0.05513191223144531, 0.056854248046875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 1.0, 8.0, 11.0, 6.0, 8.0, 14.0, 14.0, 21.0, 33.0, 31.0, 31.0, 58.0, 51.0, 67.0, 83.0, 92.0, 70.0, 63.0, 61.0, 59.0, 43.0, 31.0, 22.0, 21.0, 29.0, 10.0, 16.0, 13.0, 10.0, 5.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.695487976074219e-05, -3.566499799489975e-05, -3.437511622905731e-05, -3.3085234463214874e-05, -3.1795352697372437e-05, -3.050547093153e-05, -2.921558916568756e-05, -2.7925707399845123e-05, -2.6635825634002686e-05, -2.5345943868160248e-05, -2.405606210231781e-05, -2.2766180336475372e-05, -2.1476298570632935e-05, -2.0186416804790497e-05, -1.889653503894806e-05, -1.760665327310562e-05, -1.6316771507263184e-05, -1.5026889741420746e-05, -1.3737007975578308e-05, -1.244712620973587e-05, -1.1157244443893433e-05, -9.867362678050995e-06, -8.577480912208557e-06, -7.287599146366119e-06, -5.997717380523682e-06, -4.707835614681244e-06, -3.417953848838806e-06, -2.1280720829963684e-06, -8.381903171539307e-07, 4.516914486885071e-07, 1.7415732145309448e-06, 3.0314549803733826e-06, 4.32133674621582e-06, 5.611218512058258e-06, 6.901100277900696e-06, 8.190982043743134e-06, 9.480863809585571e-06, 1.0770745575428009e-05, 1.2060627341270447e-05, 1.3350509107112885e-05, 1.4640390872955322e-05, 1.593027263879776e-05, 1.7220154404640198e-05, 1.8510036170482635e-05, 1.9799917936325073e-05, 2.108979970216751e-05, 2.237968146800995e-05, 2.3669563233852386e-05, 2.4959444999694824e-05, 2.6249326765537262e-05, 2.75392085313797e-05, 2.8829090297222137e-05, 3.0118972063064575e-05, 3.140885382890701e-05, 3.269873559474945e-05, 3.398861736059189e-05, 3.5278499126434326e-05, 3.6568380892276764e-05, 3.78582626581192e-05, 3.914814442396164e-05, 4.043802618980408e-05, 4.1727907955646515e-05, 4.301778972148895e-05, 4.430767148733139e-05, 4.559755325317383e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 6.0, 10.0, 9.0, 5.0, 11.0, 7.0, 16.0, 15.0, 27.0, 40.0, 42.0, 63.0, 104.0, 171.0, 309.0, 561.0, 1307.0, 3230.0, 10499.0, 53923.0, 452268.0, 454746.0, 54635.0, 10617.0, 3308.0, 1267.0, 543.0, 276.0, 169.0, 103.0, 60.0, 66.0, 28.0, 29.0, 28.0, 14.0, 12.0, 9.0, 3.0, 7.0, 4.0, 0.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.07867431640625, -0.07648897171020508, -0.07430362701416016, -0.07211828231811523, -0.06993293762207031, -0.06774759292602539, -0.06556224822998047, -0.06337690353393555, -0.061191558837890625, -0.0590062141418457, -0.05682086944580078, -0.05463552474975586, -0.05245018005371094, -0.050264835357666016, -0.048079490661621094, -0.04589414596557617, -0.04370880126953125, -0.04152345657348633, -0.039338111877441406, -0.037152767181396484, -0.03496742248535156, -0.03278207778930664, -0.03059673309326172, -0.028411388397216797, -0.026226043701171875, -0.024040699005126953, -0.02185535430908203, -0.01967000961303711, -0.017484664916992188, -0.015299320220947266, -0.013113975524902344, -0.010928630828857422, -0.0087432861328125, -0.006557941436767578, -0.004372596740722656, -0.0021872520446777344, -1.9073486328125e-06, 0.0021834373474121094, 0.004368782043457031, 0.006554126739501953, 0.008739471435546875, 0.010924816131591797, 0.013110160827636719, 0.01529550552368164, 0.017480850219726562, 0.019666194915771484, 0.021851539611816406, 0.024036884307861328, 0.02622222900390625, 0.028407573699951172, 0.030592918395996094, 0.032778263092041016, 0.03496360778808594, 0.03714895248413086, 0.03933429718017578, 0.0415196418762207, 0.043704986572265625, 0.04589033126831055, 0.04807567596435547, 0.05026102066040039, 0.05244636535644531, 0.054631710052490234, 0.056817054748535156, 0.05900239944458008, 0.061187744140625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 4.0, 4.0, 3.0, 9.0, 11.0, 10.0, 17.0, 23.0, 16.0, 29.0, 31.0, 44.0, 55.0, 60.0, 52.0, 79.0, 77.0, 69.0, 67.0, 62.0, 42.0, 44.0, 40.0, 31.0, 22.0, 20.0, 18.0, 12.0, 8.0, 12.0, 7.0, 6.0, 5.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03155517578125, -0.030637025833129883, -0.029718875885009766, -0.02880072593688965, -0.02788257598876953, -0.026964426040649414, -0.026046276092529297, -0.02512812614440918, -0.024209976196289062, -0.023291826248168945, -0.022373676300048828, -0.02145552635192871, -0.020537376403808594, -0.019619226455688477, -0.01870107650756836, -0.017782926559448242, -0.016864776611328125, -0.015946626663208008, -0.01502847671508789, -0.014110326766967773, -0.013192176818847656, -0.012274026870727539, -0.011355876922607422, -0.010437726974487305, -0.009519577026367188, -0.00860142707824707, -0.007683277130126953, -0.006765127182006836, -0.005846977233886719, -0.0049288272857666016, -0.004010677337646484, -0.003092527389526367, -0.00217437744140625, -0.0012562274932861328, -0.0003380775451660156, 0.0005800724029541016, 0.0014982223510742188, 0.002416372299194336, 0.003334522247314453, 0.00425267219543457, 0.0051708221435546875, 0.006088972091674805, 0.007007122039794922, 0.007925271987915039, 0.008843421936035156, 0.009761571884155273, 0.01067972183227539, 0.011597871780395508, 0.012516021728515625, 0.013434171676635742, 0.01435232162475586, 0.015270471572875977, 0.016188621520996094, 0.01710677146911621, 0.018024921417236328, 0.018943071365356445, 0.019861221313476562, 0.02077937126159668, 0.021697521209716797, 0.022615671157836914, 0.02353382110595703, 0.02445197105407715, 0.025370121002197266, 0.026288270950317383, 0.0272064208984375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 5.0, 4.0, 13.0, 30.0, 63.0, 119.0, 228.0, 246.0, 147.0, 82.0, 33.0, 17.0, 12.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0117350816726685, -0.9838110208511353, -0.955886960029602, -0.9279628396034241, -0.9000387787818909, -0.8721147179603577, -0.8441905975341797, -0.8162665367126465, -0.7883424758911133, -0.7604184150695801, -0.7324943542480469, -0.7045702338218689, -0.6766461730003357, -0.6487221121788025, -0.6207979917526245, -0.5928739309310913, -0.5649498701095581, -0.5370258092880249, -0.5091017484664917, -0.4811776280403137, -0.4532535672187805, -0.4253295063972473, -0.3974054157733917, -0.36948132514953613, -0.34155726432800293, -0.3136332035064697, -0.28570911288261414, -0.25778502225875854, -0.22986096143722534, -0.20193688571453094, -0.17401280999183655, -0.14608873426914215, -0.11816471815109253, -0.09024064242839813, -0.062316566705703735, -0.03439249098300934, -0.006468415260314941, 0.021455660462379456, 0.04937973618507385, 0.07730381190776825, 0.10522788763046265, 0.13315196335315704, 0.16107603907585144, 0.18900011479854584, 0.21692419052124023, 0.24484826624393463, 0.27277234196662903, 0.3006964325904846, 0.3286204934120178, 0.356544554233551, 0.3844686448574066, 0.4123927354812622, 0.4403167963027954, 0.4682408571243286, 0.4961649477481842, 0.5240890383720398, 0.552013099193573, 0.5799371600151062, 0.6078612804412842, 0.6357853412628174, 0.6637094020843506, 0.6916334629058838, 0.719557523727417, 0.747481644153595, 0.7754057049751282]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 7.0, 5.0, 8.0, 7.0, 16.0, 11.0, 25.0, 28.0, 32.0, 33.0, 36.0, 53.0, 48.0, 46.0, 57.0, 59.0, 67.0, 60.0, 60.0, 48.0, 53.0, 39.0, 41.0, 36.0, 24.0, 23.0, 24.0, 16.0, 11.0, 13.0, 9.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5634295344352722, -0.5459505319595337, -0.5284714698791504, -0.5109924674034119, -0.49351343512535095, -0.47603440284729004, -0.4585554003715515, -0.4410763680934906, -0.4235973358154297, -0.4061183035373688, -0.38863930106163025, -0.37116026878356934, -0.3536812365055084, -0.3362022042274475, -0.318723201751709, -0.30124416947364807, -0.28376516699790955, -0.26628613471984863, -0.2488071173429489, -0.2313280999660492, -0.21384906768798828, -0.19637005031108856, -0.17889103293418884, -0.16141200065612793, -0.1439329832792282, -0.1264539659023285, -0.10897493362426758, -0.09149591624736786, -0.07401689141988754, -0.05653786659240723, -0.03905884921550751, -0.02157982438802719, -0.004100799560546875, 0.013378223404288292, 0.03085724636912346, 0.04833626747131348, 0.06581529229879379, 0.08329431712627411, 0.10077333450317383, 0.11825235933065414, 0.13573138415813446, 0.15321040153503418, 0.1706894338130951, 0.1881684511899948, 0.20564746856689453, 0.22312650084495544, 0.24060551822185516, 0.2580845355987549, 0.2755635678768158, 0.2930426001548767, 0.31052160263061523, 0.32800063490867615, 0.34547966718673706, 0.3629586696624756, 0.3804377019405365, 0.3979167342185974, 0.41539573669433594, 0.43287476897239685, 0.4503537714481354, 0.4678328037261963, 0.4853118360042572, 0.5027908682823181, 0.5202698707580566, 0.5377488732337952, 0.5552279353141785]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 8.0, 10.0, 10.0, 16.0, 30.0, 28.0, 46.0, 87.0, 173.0, 345.0, 730.0, 2176.0, 9538.0, 133125.0, 4005801.0, 34736.0, 4867.0, 1424.0, 525.0, 241.0, 145.0, 75.0, 45.0, 27.0, 25.0, 7.0, 5.0, 11.0, 6.0, 1.0, 1.0, 4.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.417236328125, -0.406341552734375, -0.39544677734375, -0.384552001953125, -0.3736572265625, -0.362762451171875, -0.35186767578125, -0.340972900390625, -0.330078125, -0.319183349609375, -0.30828857421875, -0.297393798828125, -0.2864990234375, -0.275604248046875, -0.26470947265625, -0.253814697265625, -0.242919921875, -0.232025146484375, -0.22113037109375, -0.210235595703125, -0.1993408203125, -0.188446044921875, -0.17755126953125, -0.166656494140625, -0.15576171875, -0.144866943359375, -0.13397216796875, -0.123077392578125, -0.1121826171875, -0.101287841796875, -0.09039306640625, -0.079498291015625, -0.068603515625, -0.057708740234375, -0.04681396484375, -0.035919189453125, -0.0250244140625, -0.014129638671875, -0.00323486328125, 0.007659912109375, 0.0185546875, 0.029449462890625, 0.04034423828125, 0.051239013671875, 0.0621337890625, 0.073028564453125, 0.08392333984375, 0.094818115234375, 0.105712890625, 0.116607666015625, 0.12750244140625, 0.138397216796875, 0.1492919921875, 0.160186767578125, 0.17108154296875, 0.181976318359375, 0.19287109375, 0.203765869140625, 0.21466064453125, 0.225555419921875, 0.2364501953125, 0.247344970703125, 0.25823974609375, 0.269134521484375, 0.280029296875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 4.0, 5.0, 11.0, 7.0, 9.0, 21.0, 16.0, 21.0, 36.0, 32.0, 51.0, 60.0, 96.0, 77.0, 113.0, 91.0, 76.0, 75.0, 49.0, 25.0, 21.0, 22.0, 18.0, 18.0, 9.0, 3.0, 7.0, 5.0, 7.0, 3.0, 1.0, 0.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.0220184326171875, -0.021444082260131836, -0.020869731903076172, -0.020295381546020508, -0.019721031188964844, -0.01914668083190918, -0.018572330474853516, -0.01799798011779785, -0.017423629760742188, -0.016849279403686523, -0.01627492904663086, -0.015700578689575195, -0.015126228332519531, -0.014551877975463867, -0.013977527618408203, -0.013403177261352539, -0.012828826904296875, -0.012254476547241211, -0.011680126190185547, -0.011105775833129883, -0.010531425476074219, -0.009957075119018555, -0.00938272476196289, -0.008808374404907227, -0.008234024047851562, -0.0076596736907958984, -0.007085323333740234, -0.00651097297668457, -0.005936622619628906, -0.005362272262573242, -0.004787921905517578, -0.004213571548461914, -0.00363922119140625, -0.003064870834350586, -0.002490520477294922, -0.0019161701202392578, -0.0013418197631835938, -0.0007674694061279297, -0.00019311904907226562, 0.00038123130798339844, 0.0009555816650390625, 0.0015299320220947266, 0.0021042823791503906, 0.0026786327362060547, 0.0032529830932617188, 0.003827333450317383, 0.004401683807373047, 0.004976034164428711, 0.005550384521484375, 0.006124734878540039, 0.006699085235595703, 0.007273435592651367, 0.007847785949707031, 0.008422136306762695, 0.00899648666381836, 0.009570837020874023, 0.010145187377929688, 0.010719537734985352, 0.011293888092041016, 0.01186823844909668, 0.012442588806152344, 0.013016939163208008, 0.013591289520263672, 0.014165639877319336, 0.014739990234375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 6.0, 9.0, 15.0, 25.0, 34.0, 45.0, 122.0, 268.0, 700.0, 2117.0, 8458.0, 50179.0, 3128000.0, 955022.0, 39467.0, 7076.0, 1798.0, 491.0, 221.0, 96.0, 65.0, 32.0, 15.0, 7.0, 6.0, 8.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.280029296875, -0.27301788330078125, -0.2660064697265625, -0.25899505615234375, -0.251983642578125, -0.24497222900390625, -0.2379608154296875, -0.23094940185546875, -0.22393798828125, -0.21692657470703125, -0.2099151611328125, -0.20290374755859375, -0.195892333984375, -0.18888092041015625, -0.1818695068359375, -0.17485809326171875, -0.1678466796875, -0.16083526611328125, -0.1538238525390625, -0.14681243896484375, -0.139801025390625, -0.13278961181640625, -0.1257781982421875, -0.11876678466796875, -0.11175537109375, -0.10474395751953125, -0.0977325439453125, -0.09072113037109375, -0.083709716796875, -0.07669830322265625, -0.0696868896484375, -0.06267547607421875, -0.0556640625, -0.04865264892578125, -0.0416412353515625, -0.03462982177734375, -0.027618408203125, -0.02060699462890625, -0.0135955810546875, -0.00658416748046875, 0.00042724609375, 0.00743865966796875, 0.0144500732421875, 0.02146148681640625, 0.028472900390625, 0.03548431396484375, 0.0424957275390625, 0.04950714111328125, 0.0565185546875, 0.06352996826171875, 0.0705413818359375, 0.07755279541015625, 0.084564208984375, 0.09157562255859375, 0.0985870361328125, 0.10559844970703125, 0.11260986328125, 0.11962127685546875, 0.1266326904296875, 0.13364410400390625, 0.140655517578125, 0.14766693115234375, 0.1546783447265625, 0.16168975830078125, 0.168701171875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 3.0, 2.0, 3.0, 8.0, 11.0, 14.0, 9.0, 17.0, 20.0, 26.0, 41.0, 59.0, 81.0, 122.0, 261.0, 479.0, 1800.0, 469.0, 207.0, 126.0, 82.0, 67.0, 40.0, 22.0, 19.0, 22.0, 8.0, 16.0, 9.0, 5.0, 9.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.025177001953125, -0.02429342269897461, -0.02340984344482422, -0.022526264190673828, -0.021642684936523438, -0.020759105682373047, -0.019875526428222656, -0.018991947174072266, -0.018108367919921875, -0.017224788665771484, -0.016341209411621094, -0.015457630157470703, -0.014574050903320312, -0.013690471649169922, -0.012806892395019531, -0.01192331314086914, -0.01103973388671875, -0.01015615463256836, -0.009272575378417969, -0.008388996124267578, -0.0075054168701171875, -0.006621837615966797, -0.005738258361816406, -0.004854679107666016, -0.003971099853515625, -0.0030875205993652344, -0.0022039413452148438, -0.0013203620910644531, -0.0004367828369140625, 0.0004467964172363281, 0.0013303756713867188, 0.0022139549255371094, 0.0030975341796875, 0.003981113433837891, 0.004864692687988281, 0.005748271942138672, 0.0066318511962890625, 0.007515430450439453, 0.008399009704589844, 0.009282588958740234, 0.010166168212890625, 0.011049747467041016, 0.011933326721191406, 0.012816905975341797, 0.013700485229492188, 0.014584064483642578, 0.015467643737792969, 0.01635122299194336, 0.01723480224609375, 0.01811838150024414, 0.01900196075439453, 0.019885540008544922, 0.020769119262695312, 0.021652698516845703, 0.022536277770996094, 0.023419857025146484, 0.024303436279296875, 0.025187015533447266, 0.026070594787597656, 0.026954174041748047, 0.027837753295898438, 0.028721332550048828, 0.02960491180419922, 0.03048849105834961, 0.0313720703125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 8.0, 20.0, 44.0, 81.0, 179.0, 270.0, 203.0, 108.0, 49.0, 22.0, 13.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3423707187175751, -0.3335146903991699, -0.3246586322784424, -0.31580260396003723, -0.3069465756416321, -0.29809054732322693, -0.2892345190048218, -0.28037846088409424, -0.2715224325656891, -0.26266640424728394, -0.2538103461265564, -0.24495431780815125, -0.2360982894897461, -0.22724226117134094, -0.2183862179517746, -0.20953017473220825, -0.2006741464138031, -0.19181811809539795, -0.1829620748758316, -0.17410603165626526, -0.1652500033378601, -0.15639397501945496, -0.1475379317998886, -0.13868188858032227, -0.12982586026191711, -0.12096982449293137, -0.11211378872394562, -0.10325775295495987, -0.09440171718597412, -0.08554568141698837, -0.07668964564800262, -0.06783360987901688, -0.05897757411003113, -0.05012153834104538, -0.04126550257205963, -0.03240946680307388, -0.023553431034088135, -0.014697395265102386, -0.005841359496116638, 0.00301467627286911, 0.011870712041854858, 0.020726747810840607, 0.029582783579826355, 0.0384388193488121, 0.04729485511779785, 0.0561508908867836, 0.06500692665576935, 0.0738629624247551, 0.08271899819374084, 0.09157503396272659, 0.10043106973171234, 0.10928710550069809, 0.11814314126968384, 0.126999169588089, 0.13585521280765533, 0.14471125602722168, 0.15356728434562683, 0.16242331266403198, 0.17127935588359833, 0.18013539910316467, 0.18899142742156982, 0.19784745573997498, 0.20670349895954132, 0.21555954217910767, 0.22441557049751282]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 4.0, 2.0, 9.0, 5.0, 11.0, 11.0, 15.0, 16.0, 22.0, 25.0, 26.0, 34.0, 37.0, 51.0, 33.0, 56.0, 53.0, 44.0, 53.0, 57.0, 44.0, 47.0, 43.0, 45.0, 36.0, 36.0, 30.0, 37.0, 21.0, 26.0, 17.0, 14.0, 14.0, 11.0, 7.0, 7.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11070460081100464, -0.10726530849933624, -0.10382600873708725, -0.10038671642541885, -0.09694741666316986, -0.09350812435150146, -0.09006883203983307, -0.08662953972816467, -0.08319023996591568, -0.07975094765424728, -0.07631164789199829, -0.0728723555803299, -0.0694330632686615, -0.0659937635064125, -0.06255447119474411, -0.059115175157785416, -0.05567587912082672, -0.05223658308386803, -0.04879728704690933, -0.045357994735240936, -0.04191869869828224, -0.03847940266132355, -0.03504011034965515, -0.03160081431269646, -0.028161518275737762, -0.024722222238779068, -0.021282928064465523, -0.017843633890151978, -0.014404337853193283, -0.010965041816234589, -0.007525747641921043, -0.004086453467607498, -0.0006471574306488037, 0.002792137674987316, 0.006231432780623436, 0.009670727886259556, 0.013110022991895676, 0.01654931902885437, 0.019988613203167915, 0.02342790737748146, 0.026867203414440155, 0.03030649945139885, 0.033745795488357544, 0.03718508780002594, 0.040624383836984634, 0.04406367987394333, 0.047502972185611725, 0.05094226822257042, 0.054381564259529114, 0.05782086029648781, 0.0612601563334465, 0.0646994486451149, 0.06813874840736389, 0.07157804071903229, 0.07501733303070068, 0.07845662534236908, 0.08189592510461807, 0.08533521741628647, 0.08877451717853546, 0.09221380949020386, 0.09565310180187225, 0.09909240156412125, 0.10253169387578964, 0.10597099363803864, 0.10941028594970703]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 7.0, 10.0, 24.0, 22.0, 21.0, 69.0, 95.0, 136.0, 228.0, 341.0, 645.0, 1177.0, 2397.0, 5065.0, 11219.0, 29827.0, 94999.0, 371507.0, 380403.0, 98179.0, 30169.0, 11645.0, 5056.0, 2413.0, 1277.0, 647.0, 366.0, 197.0, 144.0, 88.0, 59.0, 27.0, 27.0, 20.0, 17.0, 12.0, 6.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1146240234375, -0.11135005950927734, -0.10807609558105469, -0.10480213165283203, -0.10152816772460938, -0.09825420379638672, -0.09498023986816406, -0.0917062759399414, -0.08843231201171875, -0.0851583480834961, -0.08188438415527344, -0.07861042022705078, -0.07533645629882812, -0.07206249237060547, -0.06878852844238281, -0.06551456451416016, -0.0622406005859375, -0.058966636657714844, -0.05569267272949219, -0.05241870880126953, -0.049144744873046875, -0.04587078094482422, -0.04259681701660156, -0.039322853088378906, -0.03604888916015625, -0.032774925231933594, -0.029500961303710938, -0.02622699737548828, -0.022953033447265625, -0.01967906951904297, -0.016405105590820312, -0.013131141662597656, -0.009857177734375, -0.006583213806152344, -0.0033092498779296875, -3.528594970703125e-05, 0.003238677978515625, 0.006512641906738281, 0.009786605834960938, 0.013060569763183594, 0.01633453369140625, 0.019608497619628906, 0.022882461547851562, 0.02615642547607422, 0.029430389404296875, 0.03270435333251953, 0.03597831726074219, 0.039252281188964844, 0.0425262451171875, 0.045800209045410156, 0.04907417297363281, 0.05234813690185547, 0.055622100830078125, 0.05889606475830078, 0.06217002868652344, 0.0654439926147461, 0.06871795654296875, 0.0719919204711914, 0.07526588439941406, 0.07853984832763672, 0.08181381225585938, 0.08508777618408203, 0.08836174011230469, 0.09163570404052734, 0.09490966796875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 5.0, 10.0, 6.0, 15.0, 23.0, 15.0, 35.0, 44.0, 48.0, 64.0, 81.0, 84.0, 103.0, 72.0, 77.0, 70.0, 55.0, 34.0, 35.0, 22.0, 18.0, 14.0, 9.0, 11.0, 11.0, 6.0, 3.0, 3.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.021331787109375, -0.020779967308044434, -0.020228147506713867, -0.0196763277053833, -0.019124507904052734, -0.018572688102722168, -0.0180208683013916, -0.017469048500061035, -0.01691722869873047, -0.016365408897399902, -0.015813589096069336, -0.01526176929473877, -0.014709949493408203, -0.014158129692077637, -0.01360630989074707, -0.013054490089416504, -0.012502670288085938, -0.011950850486755371, -0.011399030685424805, -0.010847210884094238, -0.010295391082763672, -0.009743571281433105, -0.009191751480102539, -0.008639931678771973, -0.008088111877441406, -0.00753629207611084, -0.0069844722747802734, -0.006432652473449707, -0.005880832672119141, -0.005329012870788574, -0.004777193069458008, -0.004225373268127441, -0.003673553466796875, -0.0031217336654663086, -0.002569913864135742, -0.0020180940628051758, -0.0014662742614746094, -0.000914454460144043, -0.00036263465881347656, 0.00018918514251708984, 0.0007410049438476562, 0.0012928247451782227, 0.001844644546508789, 0.0023964643478393555, 0.002948284149169922, 0.0035001039505004883, 0.004051923751831055, 0.004603743553161621, 0.0051555633544921875, 0.005707383155822754, 0.00625920295715332, 0.006811022758483887, 0.007362842559814453, 0.00791466236114502, 0.008466482162475586, 0.009018301963806152, 0.009570121765136719, 0.010121941566467285, 0.010673761367797852, 0.011225581169128418, 0.011777400970458984, 0.01232922077178955, 0.012881040573120117, 0.013432860374450684, 0.01398468017578125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 8.0, 10.0, 12.0, 15.0, 28.0, 32.0, 56.0, 65.0, 86.0, 138.0, 197.0, 293.0, 441.0, 858.0, 1857.0, 5087.0, 16709.0, 67086.0, 313689.0, 486508.0, 115530.0, 26844.0, 7593.0, 2650.0, 1098.0, 578.0, 344.0, 220.0, 160.0, 95.0, 65.0, 58.0, 31.0, 25.0, 23.0, 19.0, 7.0, 9.0, 11.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1171875, -0.11342906951904297, -0.10967063903808594, -0.1059122085571289, -0.10215377807617188, -0.09839534759521484, -0.09463691711425781, -0.09087848663330078, -0.08712005615234375, -0.08336162567138672, -0.07960319519042969, -0.07584476470947266, -0.07208633422851562, -0.0683279037475586, -0.06456947326660156, -0.06081104278564453, -0.0570526123046875, -0.05329418182373047, -0.04953575134277344, -0.045777320861816406, -0.042018890380859375, -0.038260459899902344, -0.03450202941894531, -0.03074359893798828, -0.02698516845703125, -0.02322673797607422, -0.019468307495117188, -0.015709877014160156, -0.011951446533203125, -0.008193016052246094, -0.0044345855712890625, -0.0006761550903320312, 0.003082275390625, 0.006840705871582031, 0.010599136352539062, 0.014357566833496094, 0.018115997314453125, 0.021874427795410156, 0.025632858276367188, 0.02939128875732422, 0.03314971923828125, 0.03690814971923828, 0.04066658020019531, 0.044425010681152344, 0.048183441162109375, 0.051941871643066406, 0.05570030212402344, 0.05945873260498047, 0.0632171630859375, 0.06697559356689453, 0.07073402404785156, 0.0744924545288086, 0.07825088500976562, 0.08200931549072266, 0.08576774597167969, 0.08952617645263672, 0.09328460693359375, 0.09704303741455078, 0.10080146789550781, 0.10455989837646484, 0.10831832885742188, 0.1120767593383789, 0.11583518981933594, 0.11959362030029297, 0.12335205078125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 1.0, 3.0, 6.0, 4.0, 9.0, 3.0, 12.0, 11.0, 10.0, 20.0, 19.0, 15.0, 32.0, 33.0, 29.0, 28.0, 31.0, 35.0, 45.0, 46.0, 40.0, 48.0, 41.0, 48.0, 45.0, 38.0, 40.0, 35.0, 38.0, 44.0, 34.0, 23.0, 27.0, 12.0, 17.0, 14.0, 8.0, 13.0, 6.0, 9.0, 5.0, 10.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.072021484375, -0.06980514526367188, -0.06758880615234375, -0.06537246704101562, -0.0631561279296875, -0.060939788818359375, -0.05872344970703125, -0.056507110595703125, -0.054290771484375, -0.052074432373046875, -0.04985809326171875, -0.047641754150390625, -0.0454254150390625, -0.043209075927734375, -0.04099273681640625, -0.038776397705078125, -0.03656005859375, -0.034343719482421875, -0.03212738037109375, -0.029911041259765625, -0.0276947021484375, -0.025478363037109375, -0.02326202392578125, -0.021045684814453125, -0.018829345703125, -0.016613006591796875, -0.01439666748046875, -0.012180328369140625, -0.0099639892578125, -0.007747650146484375, -0.00553131103515625, -0.003314971923828125, -0.0010986328125, 0.001117706298828125, 0.00333404541015625, 0.005550384521484375, 0.0077667236328125, 0.009983062744140625, 0.01219940185546875, 0.014415740966796875, 0.016632080078125, 0.018848419189453125, 0.02106475830078125, 0.023281097412109375, 0.0254974365234375, 0.027713775634765625, 0.02993011474609375, 0.032146453857421875, 0.03436279296875, 0.036579132080078125, 0.03879547119140625, 0.041011810302734375, 0.0432281494140625, 0.045444488525390625, 0.04766082763671875, 0.049877166748046875, 0.052093505859375, 0.054309844970703125, 0.05652618408203125, 0.058742523193359375, 0.0609588623046875, 0.06317520141601562, 0.06539154052734375, 0.06760787963867188, 0.06982421875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 9.0, 11.0, 13.0, 18.0, 27.0, 52.0, 106.0, 102.0, 143.0, 239.0, 345.0, 517.0, 755.0, 1333.0, 2212.0, 4008.0, 8235.0, 21451.0, 71233.0, 295663.0, 459488.0, 124802.0, 33349.0, 12019.0, 5275.0, 2812.0, 1589.0, 906.0, 606.0, 392.0, 256.0, 181.0, 120.0, 91.0, 61.0, 53.0, 22.0, 18.0, 12.0, 8.0, 10.0, 2.0, 8.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.054534912109375, -0.05294036865234375, -0.0513458251953125, -0.04975128173828125, -0.04815673828125, -0.04656219482421875, -0.0449676513671875, -0.04337310791015625, -0.041778564453125, -0.04018402099609375, -0.0385894775390625, -0.03699493408203125, -0.035400390625, -0.03380584716796875, -0.0322113037109375, -0.03061676025390625, -0.029022216796875, -0.02742767333984375, -0.0258331298828125, -0.02423858642578125, -0.02264404296875, -0.02104949951171875, -0.0194549560546875, -0.01786041259765625, -0.016265869140625, -0.01467132568359375, -0.0130767822265625, -0.01148223876953125, -0.0098876953125, -0.00829315185546875, -0.0066986083984375, -0.00510406494140625, -0.003509521484375, -0.00191497802734375, -0.0003204345703125, 0.00127410888671875, 0.00286865234375, 0.00446319580078125, 0.0060577392578125, 0.00765228271484375, 0.009246826171875, 0.01084136962890625, 0.0124359130859375, 0.01403045654296875, 0.015625, 0.01721954345703125, 0.0188140869140625, 0.02040863037109375, 0.022003173828125, 0.02359771728515625, 0.0251922607421875, 0.02678680419921875, 0.02838134765625, 0.02997589111328125, 0.0315704345703125, 0.03316497802734375, 0.034759521484375, 0.03635406494140625, 0.0379486083984375, 0.03954315185546875, 0.0411376953125, 0.04273223876953125, 0.0443267822265625, 0.04592132568359375, 0.047515869140625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 6.0, 15.0, 21.0, 20.0, 32.0, 79.0, 90.0, 142.0, 187.0, 149.0, 103.0, 57.0, 39.0, 26.0, 19.0, 11.0, 3.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.594989776611328e-05, -8.409842848777771e-05, -8.224695920944214e-05, -8.039548993110657e-05, -7.8544020652771e-05, -7.669255137443542e-05, -7.484108209609985e-05, -7.298961281776428e-05, -7.113814353942871e-05, -6.928667426109314e-05, -6.743520498275757e-05, -6.5583735704422e-05, -6.373226642608643e-05, -6.188079714775085e-05, -6.002932786941528e-05, -5.817785859107971e-05, -5.632638931274414e-05, -5.447492003440857e-05, -5.2623450756073e-05, -5.077198147773743e-05, -4.8920512199401855e-05, -4.7069042921066284e-05, -4.521757364273071e-05, -4.336610436439514e-05, -4.151463508605957e-05, -3.9663165807724e-05, -3.781169652938843e-05, -3.5960227251052856e-05, -3.4108757972717285e-05, -3.2257288694381714e-05, -3.0405819416046143e-05, -2.855435013771057e-05, -2.6702880859375e-05, -2.485141158103943e-05, -2.2999942302703857e-05, -2.1148473024368286e-05, -1.9297003746032715e-05, -1.7445534467697144e-05, -1.5594065189361572e-05, -1.3742595911026001e-05, -1.189112663269043e-05, -1.0039657354354858e-05, -8.188188076019287e-06, -6.336718797683716e-06, -4.4852495193481445e-06, -2.6337802410125732e-06, -7.82310962677002e-07, 1.0691583156585693e-06, 2.9206275939941406e-06, 4.772096872329712e-06, 6.623566150665283e-06, 8.475035429000854e-06, 1.0326504707336426e-05, 1.2177973985671997e-05, 1.4029443264007568e-05, 1.588091254234314e-05, 1.773238182067871e-05, 1.9583851099014282e-05, 2.1435320377349854e-05, 2.3286789655685425e-05, 2.5138258934020996e-05, 2.6989728212356567e-05, 2.884119749069214e-05, 3.069266676902771e-05, 3.254413604736328e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 8.0, 6.0, 12.0, 17.0, 20.0, 42.0, 72.0, 124.0, 249.0, 667.0, 2197.0, 10833.0, 222616.0, 782098.0, 24187.0, 3671.0, 964.0, 367.0, 165.0, 71.0, 56.0, 28.0, 17.0, 15.0, 11.0, 11.0, 8.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10650634765625, -0.10147762298583984, -0.09644889831542969, -0.09142017364501953, -0.08639144897460938, -0.08136272430419922, -0.07633399963378906, -0.0713052749633789, -0.06627655029296875, -0.061247825622558594, -0.05621910095214844, -0.05119037628173828, -0.046161651611328125, -0.04113292694091797, -0.03610420227050781, -0.031075477600097656, -0.0260467529296875, -0.021018028259277344, -0.015989303588867188, -0.010960578918457031, -0.005931854248046875, -0.0009031295776367188, 0.0041255950927734375, 0.009154319763183594, 0.01418304443359375, 0.019211769104003906, 0.024240493774414062, 0.02926921844482422, 0.034297943115234375, 0.03932666778564453, 0.04435539245605469, 0.049384117126464844, 0.054412841796875, 0.059441566467285156, 0.06447029113769531, 0.06949901580810547, 0.07452774047851562, 0.07955646514892578, 0.08458518981933594, 0.0896139144897461, 0.09464263916015625, 0.0996713638305664, 0.10470008850097656, 0.10972881317138672, 0.11475753784179688, 0.11978626251220703, 0.12481498718261719, 0.12984371185302734, 0.1348724365234375, 0.13990116119384766, 0.1449298858642578, 0.14995861053466797, 0.15498733520507812, 0.16001605987548828, 0.16504478454589844, 0.1700735092163086, 0.17510223388671875, 0.1801309585571289, 0.18515968322753906, 0.19018840789794922, 0.19521713256835938, 0.20024585723876953, 0.2052745819091797, 0.21030330657958984, 0.21533203125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 9.0, 7.0, 20.0, 22.0, 45.0, 80.0, 124.0, 163.0, 143.0, 151.0, 68.0, 54.0, 36.0, 25.0, 13.0, 7.0, 5.0, 5.0, 2.0, 1.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.050506591796875, -0.048220157623291016, -0.04593372344970703, -0.04364728927612305, -0.04136085510253906, -0.03907442092895508, -0.036787986755371094, -0.03450155258178711, -0.032215118408203125, -0.02992868423461914, -0.027642250061035156, -0.025355815887451172, -0.023069381713867188, -0.020782947540283203, -0.01849651336669922, -0.016210079193115234, -0.01392364501953125, -0.011637210845947266, -0.009350776672363281, -0.007064342498779297, -0.0047779083251953125, -0.002491474151611328, -0.00020503997802734375, 0.0020813941955566406, 0.004367828369140625, 0.006654262542724609, 0.008940696716308594, 0.011227130889892578, 0.013513565063476562, 0.015799999237060547, 0.01808643341064453, 0.020372867584228516, 0.0226593017578125, 0.024945735931396484, 0.02723217010498047, 0.029518604278564453, 0.03180503845214844, 0.03409147262573242, 0.036377906799316406, 0.03866434097290039, 0.040950775146484375, 0.04323720932006836, 0.045523643493652344, 0.04781007766723633, 0.05009651184082031, 0.0523829460144043, 0.05466938018798828, 0.056955814361572266, 0.05924224853515625, 0.061528682708740234, 0.06381511688232422, 0.0661015510559082, 0.06838798522949219, 0.07067441940307617, 0.07296085357666016, 0.07524728775024414, 0.07753372192382812, 0.07982015609741211, 0.0821065902709961, 0.08439302444458008, 0.08667945861816406, 0.08896589279174805, 0.09125232696533203, 0.09353876113891602, 0.0958251953125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 6.0, 8.0, 16.0, 16.0, 43.0, 77.0, 106.0, 158.0, 158.0, 148.0, 118.0, 58.0, 43.0, 19.0, 10.0, 11.0, 9.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5261595845222473, -0.5014950037002563, -0.47683045268058777, -0.4521659016609192, -0.4275013208389282, -0.40283676981925964, -0.37817221879959106, -0.3535076379776001, -0.3288430869579315, -0.30417853593826294, -0.279513955116272, -0.2548494040966034, -0.23018483817577362, -0.20552027225494385, -0.18085572123527527, -0.1561911553144455, -0.13152658939361572, -0.10686202347278595, -0.08219746500253677, -0.0575329065322876, -0.032868340611457825, -0.008203774690628052, 0.016460776329040527, 0.0411253422498703, 0.06578990817070007, 0.09045447409152985, 0.11511903256177902, 0.1397835910320282, 0.16444815695285797, 0.18911272287368774, 0.21377727389335632, 0.2384418398141861, 0.2631063461303711, 0.2877708971500397, 0.31243547797203064, 0.3371000289916992, 0.3617646098136902, 0.38642916083335876, 0.41109371185302734, 0.4357582926750183, 0.4604228436946869, 0.48508739471435547, 0.5097519755363464, 0.5344165563583374, 0.5590810775756836, 0.5837456583976746, 0.6084102392196655, 0.6330747604370117, 0.6577393412590027, 0.6824039220809937, 0.7070684432983398, 0.7317330241203308, 0.7563976049423218, 0.781062126159668, 0.8057267069816589, 0.8303912878036499, 0.8550558090209961, 0.8797203898429871, 0.9043849110603333, 0.9290494918823242, 0.9537140727043152, 0.9783786535263062, 1.0030431747436523, 1.0277076959609985, 1.0523723363876343]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 6.0, 6.0, 7.0, 9.0, 9.0, 10.0, 17.0, 16.0, 23.0, 27.0, 25.0, 20.0, 31.0, 42.0, 30.0, 30.0, 36.0, 46.0, 40.0, 51.0, 38.0, 37.0, 38.0, 45.0, 46.0, 43.0, 40.0, 37.0, 35.0, 18.0, 30.0, 18.0, 14.0, 15.0, 18.0, 3.0, 10.0, 13.0, 2.0, 9.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.49666398763656616, -0.48125702142715454, -0.46585002541542053, -0.4504430294036865, -0.4350360631942749, -0.4196290969848633, -0.4042221009731293, -0.38881510496139526, -0.37340813875198364, -0.358001172542572, -0.342594176530838, -0.327187180519104, -0.3117802143096924, -0.29637324810028076, -0.28096625208854675, -0.26555925607681274, -0.2501522898674011, -0.2347453087568283, -0.2193383276462555, -0.20393134653568268, -0.18852436542510986, -0.17311738431453705, -0.15771040320396423, -0.14230342209339142, -0.1268964409828186, -0.11148945987224579, -0.09608247876167297, -0.08067549765110016, -0.06526851654052734, -0.04986153542995453, -0.034454554319381714, -0.0190475732088089, -0.003640592098236084, 0.011766389012336731, 0.027173370122909546, 0.04258035123348236, 0.057987332344055176, 0.07339431345462799, 0.0888012945652008, 0.10420827567577362, 0.11961525678634644, 0.13502223789691925, 0.15042921900749207, 0.16583620011806488, 0.1812431812286377, 0.1966501623392105, 0.21205714344978333, 0.22746412456035614, 0.24287110567092896, 0.2582780718803406, 0.2736850678920746, 0.2890920639038086, 0.3044990301132202, 0.31990599632263184, 0.33531299233436584, 0.35071998834609985, 0.3661269545555115, 0.3815339207649231, 0.3969409167766571, 0.4123479127883911, 0.42775487899780273, 0.44316184520721436, 0.45856884121894836, 0.4739758372306824, 0.489382803440094]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 9.0, 12.0, 10.0, 11.0, 15.0, 40.0, 42.0, 63.0, 92.0, 138.0, 206.0, 336.0, 541.0, 1004.0, 2046.0, 5136.0, 16182.0, 77559.0, 3638498.0, 396478.0, 38505.0, 9941.0, 3622.0, 1595.0, 798.0, 463.0, 298.0, 189.0, 122.0, 86.0, 63.0, 45.0, 39.0, 34.0, 12.0, 17.0, 11.0, 8.0, 6.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.12841796875, -0.12410926818847656, -0.11980056762695312, -0.11549186706542969, -0.11118316650390625, -0.10687446594238281, -0.10256576538085938, -0.09825706481933594, -0.0939483642578125, -0.08963966369628906, -0.08533096313476562, -0.08102226257324219, -0.07671356201171875, -0.07240486145019531, -0.06809616088867188, -0.06378746032714844, -0.059478759765625, -0.05517005920410156, -0.050861358642578125, -0.04655265808105469, -0.04224395751953125, -0.03793525695800781, -0.033626556396484375, -0.029317855834960938, -0.0250091552734375, -0.020700454711914062, -0.016391754150390625, -0.012083053588867188, -0.00777435302734375, -0.0034656524658203125, 0.000843048095703125, 0.0051517486572265625, 0.00946044921875, 0.013769149780273438, 0.018077850341796875, 0.022386550903320312, 0.02669525146484375, 0.031003952026367188, 0.035312652587890625, 0.03962135314941406, 0.0439300537109375, 0.04823875427246094, 0.052547454833984375, 0.05685615539550781, 0.06116485595703125, 0.06547355651855469, 0.06978225708007812, 0.07409095764160156, 0.078399658203125, 0.08270835876464844, 0.08701705932617188, 0.09132575988769531, 0.09563446044921875, 0.09994316101074219, 0.10425186157226562, 0.10856056213378906, 0.1128692626953125, 0.11717796325683594, 0.12148666381835938, 0.1257953643798828, 0.13010406494140625, 0.1344127655029297, 0.13872146606445312, 0.14303016662597656, 0.1473388671875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 6.0, 6.0, 6.0, 6.0, 11.0, 8.0, 16.0, 12.0, 22.0, 25.0, 42.0, 46.0, 53.0, 47.0, 69.0, 80.0, 71.0, 84.0, 73.0, 73.0, 39.0, 45.0, 32.0, 25.0, 24.0, 18.0, 15.0, 10.0, 8.0, 8.0, 7.0, 4.0, 2.0, 4.0, 5.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0196685791015625, -0.019065380096435547, -0.018462181091308594, -0.01785898208618164, -0.017255783081054688, -0.016652584075927734, -0.01604938507080078, -0.015446186065673828, -0.014842987060546875, -0.014239788055419922, -0.013636589050292969, -0.013033390045166016, -0.012430191040039062, -0.01182699203491211, -0.011223793029785156, -0.010620594024658203, -0.01001739501953125, -0.009414196014404297, -0.008810997009277344, -0.00820779800415039, -0.0076045989990234375, -0.007001399993896484, -0.006398200988769531, -0.005795001983642578, -0.005191802978515625, -0.004588603973388672, -0.003985404968261719, -0.0033822059631347656, -0.0027790069580078125, -0.0021758079528808594, -0.0015726089477539062, -0.0009694099426269531, -0.0003662109375, 0.00023698806762695312, 0.0008401870727539062, 0.0014433860778808594, 0.0020465850830078125, 0.0026497840881347656, 0.0032529830932617188, 0.003856182098388672, 0.004459381103515625, 0.005062580108642578, 0.005665779113769531, 0.006268978118896484, 0.0068721771240234375, 0.007475376129150391, 0.008078575134277344, 0.008681774139404297, 0.00928497314453125, 0.009888172149658203, 0.010491371154785156, 0.01109457015991211, 0.011697769165039062, 0.012300968170166016, 0.012904167175292969, 0.013507366180419922, 0.014110565185546875, 0.014713764190673828, 0.015316963195800781, 0.015920162200927734, 0.016523361206054688, 0.01712656021118164, 0.017729759216308594, 0.018332958221435547, 0.0189361572265625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 6.0, 8.0, 16.0, 35.0, 72.0, 103.0, 175.0, 366.0, 908.0, 1973.0, 5086.0, 15355.0, 59749.0, 555866.0, 3391310.0, 124937.0, 25298.0, 7843.0, 2825.0, 1165.0, 610.0, 280.0, 138.0, 63.0, 40.0, 27.0, 15.0, 7.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13427734375, -0.1305685043334961, -0.1268596649169922, -0.12315082550048828, -0.11944198608398438, -0.11573314666748047, -0.11202430725097656, -0.10831546783447266, -0.10460662841796875, -0.10089778900146484, -0.09718894958496094, -0.09348011016845703, -0.08977127075195312, -0.08606243133544922, -0.08235359191894531, -0.0786447525024414, -0.0749359130859375, -0.0712270736694336, -0.06751823425292969, -0.06380939483642578, -0.060100555419921875, -0.05639171600341797, -0.05268287658691406, -0.048974037170410156, -0.04526519775390625, -0.041556358337402344, -0.03784751892089844, -0.03413867950439453, -0.030429840087890625, -0.02672100067138672, -0.023012161254882812, -0.019303321838378906, -0.015594482421875, -0.011885643005371094, -0.008176803588867188, -0.004467964172363281, -0.000759124755859375, 0.0029497146606445312, 0.0066585540771484375, 0.010367393493652344, 0.01407623291015625, 0.017785072326660156, 0.021493911743164062, 0.02520275115966797, 0.028911590576171875, 0.03262042999267578, 0.03632926940917969, 0.040038108825683594, 0.0437469482421875, 0.047455787658691406, 0.05116462707519531, 0.05487346649169922, 0.058582305908203125, 0.06229114532470703, 0.06599998474121094, 0.06970882415771484, 0.07341766357421875, 0.07712650299072266, 0.08083534240722656, 0.08454418182373047, 0.08825302124023438, 0.09196186065673828, 0.09567070007324219, 0.0993795394897461, 0.10308837890625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 1.0, 1.0, 4.0, 2.0, 7.0, 6.0, 10.0, 12.0, 15.0, 20.0, 21.0, 26.0, 61.0, 90.0, 147.0, 235.0, 717.0, 1767.0, 419.0, 193.0, 101.0, 60.0, 43.0, 28.0, 28.0, 20.0, 7.0, 12.0, 8.0, 7.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0295257568359375, -0.028580665588378906, -0.027635574340820312, -0.02669048309326172, -0.025745391845703125, -0.02480030059814453, -0.023855209350585938, -0.022910118103027344, -0.02196502685546875, -0.021019935607910156, -0.020074844360351562, -0.01912975311279297, -0.018184661865234375, -0.01723957061767578, -0.016294479370117188, -0.015349388122558594, -0.014404296875, -0.013459205627441406, -0.012514114379882812, -0.011569023132324219, -0.010623931884765625, -0.009678840637207031, -0.008733749389648438, -0.007788658142089844, -0.00684356689453125, -0.005898475646972656, -0.0049533843994140625, -0.004008293151855469, -0.003063201904296875, -0.0021181106567382812, -0.0011730194091796875, -0.00022792816162109375, 0.0007171630859375, 0.0016622543334960938, 0.0026073455810546875, 0.0035524368286132812, 0.004497528076171875, 0.005442619323730469, 0.0063877105712890625, 0.007332801818847656, 0.00827789306640625, 0.009222984313964844, 0.010168075561523438, 0.011113166809082031, 0.012058258056640625, 0.013003349304199219, 0.013948440551757812, 0.014893531799316406, 0.015838623046875, 0.016783714294433594, 0.017728805541992188, 0.01867389678955078, 0.019618988037109375, 0.02056407928466797, 0.021509170532226562, 0.022454261779785156, 0.02339935302734375, 0.024344444274902344, 0.025289535522460938, 0.02623462677001953, 0.027179718017578125, 0.02812480926513672, 0.029069900512695312, 0.030014991760253906, 0.0309600830078125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 7.0, 5.0, 12.0, 20.0, 28.0, 31.0, 45.0, 55.0, 87.0, 111.0, 129.0, 111.0, 101.0, 75.0, 51.0, 45.0, 26.0, 18.0, 14.0, 6.0, 2.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10153816640377045, -0.09757574647665024, -0.09361332654953003, -0.08965090662240982, -0.08568848669528961, -0.0817260593175888, -0.0777636393904686, -0.07380121946334839, -0.06983879953622818, -0.06587637960910797, -0.06191395968198776, -0.057951536029577255, -0.053989116102457047, -0.05002669617533684, -0.04606427252292633, -0.04210185259580612, -0.03813943266868591, -0.034177012741565704, -0.030214590951800346, -0.02625216916203499, -0.02228974923491478, -0.01832732930779457, -0.014364907518029213, -0.010402485728263855, -0.006440065801143646, -0.002477644942700863, 0.0014847759157419205, 0.005447196774184704, 0.009409617632627487, 0.013372037559747696, 0.017334459349513054, 0.021296881139278412, 0.025259315967559814, 0.029221735894680023, 0.03318415582180023, 0.03714657947421074, 0.04110899940133095, 0.04507141932845116, 0.049033842980861664, 0.05299626290798187, 0.05695868283510208, 0.06092110276222229, 0.0648835226893425, 0.06884594261646271, 0.07280836999416351, 0.07677078247070312, 0.08073320984840393, 0.08469562977552414, 0.08865804970264435, 0.09262046962976456, 0.09658288955688477, 0.10054530948400497, 0.10450772941112518, 0.10847015678882599, 0.1124325767159462, 0.1163949966430664, 0.12035741657018661, 0.12431983649730682, 0.12828226387500763, 0.13224467635154724, 0.13620710372924805, 0.14016951620578766, 0.14413194358348846, 0.14809435606002808, 0.15205678343772888]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 1.0, 5.0, 8.0, 6.0, 6.0, 16.0, 17.0, 12.0, 16.0, 14.0, 22.0, 25.0, 28.0, 34.0, 41.0, 40.0, 30.0, 33.0, 40.0, 32.0, 50.0, 59.0, 31.0, 44.0, 44.0, 43.0, 35.0, 38.0, 42.0, 27.0, 22.0, 14.0, 20.0, 14.0, 20.0, 18.0, 5.0, 18.0, 8.0, 2.0, 2.0, 6.0, 5.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.08024102449417114, -0.07758000493049622, -0.07491899281740189, -0.07225797325372696, -0.06959696114063263, -0.0669359415769577, -0.06427492201328278, -0.06161390617489815, -0.05895289033651352, -0.05629187449812889, -0.05363085865974426, -0.050969839096069336, -0.04830882325768471, -0.04564780741930008, -0.04298678785562515, -0.040325772017240524, -0.037664756178855896, -0.03500374034047127, -0.03234272450208664, -0.029681704938411713, -0.027020689100027084, -0.024359673261642456, -0.02169865556061268, -0.0190376378595829, -0.016376622021198273, -0.01371560525149107, -0.011054588481783867, -0.008393571712076664, -0.005732554942369461, -0.003071538172662258, -0.00041052140295505524, 0.0022504962980747223, 0.004911512136459351, 0.0075725289061665535, 0.010233545675873756, 0.01289456244558096, 0.015555579215288162, 0.01821659505367279, 0.020877612754702568, 0.023538630455732346, 0.026199646294116974, 0.028860662132501602, 0.03152167797088623, 0.03418269753456116, 0.036843713372945786, 0.039504729211330414, 0.04216574877500534, 0.04482676461338997, 0.0474877804517746, 0.050148796290159225, 0.052809812128543854, 0.05547083169221878, 0.05813184753060341, 0.06079286336898804, 0.06345388293266296, 0.06611490249633789, 0.06877591460943222, 0.07143693417310715, 0.07409794628620148, 0.0767589658498764, 0.07941998541355133, 0.08208099752664566, 0.08474201709032059, 0.08740302920341492, 0.09006404876708984]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 7.0, 10.0, 27.0, 33.0, 32.0, 54.0, 74.0, 137.0, 144.0, 248.0, 394.0, 586.0, 837.0, 1564.0, 2573.0, 4250.0, 7376.0, 13223.0, 25448.0, 50624.0, 105914.0, 222735.0, 298507.0, 159194.0, 74791.0, 36437.0, 18901.0, 10208.0, 5473.0, 3216.0, 2052.0, 1188.0, 799.0, 474.0, 347.0, 213.0, 154.0, 103.0, 54.0, 46.0, 39.0, 17.0, 9.0, 7.0, 12.0, 6.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.055572509765625, -0.05390214920043945, -0.052231788635253906, -0.05056142807006836, -0.04889106750488281, -0.047220706939697266, -0.04555034637451172, -0.04387998580932617, -0.042209625244140625, -0.04053926467895508, -0.03886890411376953, -0.037198543548583984, -0.03552818298339844, -0.03385782241821289, -0.032187461853027344, -0.030517101287841797, -0.02884674072265625, -0.027176380157470703, -0.025506019592285156, -0.02383565902709961, -0.022165298461914062, -0.020494937896728516, -0.01882457733154297, -0.017154216766357422, -0.015483856201171875, -0.013813495635986328, -0.012143135070800781, -0.010472774505615234, -0.008802413940429688, -0.007132053375244141, -0.005461692810058594, -0.003791332244873047, -0.0021209716796875, -0.0004506111145019531, 0.0012197494506835938, 0.0028901100158691406, 0.0045604705810546875, 0.006230831146240234, 0.007901191711425781, 0.009571552276611328, 0.011241912841796875, 0.012912273406982422, 0.014582633972167969, 0.016252994537353516, 0.017923355102539062, 0.01959371566772461, 0.021264076232910156, 0.022934436798095703, 0.02460479736328125, 0.026275157928466797, 0.027945518493652344, 0.02961587905883789, 0.03128623962402344, 0.032956600189208984, 0.03462696075439453, 0.03629732131958008, 0.037967681884765625, 0.03963804244995117, 0.04130840301513672, 0.042978763580322266, 0.04464912414550781, 0.04631948471069336, 0.047989845275878906, 0.04966020584106445, 0.05133056640625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 7.0, 2.0, 5.0, 15.0, 12.0, 22.0, 18.0, 31.0, 29.0, 32.0, 50.0, 46.0, 72.0, 66.0, 64.0, 76.0, 63.0, 55.0, 59.0, 58.0, 42.0, 47.0, 22.0, 29.0, 15.0, 11.0, 7.0, 6.0, 9.0, 7.0, 2.0, 9.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.019561767578125, -0.018991708755493164, -0.018421649932861328, -0.017851591110229492, -0.017281532287597656, -0.01671147346496582, -0.016141414642333984, -0.015571355819702148, -0.015001296997070312, -0.014431238174438477, -0.01386117935180664, -0.013291120529174805, -0.012721061706542969, -0.012151002883911133, -0.011580944061279297, -0.011010885238647461, -0.010440826416015625, -0.009870767593383789, -0.009300708770751953, -0.008730649948120117, -0.008160591125488281, -0.007590532302856445, -0.007020473480224609, -0.0064504146575927734, -0.0058803558349609375, -0.0053102970123291016, -0.004740238189697266, -0.00417017936706543, -0.0036001205444335938, -0.003030061721801758, -0.002460002899169922, -0.001889944076538086, -0.00131988525390625, -0.0007498264312744141, -0.00017976760864257812, 0.0003902912139892578, 0.0009603500366210938, 0.0015304088592529297, 0.0021004676818847656, 0.0026705265045166016, 0.0032405853271484375, 0.0038106441497802734, 0.004380702972412109, 0.004950761795043945, 0.005520820617675781, 0.006090879440307617, 0.006660938262939453, 0.007230997085571289, 0.007801055908203125, 0.008371114730834961, 0.008941173553466797, 0.009511232376098633, 0.010081291198730469, 0.010651350021362305, 0.01122140884399414, 0.011791467666625977, 0.012361526489257812, 0.012931585311889648, 0.013501644134521484, 0.01407170295715332, 0.014641761779785156, 0.015211820602416992, 0.015781879425048828, 0.016351938247680664, 0.0169219970703125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 5.0, 9.0, 7.0, 8.0, 14.0, 17.0, 16.0, 30.0, 58.0, 68.0, 88.0, 119.0, 182.0, 245.0, 378.0, 596.0, 1022.0, 1885.0, 4027.0, 9376.0, 25054.0, 75623.0, 228990.0, 405571.0, 194491.0, 63303.0, 21265.0, 8167.0, 3557.0, 1628.0, 973.0, 585.0, 368.0, 235.0, 180.0, 111.0, 78.0, 51.0, 51.0, 33.0, 29.0, 18.0, 16.0, 8.0, 7.0, 4.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.071044921875, -0.06891918182373047, -0.06679344177246094, -0.0646677017211914, -0.06254196166992188, -0.060416221618652344, -0.05829048156738281, -0.05616474151611328, -0.05403900146484375, -0.05191326141357422, -0.04978752136230469, -0.047661781311035156, -0.045536041259765625, -0.043410301208496094, -0.04128456115722656, -0.03915882110595703, -0.0370330810546875, -0.03490734100341797, -0.03278160095214844, -0.030655860900878906, -0.028530120849609375, -0.026404380798339844, -0.024278640747070312, -0.02215290069580078, -0.02002716064453125, -0.01790142059326172, -0.015775680541992188, -0.013649940490722656, -0.011524200439453125, -0.009398460388183594, -0.0072727203369140625, -0.005146980285644531, -0.003021240234375, -0.0008955001831054688, 0.0012302398681640625, 0.0033559799194335938, 0.005481719970703125, 0.007607460021972656, 0.009733200073242188, 0.011858940124511719, 0.01398468017578125, 0.01611042022705078, 0.018236160278320312, 0.020361900329589844, 0.022487640380859375, 0.024613380432128906, 0.026739120483398438, 0.02886486053466797, 0.0309906005859375, 0.03311634063720703, 0.03524208068847656, 0.037367820739746094, 0.039493560791015625, 0.041619300842285156, 0.04374504089355469, 0.04587078094482422, 0.04799652099609375, 0.05012226104736328, 0.05224800109863281, 0.054373741149902344, 0.056499481201171875, 0.058625221252441406, 0.06075096130371094, 0.06287670135498047, 0.06500244140625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 5.0, 2.0, 3.0, 4.0, 5.0, 13.0, 10.0, 15.0, 18.0, 24.0, 22.0, 22.0, 28.0, 32.0, 25.0, 35.0, 34.0, 31.0, 47.0, 45.0, 53.0, 41.0, 46.0, 39.0, 38.0, 33.0, 43.0, 31.0, 32.0, 46.0, 25.0, 25.0, 20.0, 18.0, 15.0, 17.0, 14.0, 12.0, 5.0, 3.0, 8.0, 7.0, 3.0, 3.0, 4.0, 5.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.0765380859375, -0.07442569732666016, -0.07231330871582031, -0.07020092010498047, -0.06808853149414062, -0.06597614288330078, -0.06386375427246094, -0.061751365661621094, -0.05963897705078125, -0.057526588439941406, -0.05541419982910156, -0.05330181121826172, -0.051189422607421875, -0.04907703399658203, -0.04696464538574219, -0.044852256774902344, -0.0427398681640625, -0.040627479553222656, -0.03851509094238281, -0.03640270233154297, -0.034290313720703125, -0.03217792510986328, -0.030065536499023438, -0.027953147888183594, -0.02584075927734375, -0.023728370666503906, -0.021615982055664062, -0.01950359344482422, -0.017391204833984375, -0.015278816223144531, -0.013166427612304688, -0.011054039001464844, -0.008941650390625, -0.006829261779785156, -0.0047168731689453125, -0.0026044845581054688, -0.000492095947265625, 0.0016202926635742188, 0.0037326812744140625, 0.005845069885253906, 0.00795745849609375, 0.010069847106933594, 0.012182235717773438, 0.014294624328613281, 0.016407012939453125, 0.01851940155029297, 0.020631790161132812, 0.022744178771972656, 0.0248565673828125, 0.026968955993652344, 0.029081344604492188, 0.03119373321533203, 0.033306121826171875, 0.03541851043701172, 0.03753089904785156, 0.039643287658691406, 0.04175567626953125, 0.043868064880371094, 0.04598045349121094, 0.04809284210205078, 0.050205230712890625, 0.05231761932373047, 0.05443000793457031, 0.056542396545410156, 0.05865478515625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 7.0, 15.0, 13.0, 15.0, 23.0, 34.0, 55.0, 78.0, 96.0, 139.0, 243.0, 449.0, 728.0, 1332.0, 2706.0, 5568.0, 13143.0, 34961.0, 105435.0, 351051.0, 361193.0, 109679.0, 36006.0, 13630.0, 5749.0, 2790.0, 1382.0, 764.0, 463.0, 274.0, 183.0, 106.0, 81.0, 44.0, 35.0, 17.0, 18.0, 14.0, 8.0, 6.0, 1.0, 7.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.03448486328125, -0.033471107482910156, -0.03245735168457031, -0.03144359588623047, -0.030429840087890625, -0.02941608428955078, -0.028402328491210938, -0.027388572692871094, -0.02637481689453125, -0.025361061096191406, -0.024347305297851562, -0.02333354949951172, -0.022319793701171875, -0.02130603790283203, -0.020292282104492188, -0.019278526306152344, -0.0182647705078125, -0.017251014709472656, -0.016237258911132812, -0.015223503112792969, -0.014209747314453125, -0.013195991516113281, -0.012182235717773438, -0.011168479919433594, -0.01015472412109375, -0.009140968322753906, -0.008127212524414062, -0.007113456726074219, -0.006099700927734375, -0.005085945129394531, -0.0040721893310546875, -0.0030584335327148438, -0.002044677734375, -0.0010309219360351562, -1.71661376953125e-05, 0.0009965896606445312, 0.002010345458984375, 0.0030241012573242188, 0.0040378570556640625, 0.005051612854003906, 0.00606536865234375, 0.007079124450683594, 0.008092880249023438, 0.009106636047363281, 0.010120391845703125, 0.011134147644042969, 0.012147903442382812, 0.013161659240722656, 0.0141754150390625, 0.015189170837402344, 0.016202926635742188, 0.01721668243408203, 0.018230438232421875, 0.01924419403076172, 0.020257949829101562, 0.021271705627441406, 0.02228546142578125, 0.023299217224121094, 0.024312973022460938, 0.02532672882080078, 0.026340484619140625, 0.02735424041748047, 0.028367996215820312, 0.029381752014160156, 0.0303955078125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 13.0, 15.0, 16.0, 28.0, 34.0, 46.0, 45.0, 86.0, 85.0, 86.0, 100.0, 108.0, 69.0, 70.0, 47.0, 43.0, 28.0, 25.0, 12.0, 8.0, 5.0, 5.0, 5.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.7087669372558594e-05, -4.5942142605781555e-05, -4.4796615839004517e-05, -4.365108907222748e-05, -4.250556230545044e-05, -4.13600355386734e-05, -4.021450877189636e-05, -3.9068982005119324e-05, -3.7923455238342285e-05, -3.6777928471565247e-05, -3.563240170478821e-05, -3.448687493801117e-05, -3.334134817123413e-05, -3.219582140445709e-05, -3.1050294637680054e-05, -2.9904767870903015e-05, -2.8759241104125977e-05, -2.7613714337348938e-05, -2.64681875705719e-05, -2.532266080379486e-05, -2.4177134037017822e-05, -2.3031607270240784e-05, -2.1886080503463745e-05, -2.0740553736686707e-05, -1.9595026969909668e-05, -1.844950020313263e-05, -1.730397343635559e-05, -1.6158446669578552e-05, -1.5012919902801514e-05, -1.3867393136024475e-05, -1.2721866369247437e-05, -1.1576339602470398e-05, -1.043081283569336e-05, -9.28528606891632e-06, -8.139759302139282e-06, -6.994232535362244e-06, -5.848705768585205e-06, -4.7031790018081665e-06, -3.557652235031128e-06, -2.4121254682540894e-06, -1.2665987014770508e-06, -1.210719347000122e-07, 1.0244548320770264e-06, 2.169981598854065e-06, 3.3155083656311035e-06, 4.461035132408142e-06, 5.606561899185181e-06, 6.752088665962219e-06, 7.897615432739258e-06, 9.043142199516296e-06, 1.0188668966293335e-05, 1.1334195733070374e-05, 1.2479722499847412e-05, 1.362524926662445e-05, 1.477077603340149e-05, 1.5916302800178528e-05, 1.7061829566955566e-05, 1.8207356333732605e-05, 1.9352883100509644e-05, 2.0498409867286682e-05, 2.164393663406372e-05, 2.278946340084076e-05, 2.3934990167617798e-05, 2.5080516934394836e-05, 2.6226043701171875e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 5.0, 4.0, 14.0, 11.0, 15.0, 25.0, 29.0, 51.0, 93.0, 132.0, 260.0, 433.0, 890.0, 2231.0, 6922.0, 29549.0, 167603.0, 631490.0, 168106.0, 29552.0, 6970.0, 2183.0, 968.0, 457.0, 222.0, 137.0, 71.0, 47.0, 28.0, 22.0, 11.0, 7.0, 10.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052520751953125, -0.050952911376953125, -0.04938507080078125, -0.047817230224609375, -0.0462493896484375, -0.044681549072265625, -0.04311370849609375, -0.041545867919921875, -0.03997802734375, -0.038410186767578125, -0.03684234619140625, -0.035274505615234375, -0.0337066650390625, -0.032138824462890625, -0.03057098388671875, -0.029003143310546875, -0.027435302734375, -0.025867462158203125, -0.02429962158203125, -0.022731781005859375, -0.0211639404296875, -0.019596099853515625, -0.01802825927734375, -0.016460418701171875, -0.014892578125, -0.013324737548828125, -0.01175689697265625, -0.010189056396484375, -0.0086212158203125, -0.007053375244140625, -0.00548553466796875, -0.003917694091796875, -0.002349853515625, -0.000782012939453125, 0.00078582763671875, 0.002353668212890625, 0.0039215087890625, 0.005489349365234375, 0.00705718994140625, 0.008625030517578125, 0.01019287109375, 0.011760711669921875, 0.01332855224609375, 0.014896392822265625, 0.0164642333984375, 0.018032073974609375, 0.01959991455078125, 0.021167755126953125, 0.022735595703125, 0.024303436279296875, 0.02587127685546875, 0.027439117431640625, 0.0290069580078125, 0.030574798583984375, 0.03214263916015625, 0.033710479736328125, 0.0352783203125, 0.036846160888671875, 0.03841400146484375, 0.039981842041015625, 0.0415496826171875, 0.043117523193359375, 0.04468536376953125, 0.046253204345703125, 0.047821044921875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 4.0, 8.0, 9.0, 4.0, 9.0, 13.0, 18.0, 33.0, 51.0, 49.0, 73.0, 98.0, 102.0, 118.0, 105.0, 89.0, 65.0, 45.0, 34.0, 29.0, 19.0, 14.0, 8.0, 7.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.05975341796875, -0.05840444564819336, -0.05705547332763672, -0.05570650100708008, -0.05435752868652344, -0.0530085563659668, -0.051659584045410156, -0.050310611724853516, -0.048961639404296875, -0.047612667083740234, -0.046263694763183594, -0.04491472244262695, -0.04356575012207031, -0.04221677780151367, -0.04086780548095703, -0.03951883316040039, -0.03816986083984375, -0.03682088851928711, -0.03547191619873047, -0.03412294387817383, -0.03277397155761719, -0.03142499923706055, -0.030076026916503906, -0.028727054595947266, -0.027378082275390625, -0.026029109954833984, -0.024680137634277344, -0.023331165313720703, -0.021982192993164062, -0.020633220672607422, -0.01928424835205078, -0.01793527603149414, -0.0165863037109375, -0.01523733139038086, -0.013888359069824219, -0.012539386749267578, -0.011190414428710938, -0.009841442108154297, -0.008492469787597656, -0.007143497467041016, -0.005794525146484375, -0.004445552825927734, -0.0030965805053710938, -0.0017476081848144531, -0.0003986358642578125, 0.0009503364562988281, 0.0022993087768554688, 0.0036482810974121094, 0.00499725341796875, 0.006346225738525391, 0.007695198059082031, 0.009044170379638672, 0.010393142700195312, 0.011742115020751953, 0.013091087341308594, 0.014440059661865234, 0.015789031982421875, 0.017138004302978516, 0.018486976623535156, 0.019835948944091797, 0.021184921264648438, 0.022533893585205078, 0.02388286590576172, 0.02523183822631836, 0.026580810546875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 13.0, 16.0, 49.0, 117.0, 219.0, 235.0, 177.0, 115.0, 33.0, 18.0, 12.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42393758893013, -0.39454230666160583, -0.36514702439308167, -0.3357517421245575, -0.3063564598560333, -0.27696117758750916, -0.24756589531898499, -0.21817061305046082, -0.18877533078193665, -0.15938004851341248, -0.1299847662448883, -0.10058948397636414, -0.07119420170783997, -0.041798919439315796, -0.012403637170791626, 0.016991645097732544, 0.046386927366256714, 0.07578220963478088, 0.10517749190330505, 0.13457277417182922, 0.1639680564403534, 0.19336333870887756, 0.22275862097740173, 0.2521539032459259, 0.2815491855144501, 0.31094446778297424, 0.3403397500514984, 0.3697350323200226, 0.39913031458854675, 0.4285255968570709, 0.4579208791255951, 0.48731616139411926, 0.5167114734649658, 0.54610675573349, 0.5755020380020142, 0.6048973202705383, 0.6342926025390625, 0.6636878848075867, 0.6930831670761108, 0.722478449344635, 0.7518737316131592, 0.7812690138816833, 0.8106642961502075, 0.8400595784187317, 0.8694548606872559, 0.89885014295578, 0.9282454252243042, 0.9576407074928284, 0.9870359897613525, 1.0164313316345215, 1.0458265542984009, 1.0752217769622803, 1.1046171188354492, 1.1340124607086182, 1.1634076833724976, 1.192802906036377, 1.222198247909546, 1.2515935897827148, 1.2809888124465942, 1.3103840351104736, 1.3397793769836426, 1.3691747188568115, 1.398569941520691, 1.4279651641845703, 1.4573605060577393]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 5.0, 5.0, 7.0, 8.0, 9.0, 9.0, 10.0, 13.0, 19.0, 23.0, 24.0, 22.0, 25.0, 34.0, 40.0, 37.0, 54.0, 38.0, 61.0, 48.0, 52.0, 57.0, 61.0, 43.0, 50.0, 40.0, 34.0, 23.0, 19.0, 20.0, 21.0, 24.0, 15.0, 13.0, 13.0, 10.0, 3.0, 3.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.5078218579292297, -0.4937440752983093, -0.4796662926673889, -0.4655885100364685, -0.4515107274055481, -0.4374329447746277, -0.4233551621437073, -0.40927737951278687, -0.39519959688186646, -0.38112181425094604, -0.36704403162002563, -0.3529662489891052, -0.3388884663581848, -0.3248106837272644, -0.310732901096344, -0.2966551184654236, -0.2825773358345032, -0.26849955320358276, -0.25442177057266235, -0.24034398794174194, -0.22626620531082153, -0.21218842267990112, -0.1981106400489807, -0.1840328574180603, -0.1699550747871399, -0.15587729215621948, -0.14179950952529907, -0.12772172689437866, -0.11364394426345825, -0.09956616163253784, -0.08548837900161743, -0.07141059637069702, -0.05733281373977661, -0.0432550311088562, -0.02917724847793579, -0.01509946584701538, -0.0010216832160949707, 0.01305609941482544, 0.02713388204574585, 0.04121166467666626, 0.05528944730758667, 0.06936722993850708, 0.08344501256942749, 0.0975227952003479, 0.11160057783126831, 0.12567836046218872, 0.13975614309310913, 0.15383392572402954, 0.16791170835494995, 0.18198949098587036, 0.19606727361679077, 0.21014505624771118, 0.2242228388786316, 0.238300621509552, 0.2523784041404724, 0.2664561867713928, 0.28053396940231323, 0.29461175203323364, 0.30868953466415405, 0.32276731729507446, 0.3368450999259949, 0.3509228825569153, 0.3650006651878357, 0.3790784478187561, 0.3931562304496765]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 7.0, 5.0, 7.0, 9.0, 11.0, 18.0, 28.0, 40.0, 81.0, 106.0, 141.0, 235.0, 379.0, 612.0, 1035.0, 1793.0, 3568.0, 7368.0, 17966.0, 58294.0, 507898.0, 3451142.0, 98614.0, 25213.0, 9634.0, 4447.0, 2297.0, 1273.0, 741.0, 420.0, 266.0, 199.0, 150.0, 92.0, 61.0, 44.0, 31.0, 22.0, 15.0, 7.0, 2.0, 7.0, 1.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0804443359375, -0.07758903503417969, -0.07473373413085938, -0.07187843322753906, -0.06902313232421875, -0.06616783142089844, -0.06331253051757812, -0.06045722961425781, -0.0576019287109375, -0.05474662780761719, -0.051891326904296875, -0.04903602600097656, -0.04618072509765625, -0.04332542419433594, -0.040470123291015625, -0.03761482238769531, -0.034759521484375, -0.03190422058105469, -0.029048919677734375, -0.026193618774414062, -0.02333831787109375, -0.020483016967773438, -0.017627716064453125, -0.014772415161132812, -0.0119171142578125, -0.009061813354492188, -0.006206512451171875, -0.0033512115478515625, -0.00049591064453125, 0.0023593902587890625, 0.005214691162109375, 0.008069992065429688, 0.01092529296875, 0.013780593872070312, 0.016635894775390625, 0.019491195678710938, 0.02234649658203125, 0.025201797485351562, 0.028057098388671875, 0.030912399291992188, 0.0337677001953125, 0.03662300109863281, 0.039478302001953125, 0.04233360290527344, 0.04518890380859375, 0.04804420471191406, 0.050899505615234375, 0.05375480651855469, 0.056610107421875, 0.05946540832519531, 0.062320709228515625, 0.06517601013183594, 0.06803131103515625, 0.07088661193847656, 0.07374191284179688, 0.07659721374511719, 0.0794525146484375, 0.08230781555175781, 0.08516311645507812, 0.08801841735839844, 0.09087371826171875, 0.09372901916503906, 0.09658432006835938, 0.09943962097167969, 0.102294921875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 5.0, 9.0, 13.0, 6.0, 19.0, 18.0, 26.0, 29.0, 33.0, 37.0, 52.0, 50.0, 49.0, 64.0, 57.0, 64.0, 67.0, 60.0, 55.0, 33.0, 37.0, 47.0, 30.0, 24.0, 21.0, 14.0, 20.0, 14.0, 6.0, 9.0, 4.0, 3.0, 3.0, 6.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0189056396484375, -0.0183560848236084, -0.017806529998779297, -0.017256975173950195, -0.016707420349121094, -0.016157865524291992, -0.01560831069946289, -0.015058755874633789, -0.014509201049804688, -0.013959646224975586, -0.013410091400146484, -0.012860536575317383, -0.012310981750488281, -0.01176142692565918, -0.011211872100830078, -0.010662317276000977, -0.010112762451171875, -0.009563207626342773, -0.009013652801513672, -0.00846409797668457, -0.007914543151855469, -0.007364988327026367, -0.006815433502197266, -0.006265878677368164, -0.0057163238525390625, -0.005166769027709961, -0.004617214202880859, -0.004067659378051758, -0.0035181045532226562, -0.0029685497283935547, -0.002418994903564453, -0.0018694400787353516, -0.00131988525390625, -0.0007703304290771484, -0.00022077560424804688, 0.0003287792205810547, 0.0008783340454101562, 0.0014278888702392578, 0.0019774436950683594, 0.002526998519897461, 0.0030765533447265625, 0.003626108169555664, 0.004175662994384766, 0.004725217819213867, 0.005274772644042969, 0.00582432746887207, 0.006373882293701172, 0.0069234371185302734, 0.007472991943359375, 0.008022546768188477, 0.008572101593017578, 0.00912165641784668, 0.009671211242675781, 0.010220766067504883, 0.010770320892333984, 0.011319875717163086, 0.011869430541992188, 0.012418985366821289, 0.01296854019165039, 0.013518095016479492, 0.014067649841308594, 0.014617204666137695, 0.015166759490966797, 0.0157163143157959, 0.016265869140625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 5.0, 11.0, 12.0, 30.0, 29.0, 41.0, 68.0, 90.0, 201.0, 369.0, 747.0, 1808.0, 4738.0, 14161.0, 60029.0, 773628.0, 3213419.0, 94480.0, 19564.0, 6198.0, 2341.0, 1042.0, 496.0, 285.0, 156.0, 100.0, 67.0, 54.0, 36.0, 28.0, 14.0, 7.0, 10.0, 9.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08697509765625, -0.08336925506591797, -0.07976341247558594, -0.0761575698852539, -0.07255172729492188, -0.06894588470458984, -0.06534004211425781, -0.06173419952392578, -0.05812835693359375, -0.05452251434326172, -0.05091667175292969, -0.047310829162597656, -0.043704986572265625, -0.040099143981933594, -0.03649330139160156, -0.03288745880126953, -0.0292816162109375, -0.02567577362060547, -0.022069931030273438, -0.018464088439941406, -0.014858245849609375, -0.011252403259277344, -0.0076465606689453125, -0.004040718078613281, -0.00043487548828125, 0.0031709671020507812, 0.0067768096923828125, 0.010382652282714844, 0.013988494873046875, 0.017594337463378906, 0.021200180053710938, 0.02480602264404297, 0.028411865234375, 0.03201770782470703, 0.03562355041503906, 0.039229393005371094, 0.042835235595703125, 0.046441078186035156, 0.05004692077636719, 0.05365276336669922, 0.05725860595703125, 0.06086444854736328, 0.06447029113769531, 0.06807613372802734, 0.07168197631835938, 0.0752878189086914, 0.07889366149902344, 0.08249950408935547, 0.0861053466796875, 0.08971118927001953, 0.09331703186035156, 0.0969228744506836, 0.10052871704101562, 0.10413455963134766, 0.10774040222167969, 0.11134624481201172, 0.11495208740234375, 0.11855792999267578, 0.12216377258300781, 0.12576961517333984, 0.12937545776367188, 0.1329813003540039, 0.13658714294433594, 0.14019298553466797, 0.143798828125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 7.0, 14.0, 11.0, 24.0, 40.0, 59.0, 93.0, 173.0, 395.0, 2043.0, 635.0, 247.0, 117.0, 72.0, 46.0, 26.0, 19.0, 5.0, 19.0, 6.0, 4.0, 6.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0232086181640625, -0.02208685874938965, -0.020965099334716797, -0.019843339920043945, -0.018721580505371094, -0.017599821090698242, -0.01647806167602539, -0.015356302261352539, -0.014234542846679688, -0.013112783432006836, -0.011991024017333984, -0.010869264602661133, -0.009747505187988281, -0.00862574577331543, -0.007503986358642578, -0.0063822269439697266, -0.005260467529296875, -0.0041387081146240234, -0.003016948699951172, -0.0018951892852783203, -0.0007734298706054688, 0.0003483295440673828, 0.0014700889587402344, 0.002591848373413086, 0.0037136077880859375, 0.004835367202758789, 0.005957126617431641, 0.007078886032104492, 0.008200645446777344, 0.009322404861450195, 0.010444164276123047, 0.011565923690795898, 0.01268768310546875, 0.013809442520141602, 0.014931201934814453, 0.016052961349487305, 0.017174720764160156, 0.018296480178833008, 0.01941823959350586, 0.02053999900817871, 0.021661758422851562, 0.022783517837524414, 0.023905277252197266, 0.025027036666870117, 0.02614879608154297, 0.02727055549621582, 0.028392314910888672, 0.029514074325561523, 0.030635833740234375, 0.03175759315490723, 0.03287935256958008, 0.03400111198425293, 0.03512287139892578, 0.03624463081359863, 0.037366390228271484, 0.038488149642944336, 0.03960990905761719, 0.04073166847229004, 0.04185342788696289, 0.04297518730163574, 0.044096946716308594, 0.045218706130981445, 0.0463404655456543, 0.04746222496032715, 0.048583984375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 12.0, 27.0, 69.0, 131.0, 277.0, 254.0, 152.0, 45.0, 30.0, 7.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13349102437496185, -0.12308056652545929, -0.11267010867595673, -0.10225965082645416, -0.0918491929769516, -0.08143873512744904, -0.07102828472852707, -0.060617826879024506, -0.05020736902952194, -0.03979691118001938, -0.029386455193161964, -0.01897599920630455, -0.008565541356801987, 0.0018449164927005768, 0.012255370616912842, 0.022665828466415405, 0.03307628631591797, 0.04348674416542053, 0.053897202014923096, 0.06430765986442566, 0.07471811771392822, 0.08512857556343079, 0.09553902596235275, 0.10594948381185532, 0.11635994166135788, 0.12677039206027985, 0.1371808499097824, 0.14759130775928497, 0.15800176560878754, 0.1684122234582901, 0.17882268130779266, 0.18923313915729523, 0.1996435821056366, 0.21005403995513916, 0.22046449780464172, 0.2308749556541443, 0.24128541350364685, 0.2516958713531494, 0.262106329202652, 0.27251678705215454, 0.2829272449016571, 0.29333770275115967, 0.30374816060066223, 0.3141586184501648, 0.32456907629966736, 0.3349795341491699, 0.3453899919986725, 0.35580044984817505, 0.3662108778953552, 0.3766213357448578, 0.38703179359436035, 0.3974422514438629, 0.4078527092933655, 0.41826316714286804, 0.4286736249923706, 0.43908408284187317, 0.44949454069137573, 0.4599049985408783, 0.47031545639038086, 0.4807259142398834, 0.491136372089386, 0.5015468001365662, 0.5119572877883911, 0.5223677158355713, 0.5327782034873962]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 3.0, 9.0, 0.0, 4.0, 4.0, 7.0, 8.0, 11.0, 19.0, 13.0, 28.0, 13.0, 20.0, 26.0, 31.0, 20.0, 25.0, 38.0, 47.0, 58.0, 34.0, 53.0, 49.0, 37.0, 39.0, 42.0, 34.0, 42.0, 34.0, 41.0, 28.0, 25.0, 31.0, 26.0, 15.0, 24.0, 14.0, 13.0, 10.0, 3.0, 7.0, 6.0, 4.0, 4.0, 6.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09318786859512329, -0.0903608500957489, -0.08753383159637451, -0.08470682054758072, -0.08187980204820633, -0.07905278354883194, -0.07622577250003815, -0.07339875400066376, -0.07057173550128937, -0.06774471700191498, -0.06491769850254059, -0.062090687453746796, -0.059263668954372406, -0.056436650454998016, -0.053609635680913925, -0.050782620906829834, -0.047955602407455444, -0.045128583908081055, -0.042301569133996964, -0.03947455435991287, -0.03664753586053848, -0.03382051736116409, -0.030993502587080002, -0.02816648595035076, -0.02533946931362152, -0.02251245267689228, -0.01968543604016304, -0.0168584194034338, -0.01403140276670456, -0.011204386129975319, -0.008377369493246078, -0.005550352856516838, -0.0027233362197875977, 0.00010368041694164276, 0.002930697053670883, 0.005757713690400124, 0.008584730327129364, 0.011411746963858604, 0.014238763600587845, 0.017065780237317085, 0.019892796874046326, 0.022719813510775566, 0.025546830147504807, 0.028373846784234047, 0.031200863420963287, 0.03402788192033768, 0.03685489669442177, 0.03968191146850586, 0.04250892996788025, 0.04533594846725464, 0.04816296324133873, 0.05098997801542282, 0.05381699651479721, 0.0566440150141716, 0.05947102978825569, 0.06229804456233978, 0.06512506306171417, 0.06795208156108856, 0.07077910006046295, 0.07360611110925674, 0.07643312960863113, 0.07926014810800552, 0.08208715915679932, 0.0849141776561737, 0.0877411961555481]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 8.0, 10.0, 8.0, 13.0, 17.0, 31.0, 32.0, 51.0, 80.0, 112.0, 185.0, 252.0, 421.0, 667.0, 952.0, 1607.0, 2761.0, 4824.0, 8505.0, 15951.0, 31413.0, 62896.0, 131228.0, 254376.0, 261716.0, 135650.0, 65164.0, 32220.0, 16498.0, 8725.0, 4844.0, 2761.0, 1609.0, 1015.0, 661.0, 443.0, 266.0, 187.0, 118.0, 86.0, 49.0, 46.0, 27.0, 18.0, 17.0, 8.0, 7.0, 9.0, 6.0, 4.0, 2.0, 2.0], "bins": [-0.05615234375, -0.054593563079833984, -0.05303478240966797, -0.05147600173950195, -0.04991722106933594, -0.04835844039916992, -0.046799659729003906, -0.04524087905883789, -0.043682098388671875, -0.04212331771850586, -0.040564537048339844, -0.03900575637817383, -0.03744697570800781, -0.0358881950378418, -0.03432941436767578, -0.032770633697509766, -0.03121185302734375, -0.029653072357177734, -0.02809429168701172, -0.026535511016845703, -0.024976730346679688, -0.023417949676513672, -0.021859169006347656, -0.02030038833618164, -0.018741607666015625, -0.01718282699584961, -0.015624046325683594, -0.014065265655517578, -0.012506484985351562, -0.010947704315185547, -0.009388923645019531, -0.007830142974853516, -0.0062713623046875, -0.004712581634521484, -0.0031538009643554688, -0.0015950202941894531, -3.62396240234375e-05, 0.0015225410461425781, 0.0030813217163085938, 0.004640102386474609, 0.006198883056640625, 0.007757663726806641, 0.009316444396972656, 0.010875225067138672, 0.012434005737304688, 0.013992786407470703, 0.015551567077636719, 0.017110347747802734, 0.01866912841796875, 0.020227909088134766, 0.02178668975830078, 0.023345470428466797, 0.024904251098632812, 0.026463031768798828, 0.028021812438964844, 0.02958059310913086, 0.031139373779296875, 0.03269815444946289, 0.034256935119628906, 0.03581571578979492, 0.03737449645996094, 0.03893327713012695, 0.04049205780029297, 0.042050838470458984, 0.043609619140625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 6.0, 6.0, 7.0, 7.0, 13.0, 19.0, 24.0, 28.0, 28.0, 53.0, 39.0, 45.0, 63.0, 64.0, 53.0, 62.0, 65.0, 63.0, 63.0, 40.0, 51.0, 47.0, 29.0, 21.0, 25.0, 17.0, 13.0, 12.0, 6.0, 6.0, 8.0, 7.0, 1.0, 5.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0204620361328125, -0.01987171173095703, -0.019281387329101562, -0.018691062927246094, -0.018100738525390625, -0.017510414123535156, -0.016920089721679688, -0.01632976531982422, -0.01573944091796875, -0.015149116516113281, -0.014558792114257812, -0.013968467712402344, -0.013378143310546875, -0.012787818908691406, -0.012197494506835938, -0.011607170104980469, -0.011016845703125, -0.010426521301269531, -0.009836196899414062, -0.009245872497558594, -0.008655548095703125, -0.008065223693847656, -0.0074748992919921875, -0.006884574890136719, -0.00629425048828125, -0.005703926086425781, -0.0051136016845703125, -0.004523277282714844, -0.003932952880859375, -0.0033426284790039062, -0.0027523040771484375, -0.0021619796752929688, -0.0015716552734375, -0.0009813308715820312, -0.0003910064697265625, 0.00019931793212890625, 0.000789642333984375, 0.0013799667358398438, 0.0019702911376953125, 0.0025606155395507812, 0.00315093994140625, 0.0037412643432617188, 0.0043315887451171875, 0.004921913146972656, 0.005512237548828125, 0.006102561950683594, 0.0066928863525390625, 0.007283210754394531, 0.00787353515625, 0.008463859558105469, 0.009054183959960938, 0.009644508361816406, 0.010234832763671875, 0.010825157165527344, 0.011415481567382812, 0.012005805969238281, 0.01259613037109375, 0.013186454772949219, 0.013776779174804688, 0.014367103576660156, 0.014957427978515625, 0.015547752380371094, 0.016138076782226562, 0.01672840118408203, 0.0173187255859375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 6.0, 10.0, 5.0, 11.0, 13.0, 20.0, 36.0, 49.0, 72.0, 103.0, 180.0, 214.0, 367.0, 627.0, 1144.0, 2440.0, 5743.0, 17459.0, 62121.0, 246050.0, 473241.0, 172974.0, 43915.0, 12901.0, 4458.0, 1951.0, 953.0, 532.0, 320.0, 213.0, 128.0, 83.0, 69.0, 51.0, 28.0, 20.0, 18.0, 12.0, 13.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06781005859375, -0.06533241271972656, -0.06285476684570312, -0.06037712097167969, -0.05789947509765625, -0.05542182922363281, -0.052944183349609375, -0.05046653747558594, -0.0479888916015625, -0.04551124572753906, -0.043033599853515625, -0.04055595397949219, -0.03807830810546875, -0.03560066223144531, -0.033123016357421875, -0.030645370483398438, -0.028167724609375, -0.025690078735351562, -0.023212432861328125, -0.020734786987304688, -0.01825714111328125, -0.015779495239257812, -0.013301849365234375, -0.010824203491210938, -0.0083465576171875, -0.0058689117431640625, -0.003391265869140625, -0.0009136199951171875, 0.00156402587890625, 0.0040416717529296875, 0.006519317626953125, 0.008996963500976562, 0.011474609375, 0.013952255249023438, 0.016429901123046875, 0.018907546997070312, 0.02138519287109375, 0.023862838745117188, 0.026340484619140625, 0.028818130493164062, 0.0312957763671875, 0.03377342224121094, 0.036251068115234375, 0.03872871398925781, 0.04120635986328125, 0.04368400573730469, 0.046161651611328125, 0.04863929748535156, 0.051116943359375, 0.05359458923339844, 0.056072235107421875, 0.05854988098144531, 0.06102752685546875, 0.06350517272949219, 0.06598281860351562, 0.06846046447753906, 0.0709381103515625, 0.07341575622558594, 0.07589340209960938, 0.07837104797363281, 0.08084869384765625, 0.08332633972167969, 0.08580398559570312, 0.08828163146972656, 0.09075927734375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 1.0, 7.0, 4.0, 3.0, 6.0, 12.0, 17.0, 20.0, 18.0, 18.0, 21.0, 24.0, 32.0, 34.0, 31.0, 41.0, 42.0, 49.0, 42.0, 42.0, 35.0, 41.0, 45.0, 41.0, 46.0, 38.0, 37.0, 35.0, 31.0, 26.0, 20.0, 24.0, 28.0, 19.0, 19.0, 8.0, 9.0, 6.0, 8.0, 3.0, 7.0, 7.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06634521484375, -0.06415367126464844, -0.061962127685546875, -0.05977058410644531, -0.05757904052734375, -0.05538749694824219, -0.053195953369140625, -0.05100440979003906, -0.0488128662109375, -0.04662132263183594, -0.044429779052734375, -0.04223823547363281, -0.04004669189453125, -0.03785514831542969, -0.035663604736328125, -0.03347206115722656, -0.031280517578125, -0.029088973999023438, -0.026897430419921875, -0.024705886840820312, -0.02251434326171875, -0.020322799682617188, -0.018131256103515625, -0.015939712524414062, -0.0137481689453125, -0.011556625366210938, -0.009365081787109375, -0.0071735382080078125, -0.00498199462890625, -0.0027904510498046875, -0.000598907470703125, 0.0015926361083984375, 0.0037841796875, 0.0059757232666015625, 0.008167266845703125, 0.010358810424804688, 0.01255035400390625, 0.014741897583007812, 0.016933441162109375, 0.019124984741210938, 0.0213165283203125, 0.023508071899414062, 0.025699615478515625, 0.027891159057617188, 0.03008270263671875, 0.03227424621582031, 0.034465789794921875, 0.03665733337402344, 0.038848876953125, 0.04104042053222656, 0.043231964111328125, 0.04542350769042969, 0.04761505126953125, 0.04980659484863281, 0.051998138427734375, 0.05418968200683594, 0.0563812255859375, 0.05857276916503906, 0.060764312744140625, 0.06295585632324219, 0.06514739990234375, 0.06733894348144531, 0.06953048706054688, 0.07172203063964844, 0.07391357421875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 4.0, 1.0, 7.0, 10.0, 10.0, 17.0, 24.0, 27.0, 50.0, 92.0, 109.0, 199.0, 366.0, 721.0, 1673.0, 3668.0, 10462.0, 39419.0, 227914.0, 585868.0, 137671.0, 26701.0, 7812.0, 3025.0, 1254.0, 654.0, 325.0, 167.0, 82.0, 61.0, 43.0, 33.0, 20.0, 24.0, 15.0, 7.0, 5.0, 5.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04254150390625, -0.04114055633544922, -0.03973960876464844, -0.038338661193847656, -0.036937713623046875, -0.035536766052246094, -0.03413581848144531, -0.03273487091064453, -0.03133392333984375, -0.02993297576904297, -0.028532028198242188, -0.027131080627441406, -0.025730133056640625, -0.024329185485839844, -0.022928237915039062, -0.02152729034423828, -0.0201263427734375, -0.01872539520263672, -0.017324447631835938, -0.015923500061035156, -0.014522552490234375, -0.013121604919433594, -0.011720657348632812, -0.010319709777832031, -0.00891876220703125, -0.007517814636230469, -0.0061168670654296875, -0.004715919494628906, -0.003314971923828125, -0.0019140243530273438, -0.0005130767822265625, 0.0008878707885742188, 0.002288818359375, 0.0036897659301757812, 0.0050907135009765625, 0.006491661071777344, 0.007892608642578125, 0.009293556213378906, 0.010694503784179688, 0.012095451354980469, 0.01349639892578125, 0.014897346496582031, 0.016298294067382812, 0.017699241638183594, 0.019100189208984375, 0.020501136779785156, 0.021902084350585938, 0.02330303192138672, 0.0247039794921875, 0.02610492706298828, 0.027505874633789062, 0.028906822204589844, 0.030307769775390625, 0.031708717346191406, 0.03310966491699219, 0.03451061248779297, 0.03591156005859375, 0.03731250762939453, 0.03871345520019531, 0.040114402770996094, 0.041515350341796875, 0.042916297912597656, 0.04431724548339844, 0.04571819305419922, 0.047119140625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 6.0, 12.0, 11.0, 26.0, 22.0, 34.0, 41.0, 74.0, 74.0, 115.0, 100.0, 116.0, 96.0, 76.0, 60.0, 30.0, 25.0, 27.0, 13.0, 11.0, 6.0, 1.0, 6.0, 4.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0279159545898438e-05, -2.9056333005428314e-05, -2.783350646495819e-05, -2.6610679924488068e-05, -2.5387853384017944e-05, -2.416502684354782e-05, -2.2942200303077698e-05, -2.1719373762607574e-05, -2.049654722213745e-05, -1.9273720681667328e-05, -1.8050894141197205e-05, -1.682806760072708e-05, -1.5605241060256958e-05, -1.4382414519786835e-05, -1.3159587979316711e-05, -1.1936761438846588e-05, -1.0713934898376465e-05, -9.491108357906342e-06, -8.268281817436218e-06, -7.045455276966095e-06, -5.822628736495972e-06, -4.599802196025848e-06, -3.376975655555725e-06, -2.154149115085602e-06, -9.313225746154785e-07, 2.915039658546448e-07, 1.514330506324768e-06, 2.7371570467948914e-06, 3.959983587265015e-06, 5.182810127735138e-06, 6.405636668205261e-06, 7.6284632086753845e-06, 8.851289749145508e-06, 1.0074116289615631e-05, 1.1296942830085754e-05, 1.2519769370555878e-05, 1.3742595911026001e-05, 1.4965422451496124e-05, 1.6188248991966248e-05, 1.741107553243637e-05, 1.8633902072906494e-05, 1.9856728613376617e-05, 2.107955515384674e-05, 2.2302381694316864e-05, 2.3525208234786987e-05, 2.474803477525711e-05, 2.5970861315727234e-05, 2.7193687856197357e-05, 2.841651439666748e-05, 2.9639340937137604e-05, 3.086216747760773e-05, 3.208499401807785e-05, 3.3307820558547974e-05, 3.45306470990181e-05, 3.575347363948822e-05, 3.6976300179958344e-05, 3.819912672042847e-05, 3.942195326089859e-05, 4.064477980136871e-05, 4.186760634183884e-05, 4.309043288230896e-05, 4.431325942277908e-05, 4.5536085963249207e-05, 4.675891250371933e-05, 4.798173904418945e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 7.0, 11.0, 12.0, 30.0, 35.0, 41.0, 74.0, 107.0, 192.0, 310.0, 631.0, 1326.0, 3038.0, 8449.0, 29151.0, 171937.0, 625424.0, 165405.0, 28482.0, 8120.0, 3013.0, 1236.0, 662.0, 321.0, 206.0, 103.0, 73.0, 52.0, 30.0, 19.0, 11.0, 8.0, 8.0, 10.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.042205810546875, -0.04082155227661133, -0.039437294006347656, -0.038053035736083984, -0.03666877746582031, -0.03528451919555664, -0.03390026092529297, -0.0325160026550293, -0.031131744384765625, -0.029747486114501953, -0.02836322784423828, -0.02697896957397461, -0.025594711303710938, -0.024210453033447266, -0.022826194763183594, -0.021441936492919922, -0.02005767822265625, -0.018673419952392578, -0.017289161682128906, -0.015904903411865234, -0.014520645141601562, -0.01313638687133789, -0.011752128601074219, -0.010367870330810547, -0.008983612060546875, -0.007599353790283203, -0.006215095520019531, -0.004830837249755859, -0.0034465789794921875, -0.0020623207092285156, -0.0006780624389648438, 0.0007061958312988281, 0.0020904541015625, 0.003474712371826172, 0.004858970642089844, 0.006243228912353516, 0.0076274871826171875, 0.00901174545288086, 0.010396003723144531, 0.011780261993408203, 0.013164520263671875, 0.014548778533935547, 0.01593303680419922, 0.01731729507446289, 0.018701553344726562, 0.020085811614990234, 0.021470069885253906, 0.022854328155517578, 0.02423858642578125, 0.025622844696044922, 0.027007102966308594, 0.028391361236572266, 0.029775619506835938, 0.03115987777709961, 0.03254413604736328, 0.03392839431762695, 0.035312652587890625, 0.0366969108581543, 0.03808116912841797, 0.03946542739868164, 0.04084968566894531, 0.042233943939208984, 0.043618202209472656, 0.04500246047973633, 0.04638671875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 4.0, 7.0, 8.0, 13.0, 15.0, 26.0, 28.0, 29.0, 61.0, 71.0, 63.0, 90.0, 103.0, 77.0, 86.0, 72.0, 58.0, 53.0, 33.0, 19.0, 17.0, 16.0, 14.0, 7.0, 3.0, 3.0, 5.0, 6.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0300140380859375, -0.02901434898376465, -0.028014659881591797, -0.027014970779418945, -0.026015281677246094, -0.025015592575073242, -0.02401590347290039, -0.02301621437072754, -0.022016525268554688, -0.021016836166381836, -0.020017147064208984, -0.019017457962036133, -0.01801776885986328, -0.01701807975769043, -0.016018390655517578, -0.015018701553344727, -0.014019012451171875, -0.013019323348999023, -0.012019634246826172, -0.01101994514465332, -0.010020256042480469, -0.009020566940307617, -0.008020877838134766, -0.007021188735961914, -0.0060214996337890625, -0.005021810531616211, -0.004022121429443359, -0.003022432327270508, -0.0020227432250976562, -0.0010230541229248047, -2.3365020751953125e-05, 0.0009763240814208984, 0.00197601318359375, 0.0029757022857666016, 0.003975391387939453, 0.004975080490112305, 0.005974769592285156, 0.006974458694458008, 0.00797414779663086, 0.008973836898803711, 0.009973526000976562, 0.010973215103149414, 0.011972904205322266, 0.012972593307495117, 0.013972282409667969, 0.01497197151184082, 0.015971660614013672, 0.016971349716186523, 0.017971038818359375, 0.018970727920532227, 0.019970417022705078, 0.02097010612487793, 0.02196979522705078, 0.022969484329223633, 0.023969173431396484, 0.024968862533569336, 0.025968551635742188, 0.02696824073791504, 0.02796792984008789, 0.028967618942260742, 0.029967308044433594, 0.030966997146606445, 0.0319666862487793, 0.03296637535095215, 0.033966064453125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 18.0, 22.0, 26.0, 56.0, 72.0, 111.0, 151.0, 119.0, 141.0, 102.0, 71.0, 51.0, 22.0, 15.0, 7.0, 8.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3377261459827423, -0.3202654719352722, -0.3028047978878021, -0.28534412384033203, -0.26788341999053955, -0.25042277574539185, -0.23296207189559937, -0.21550139784812927, -0.19804072380065918, -0.1805800497531891, -0.163119375705719, -0.1456586867570877, -0.12819801270961761, -0.11073733866214752, -0.09327665716409683, -0.07581597566604614, -0.05835530161857605, -0.04089462384581566, -0.023433946073055267, -0.005973268300294876, 0.011487409472465515, 0.028948083519935608, 0.0464087650179863, 0.06386944651603699, 0.08133012056350708, 0.09879079461097717, 0.11625147610902786, 0.13371215760707855, 0.15117283165454865, 0.16863350570201874, 0.18609419465065002, 0.20355486869812012, 0.2210155725479126, 0.2384762465953827, 0.2559369206428528, 0.2733975946903229, 0.29085826873779297, 0.30831897258758545, 0.32577964663505554, 0.34324032068252563, 0.3607009947299957, 0.3781616687774658, 0.3956223428249359, 0.413083016872406, 0.4305437207221985, 0.4480043649673462, 0.46546506881713867, 0.48292574286460876, 0.5003864169120789, 0.5178471207618713, 0.535307765007019, 0.5527684688568115, 0.5702291131019592, 0.5876898169517517, 0.6051504611968994, 0.6226111650466919, 0.6400718688964844, 0.6575325727462769, 0.6749932169914246, 0.692453920841217, 0.7099145650863647, 0.7273752689361572, 0.7448359131813049, 0.7622966170310974, 0.7797572612762451]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 6.0, 2.0, 3.0, 4.0, 9.0, 8.0, 13.0, 8.0, 15.0, 21.0, 21.0, 29.0, 25.0, 32.0, 44.0, 38.0, 51.0, 51.0, 52.0, 61.0, 62.0, 45.0, 50.0, 45.0, 42.0, 39.0, 38.0, 25.0, 27.0, 22.0, 25.0, 16.0, 20.0, 16.0, 16.0, 9.0, 6.0, 5.0, 6.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43339109420776367, -0.4191264510154724, -0.40486177802085876, -0.3905971348285675, -0.37633249163627625, -0.3620678186416626, -0.34780317544937134, -0.3335385322570801, -0.3192738890647888, -0.30500924587249756, -0.2907445728778839, -0.27647992968559265, -0.2622152864933014, -0.24795062839984894, -0.23368597030639648, -0.21942132711410522, -0.20515665411949158, -0.19089199602603912, -0.17662735283374786, -0.1623626947402954, -0.14809805154800415, -0.1338333934545517, -0.11956873536109924, -0.10530408471822739, -0.09103943407535553, -0.07677478343248367, -0.06251013278961182, -0.04824547469615936, -0.033980824053287506, -0.01971617341041565, -0.005451515316963196, 0.008813135325908661, 0.023077785968780518, 0.037342436611652374, 0.05160709097981453, 0.06587174534797668, 0.08013639599084854, 0.0944010466337204, 0.10866570472717285, 0.12293035537004471, 0.13719500601291656, 0.15145966410636902, 0.16572430729866028, 0.17998896539211273, 0.19425362348556519, 0.20851826667785645, 0.2227829247713089, 0.23704758286476135, 0.2513122260570526, 0.26557686924934387, 0.2798415422439575, 0.2941061854362488, 0.30837082862854004, 0.3226354718208313, 0.33690014481544495, 0.3511647880077362, 0.36542946100234985, 0.3796941041946411, 0.39395877718925476, 0.408223420381546, 0.4224880635738373, 0.4367527365684509, 0.4510173797607422, 0.46528202295303345, 0.4795466661453247]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 5.0, 3.0, 7.0, 7.0, 15.0, 24.0, 41.0, 47.0, 72.0, 124.0, 182.0, 330.0, 465.0, 855.0, 1526.0, 2742.0, 5600.0, 12451.0, 32995.0, 116116.0, 2611960.0, 1256076.0, 100176.0, 29441.0, 11362.0, 5294.0, 2673.0, 1488.0, 842.0, 492.0, 309.0, 167.0, 113.0, 72.0, 78.0, 49.0, 31.0, 23.0, 8.0, 10.0, 6.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.07763671875, -0.07541561126708984, -0.07319450378417969, -0.07097339630126953, -0.06875228881835938, -0.06653118133544922, -0.06431007385253906, -0.062088966369628906, -0.05986785888671875, -0.057646751403808594, -0.05542564392089844, -0.05320453643798828, -0.050983428955078125, -0.04876232147216797, -0.04654121398925781, -0.044320106506347656, -0.0420989990234375, -0.039877891540527344, -0.03765678405761719, -0.03543567657470703, -0.033214569091796875, -0.03099346160888672, -0.028772354125976562, -0.026551246643066406, -0.02433013916015625, -0.022109031677246094, -0.019887924194335938, -0.01766681671142578, -0.015445709228515625, -0.013224601745605469, -0.011003494262695312, -0.008782386779785156, -0.006561279296875, -0.004340171813964844, -0.0021190643310546875, 0.00010204315185546875, 0.002323150634765625, 0.004544258117675781, 0.0067653656005859375, 0.008986473083496094, 0.01120758056640625, 0.013428688049316406, 0.015649795532226562, 0.01787090301513672, 0.020092010498046875, 0.02231311798095703, 0.024534225463867188, 0.026755332946777344, 0.0289764404296875, 0.031197547912597656, 0.03341865539550781, 0.03563976287841797, 0.037860870361328125, 0.04008197784423828, 0.04230308532714844, 0.044524192810058594, 0.04674530029296875, 0.048966407775878906, 0.05118751525878906, 0.05340862274169922, 0.055629730224609375, 0.05785083770751953, 0.06007194519042969, 0.062293052673339844, 0.06451416015625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 0.0, 1.0, 4.0, 6.0, 9.0, 4.0, 11.0, 9.0, 21.0, 17.0, 21.0, 28.0, 34.0, 39.0, 53.0, 58.0, 53.0, 51.0, 56.0, 57.0, 45.0, 71.0, 52.0, 58.0, 41.0, 41.0, 33.0, 29.0, 21.0, 18.0, 16.0, 4.0, 9.0, 8.0, 11.0, 2.0, 5.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.01776123046875, -0.017196178436279297, -0.016631126403808594, -0.01606607437133789, -0.015501022338867188, -0.014935970306396484, -0.014370918273925781, -0.013805866241455078, -0.013240814208984375, -0.012675762176513672, -0.012110710144042969, -0.011545658111572266, -0.010980606079101562, -0.01041555404663086, -0.009850502014160156, -0.009285449981689453, -0.00872039794921875, -0.008155345916748047, -0.007590293884277344, -0.007025241851806641, -0.0064601898193359375, -0.005895137786865234, -0.005330085754394531, -0.004765033721923828, -0.004199981689453125, -0.003634929656982422, -0.0030698776245117188, -0.0025048255920410156, -0.0019397735595703125, -0.0013747215270996094, -0.0008096694946289062, -0.0002446174621582031, 0.0003204345703125, 0.0008854866027832031, 0.0014505386352539062, 0.0020155906677246094, 0.0025806427001953125, 0.0031456947326660156, 0.0037107467651367188, 0.004275798797607422, 0.004840850830078125, 0.005405902862548828, 0.005970954895019531, 0.006536006927490234, 0.0071010589599609375, 0.007666110992431641, 0.008231163024902344, 0.008796215057373047, 0.00936126708984375, 0.009926319122314453, 0.010491371154785156, 0.01105642318725586, 0.011621475219726562, 0.012186527252197266, 0.012751579284667969, 0.013316631317138672, 0.013881683349609375, 0.014446735382080078, 0.015011787414550781, 0.015576839447021484, 0.016141891479492188, 0.01670694351196289, 0.017271995544433594, 0.017837047576904297, 0.018402099609375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 4.0, 10.0, 11.0, 18.0, 29.0, 70.0, 95.0, 197.0, 394.0, 828.0, 1912.0, 4823.0, 13501.0, 46696.0, 278781.0, 3484700.0, 293013.0, 47539.0, 13437.0, 4719.0, 1810.0, 833.0, 405.0, 209.0, 107.0, 56.0, 21.0, 21.0, 9.0, 13.0, 5.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.1243896484375, -0.12139320373535156, -0.11839675903320312, -0.11540031433105469, -0.11240386962890625, -0.10940742492675781, -0.10641098022460938, -0.10341453552246094, -0.1004180908203125, -0.09742164611816406, -0.09442520141601562, -0.09142875671386719, -0.08843231201171875, -0.08543586730957031, -0.08243942260742188, -0.07944297790527344, -0.076446533203125, -0.07345008850097656, -0.07045364379882812, -0.06745719909667969, -0.06446075439453125, -0.06146430969238281, -0.058467864990234375, -0.05547142028808594, -0.0524749755859375, -0.04947853088378906, -0.046482086181640625, -0.04348564147949219, -0.04048919677734375, -0.03749275207519531, -0.034496307373046875, -0.03149986267089844, -0.02850341796875, -0.025506973266601562, -0.022510528564453125, -0.019514083862304688, -0.01651763916015625, -0.013521194458007812, -0.010524749755859375, -0.0075283050537109375, -0.0045318603515625, -0.0015354156494140625, 0.001461029052734375, 0.0044574737548828125, 0.00745391845703125, 0.010450363159179688, 0.013446807861328125, 0.016443252563476562, 0.019439697265625, 0.022436141967773438, 0.025432586669921875, 0.028429031372070312, 0.03142547607421875, 0.03442192077636719, 0.037418365478515625, 0.04041481018066406, 0.0434112548828125, 0.04640769958496094, 0.049404144287109375, 0.05240058898925781, 0.05539703369140625, 0.05839347839355469, 0.061389923095703125, 0.06438636779785156, 0.0673828125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 1.0, 9.0, 7.0, 11.0, 9.0, 10.0, 22.0, 25.0, 25.0, 39.0, 69.0, 86.0, 166.0, 275.0, 608.0, 1476.0, 545.0, 268.0, 140.0, 84.0, 56.0, 32.0, 34.0, 24.0, 18.0, 10.0, 4.0, 3.0, 12.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0379638671875, -0.03682994842529297, -0.03569602966308594, -0.034562110900878906, -0.033428192138671875, -0.032294273376464844, -0.031160354614257812, -0.03002643585205078, -0.02889251708984375, -0.02775859832763672, -0.026624679565429688, -0.025490760803222656, -0.024356842041015625, -0.023222923278808594, -0.022089004516601562, -0.02095508575439453, -0.0198211669921875, -0.01868724822998047, -0.017553329467773438, -0.016419410705566406, -0.015285491943359375, -0.014151573181152344, -0.013017654418945312, -0.011883735656738281, -0.01074981689453125, -0.009615898132324219, -0.008481979370117188, -0.007348060607910156, -0.006214141845703125, -0.005080223083496094, -0.0039463043212890625, -0.0028123855590820312, -0.001678466796875, -0.0005445480346679688, 0.0005893707275390625, 0.0017232894897460938, 0.002857208251953125, 0.003991127014160156, 0.0051250457763671875, 0.006258964538574219, 0.00739288330078125, 0.008526802062988281, 0.009660720825195312, 0.010794639587402344, 0.011928558349609375, 0.013062477111816406, 0.014196395874023438, 0.015330314636230469, 0.0164642333984375, 0.01759815216064453, 0.018732070922851562, 0.019865989685058594, 0.020999908447265625, 0.022133827209472656, 0.023267745971679688, 0.02440166473388672, 0.02553558349609375, 0.02666950225830078, 0.027803421020507812, 0.028937339782714844, 0.030071258544921875, 0.031205177307128906, 0.03233909606933594, 0.03347301483154297, 0.03460693359375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 14.0, 64.0, 272.0, 414.0, 202.0, 30.0, 11.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2561997175216675, -1.2291288375854492, -1.202057957649231, -1.1749869585037231, -1.1479160785675049, -1.1208451986312866, -1.0937743186950684, -1.0667033195495605, -1.0396324396133423, -1.012561559677124, -0.985490620136261, -0.9584197402000427, -0.9313488006591797, -0.9042779207229614, -0.8772069811820984, -0.8501361012458801, -0.8230651617050171, -0.7959942817687988, -0.7689233422279358, -0.7418524622917175, -0.7147815227508545, -0.6877106428146362, -0.6606397032737732, -0.6335688233375549, -0.6064979434013367, -0.5794270634651184, -0.5523561239242554, -0.5252852439880371, -0.4982143044471741, -0.4711434245109558, -0.4440724849700928, -0.4170016050338745, -0.3899306654930115, -0.3628597557544708, -0.3357888460159302, -0.3087179362773895, -0.2816470265388489, -0.2545761466026306, -0.22750522196292877, -0.20043431222438812, -0.17336340248584747, -0.14629249274730682, -0.11922158300876617, -0.09215068072080612, -0.06507977098226547, -0.03800886869430542, -0.01093795895576477, 0.01613295078277588, 0.04320386052131653, 0.07027477025985718, 0.09734567999839783, 0.12441658228635788, 0.15148749947547913, 0.17855839431285858, 0.20562930405139923, 0.23270021378993988, 0.25977110862731934, 0.28684201836586, 0.31391292810440063, 0.3409838378429413, 0.36805474758148193, 0.3951256275177002, 0.42219656705856323, 0.4492674469947815, 0.47633838653564453]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 9.0, 2.0, 0.0, 3.0, 5.0, 9.0, 5.0, 6.0, 4.0, 16.0, 13.0, 13.0, 12.0, 22.0, 12.0, 21.0, 44.0, 33.0, 41.0, 33.0, 29.0, 32.0, 49.0, 36.0, 66.0, 29.0, 54.0, 42.0, 47.0, 48.0, 35.0, 29.0, 36.0, 22.0, 13.0, 18.0, 21.0, 26.0, 15.0, 13.0, 13.0, 8.0, 8.0, 4.0, 6.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.12559539079666138, -0.12173214554786682, -0.11786890029907227, -0.11400565505027771, -0.11014240980148315, -0.1062791645526886, -0.10241591930389404, -0.09855267405509949, -0.09468942880630493, -0.09082618355751038, -0.08696293830871582, -0.08309969305992126, -0.07923644781112671, -0.07537320256233215, -0.0715099573135376, -0.06764671206474304, -0.06378346681594849, -0.05992022156715393, -0.056056976318359375, -0.05219373106956482, -0.048330485820770264, -0.04446724057197571, -0.04060399532318115, -0.0367407500743866, -0.03287750482559204, -0.029014259576797485, -0.02515101432800293, -0.021287769079208374, -0.01742452383041382, -0.013561278581619263, -0.009698033332824707, -0.005834788084030151, -0.0019715428352355957, 0.00189170241355896, 0.005754947662353516, 0.009618192911148071, 0.013481438159942627, 0.017344683408737183, 0.02120792865753174, 0.025071173906326294, 0.02893441915512085, 0.032797664403915405, 0.03666090965270996, 0.04052415490150452, 0.04438740015029907, 0.04825064539909363, 0.052113890647888184, 0.05597713589668274, 0.059840381145477295, 0.06370362639427185, 0.0675668716430664, 0.07143011689186096, 0.07529336214065552, 0.07915660738945007, 0.08301985263824463, 0.08688309788703918, 0.09074634313583374, 0.0946095883846283, 0.09847283363342285, 0.10233607888221741, 0.10619932413101196, 0.11006256937980652, 0.11392581462860107, 0.11778905987739563, 0.12165230512619019]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 10.0, 12.0, 20.0, 20.0, 22.0, 50.0, 77.0, 133.0, 213.0, 389.0, 698.0, 1182.0, 2302.0, 4781.0, 9938.0, 22600.0, 54874.0, 144223.0, 384357.0, 262352.0, 92685.0, 37247.0, 15795.0, 7141.0, 3549.0, 1694.0, 881.0, 501.0, 293.0, 197.0, 96.0, 85.0, 45.0, 26.0, 20.0, 12.0, 8.0, 6.0, 6.0, 3.0, 2.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0833740234375, -0.08090591430664062, -0.07843780517578125, -0.07596969604492188, -0.0735015869140625, -0.07103347778320312, -0.06856536865234375, -0.06609725952148438, -0.063629150390625, -0.061161041259765625, -0.05869293212890625, -0.056224822998046875, -0.0537567138671875, -0.051288604736328125, -0.04882049560546875, -0.046352386474609375, -0.04388427734375, -0.041416168212890625, -0.03894805908203125, -0.036479949951171875, -0.0340118408203125, -0.031543731689453125, -0.02907562255859375, -0.026607513427734375, -0.024139404296875, -0.021671295166015625, -0.01920318603515625, -0.016735076904296875, -0.0142669677734375, -0.011798858642578125, -0.00933074951171875, -0.006862640380859375, -0.00439453125, -0.001926422119140625, 0.00054168701171875, 0.003009796142578125, 0.0054779052734375, 0.007946014404296875, 0.01041412353515625, 0.012882232666015625, 0.015350341796875, 0.017818450927734375, 0.02028656005859375, 0.022754669189453125, 0.0252227783203125, 0.027690887451171875, 0.03015899658203125, 0.032627105712890625, 0.03509521484375, 0.037563323974609375, 0.04003143310546875, 0.042499542236328125, 0.0449676513671875, 0.047435760498046875, 0.04990386962890625, 0.052371978759765625, 0.054840087890625, 0.057308197021484375, 0.05977630615234375, 0.062244415283203125, 0.0647125244140625, 0.06718063354492188, 0.06964874267578125, 0.07211685180664062, 0.0745849609375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 0.0, 7.0, 2.0, 6.0, 8.0, 15.0, 8.0, 9.0, 27.0, 16.0, 30.0, 45.0, 36.0, 50.0, 59.0, 54.0, 57.0, 67.0, 62.0, 74.0, 69.0, 46.0, 46.0, 32.0, 37.0, 33.0, 15.0, 23.0, 19.0, 16.0, 10.0, 5.0, 6.0, 6.0, 3.0, 1.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0177764892578125, -0.01718282699584961, -0.01658916473388672, -0.015995502471923828, -0.015401840209960938, -0.014808177947998047, -0.014214515686035156, -0.013620853424072266, -0.013027191162109375, -0.012433528900146484, -0.011839866638183594, -0.011246204376220703, -0.010652542114257812, -0.010058879852294922, -0.009465217590332031, -0.00887155532836914, -0.00827789306640625, -0.007684230804443359, -0.007090568542480469, -0.006496906280517578, -0.0059032440185546875, -0.005309581756591797, -0.004715919494628906, -0.004122257232666016, -0.003528594970703125, -0.0029349327087402344, -0.0023412704467773438, -0.0017476081848144531, -0.0011539459228515625, -0.0005602836608886719, 3.337860107421875e-05, 0.0006270408630371094, 0.001220703125, 0.0018143653869628906, 0.0024080276489257812, 0.003001689910888672, 0.0035953521728515625, 0.004189014434814453, 0.004782676696777344, 0.005376338958740234, 0.005970001220703125, 0.006563663482666016, 0.007157325744628906, 0.007750988006591797, 0.008344650268554688, 0.008938312530517578, 0.009531974792480469, 0.01012563705444336, 0.01071929931640625, 0.01131296157836914, 0.011906623840332031, 0.012500286102294922, 0.013093948364257812, 0.013687610626220703, 0.014281272888183594, 0.014874935150146484, 0.015468597412109375, 0.016062259674072266, 0.016655921936035156, 0.017249584197998047, 0.017843246459960938, 0.018436908721923828, 0.01903057098388672, 0.01962423324584961, 0.0202178955078125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 5.0, 4.0, 5.0, 10.0, 14.0, 28.0, 35.0, 46.0, 72.0, 108.0, 208.0, 301.0, 496.0, 907.0, 1654.0, 3553.0, 7945.0, 20558.0, 60520.0, 186049.0, 425891.0, 225195.0, 72996.0, 24486.0, 9325.0, 3903.0, 1896.0, 927.0, 504.0, 323.0, 206.0, 118.0, 88.0, 55.0, 36.0, 24.0, 21.0, 16.0, 12.0, 6.0, 4.0, 6.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.070068359375, -0.06785011291503906, -0.06563186645507812, -0.06341361999511719, -0.06119537353515625, -0.05897712707519531, -0.056758880615234375, -0.05454063415527344, -0.0523223876953125, -0.05010414123535156, -0.047885894775390625, -0.04566764831542969, -0.04344940185546875, -0.04123115539550781, -0.039012908935546875, -0.03679466247558594, -0.034576416015625, -0.03235816955566406, -0.030139923095703125, -0.027921676635742188, -0.02570343017578125, -0.023485183715820312, -0.021266937255859375, -0.019048690795898438, -0.0168304443359375, -0.014612197875976562, -0.012393951416015625, -0.010175704956054688, -0.00795745849609375, -0.0057392120361328125, -0.003520965576171875, -0.0013027191162109375, 0.00091552734375, 0.0031337738037109375, 0.005352020263671875, 0.0075702667236328125, 0.00978851318359375, 0.012006759643554688, 0.014225006103515625, 0.016443252563476562, 0.0186614990234375, 0.020879745483398438, 0.023097991943359375, 0.025316238403320312, 0.02753448486328125, 0.029752731323242188, 0.031970977783203125, 0.03418922424316406, 0.036407470703125, 0.03862571716308594, 0.040843963623046875, 0.04306221008300781, 0.04528045654296875, 0.04749870300292969, 0.049716949462890625, 0.05193519592285156, 0.0541534423828125, 0.05637168884277344, 0.058589935302734375, 0.06080818176269531, 0.06302642822265625, 0.06524467468261719, 0.06746292114257812, 0.06968116760253906, 0.0718994140625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 0.0, 4.0, 6.0, 7.0, 8.0, 8.0, 17.0, 14.0, 15.0, 23.0, 16.0, 24.0, 27.0, 28.0, 39.0, 40.0, 33.0, 39.0, 50.0, 41.0, 44.0, 33.0, 48.0, 48.0, 42.0, 30.0, 37.0, 41.0, 27.0, 31.0, 34.0, 24.0, 22.0, 19.0, 14.0, 12.0, 10.0, 5.0, 8.0, 8.0, 3.0, 8.0, 7.0, 0.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06646728515625, -0.06432056427001953, -0.06217384338378906, -0.060027122497558594, -0.057880401611328125, -0.055733680725097656, -0.05358695983886719, -0.05144023895263672, -0.04929351806640625, -0.04714679718017578, -0.04500007629394531, -0.042853355407714844, -0.040706634521484375, -0.038559913635253906, -0.03641319274902344, -0.03426647186279297, -0.0321197509765625, -0.02997303009033203, -0.027826309204101562, -0.025679588317871094, -0.023532867431640625, -0.021386146545410156, -0.019239425659179688, -0.01709270477294922, -0.01494598388671875, -0.012799263000488281, -0.010652542114257812, -0.008505821228027344, -0.006359100341796875, -0.004212379455566406, -0.0020656585693359375, 8.106231689453125e-05, 0.002227783203125, 0.004374504089355469, 0.0065212249755859375, 0.008667945861816406, 0.010814666748046875, 0.012961387634277344, 0.015108108520507812, 0.01725482940673828, 0.01940155029296875, 0.02154827117919922, 0.023694992065429688, 0.025841712951660156, 0.027988433837890625, 0.030135154724121094, 0.03228187561035156, 0.03442859649658203, 0.0365753173828125, 0.03872203826904297, 0.04086875915527344, 0.043015480041503906, 0.045162200927734375, 0.047308921813964844, 0.04945564270019531, 0.05160236358642578, 0.05374908447265625, 0.05589580535888672, 0.05804252624511719, 0.060189247131347656, 0.062335968017578125, 0.0644826889038086, 0.06662940979003906, 0.06877613067626953, 0.0709228515625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 7.0, 6.0, 8.0, 12.0, 15.0, 19.0, 41.0, 59.0, 131.0, 258.0, 527.0, 1017.0, 2567.0, 6846.0, 22209.0, 94465.0, 536496.0, 307505.0, 53914.0, 14344.0, 4678.0, 1846.0, 749.0, 401.0, 195.0, 101.0, 61.0, 34.0, 20.0, 12.0, 6.0, 8.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061614990234375, -0.05954885482788086, -0.05748271942138672, -0.05541658401489258, -0.05335044860839844, -0.0512843132019043, -0.049218177795410156, -0.047152042388916016, -0.045085906982421875, -0.043019771575927734, -0.040953636169433594, -0.03888750076293945, -0.03682136535644531, -0.03475522994995117, -0.03268909454345703, -0.03062295913696289, -0.02855682373046875, -0.02649068832397461, -0.02442455291748047, -0.022358417510986328, -0.020292282104492188, -0.018226146697998047, -0.016160011291503906, -0.014093875885009766, -0.012027740478515625, -0.009961605072021484, -0.007895469665527344, -0.005829334259033203, -0.0037631988525390625, -0.0016970634460449219, 0.00036907196044921875, 0.0024352073669433594, 0.0045013427734375, 0.006567478179931641, 0.008633613586425781, 0.010699748992919922, 0.012765884399414062, 0.014832019805908203, 0.016898155212402344, 0.018964290618896484, 0.021030426025390625, 0.023096561431884766, 0.025162696838378906, 0.027228832244873047, 0.029294967651367188, 0.03136110305786133, 0.03342723846435547, 0.03549337387084961, 0.03755950927734375, 0.03962564468383789, 0.04169178009033203, 0.04375791549682617, 0.04582405090332031, 0.04789018630981445, 0.049956321716308594, 0.052022457122802734, 0.054088592529296875, 0.056154727935791016, 0.058220863342285156, 0.0602869987487793, 0.06235313415527344, 0.06441926956176758, 0.06648540496826172, 0.06855154037475586, 0.07061767578125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 4.0, 11.0, 22.0, 26.0, 43.0, 59.0, 81.0, 113.0, 151.0, 146.0, 129.0, 77.0, 48.0, 39.0, 28.0, 10.0, 8.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5418739318847656e-05, -4.372932016849518e-05, -4.20399010181427e-05, -4.035048186779022e-05, -3.8661062717437744e-05, -3.6971643567085266e-05, -3.528222441673279e-05, -3.359280526638031e-05, -3.190338611602783e-05, -3.0213966965675354e-05, -2.8524547815322876e-05, -2.6835128664970398e-05, -2.514570951461792e-05, -2.3456290364265442e-05, -2.1766871213912964e-05, -2.0077452063560486e-05, -1.8388032913208008e-05, -1.669861376285553e-05, -1.5009194612503052e-05, -1.3319775462150574e-05, -1.1630356311798096e-05, -9.940937161445618e-06, -8.25151801109314e-06, -6.562098860740662e-06, -4.872679710388184e-06, -3.1832605600357056e-06, -1.4938414096832275e-06, 1.955777406692505e-07, 1.8849968910217285e-06, 3.5744160413742065e-06, 5.2638351917266846e-06, 6.953254342079163e-06, 8.64267349243164e-06, 1.0332092642784119e-05, 1.2021511793136597e-05, 1.3710930943489075e-05, 1.5400350093841553e-05, 1.708976924419403e-05, 1.877918839454651e-05, 2.0468607544898987e-05, 2.2158026695251465e-05, 2.3847445845603943e-05, 2.553686499595642e-05, 2.72262841463089e-05, 2.8915703296661377e-05, 3.0605122447013855e-05, 3.229454159736633e-05, 3.398396074771881e-05, 3.567337989807129e-05, 3.736279904842377e-05, 3.9052218198776245e-05, 4.074163734912872e-05, 4.24310564994812e-05, 4.412047564983368e-05, 4.580989480018616e-05, 4.7499313950538635e-05, 4.918873310089111e-05, 5.087815225124359e-05, 5.256757140159607e-05, 5.425699055194855e-05, 5.5946409702301025e-05, 5.7635828852653503e-05, 5.932524800300598e-05, 6.101466715335846e-05, 6.270408630371094e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 1.0, 8.0, 12.0, 12.0, 21.0, 25.0, 39.0, 81.0, 123.0, 195.0, 306.0, 572.0, 1096.0, 2334.0, 5581.0, 15525.0, 51111.0, 221162.0, 549411.0, 144456.0, 36221.0, 11901.0, 4314.0, 1894.0, 913.0, 486.0, 275.0, 182.0, 96.0, 70.0, 48.0, 25.0, 19.0, 13.0, 8.0, 5.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.056732177734375, -0.05512809753417969, -0.053524017333984375, -0.05191993713378906, -0.05031585693359375, -0.04871177673339844, -0.047107696533203125, -0.04550361633300781, -0.0438995361328125, -0.04229545593261719, -0.040691375732421875, -0.03908729553222656, -0.03748321533203125, -0.03587913513183594, -0.034275054931640625, -0.03267097473144531, -0.03106689453125, -0.029462814331054688, -0.027858734130859375, -0.026254653930664062, -0.02465057373046875, -0.023046493530273438, -0.021442413330078125, -0.019838333129882812, -0.0182342529296875, -0.016630172729492188, -0.015026092529296875, -0.013422012329101562, -0.01181793212890625, -0.010213851928710938, -0.008609771728515625, -0.0070056915283203125, -0.005401611328125, -0.0037975311279296875, -0.002193450927734375, -0.0005893707275390625, 0.00101470947265625, 0.0026187896728515625, 0.004222869873046875, 0.0058269500732421875, 0.0074310302734375, 0.009035110473632812, 0.010639190673828125, 0.012243270874023438, 0.01384735107421875, 0.015451431274414062, 0.017055511474609375, 0.018659591674804688, 0.020263671875, 0.021867752075195312, 0.023471832275390625, 0.025075912475585938, 0.02667999267578125, 0.028284072875976562, 0.029888153076171875, 0.03149223327636719, 0.0330963134765625, 0.03470039367675781, 0.036304473876953125, 0.03790855407714844, 0.03951263427734375, 0.04111671447753906, 0.042720794677734375, 0.04432487487792969, 0.045928955078125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 8.0, 1.0, 4.0, 8.0, 4.0, 10.0, 14.0, 22.0, 18.0, 22.0, 32.0, 34.0, 42.0, 51.0, 92.0, 97.0, 96.0, 87.0, 76.0, 61.0, 43.0, 33.0, 39.0, 22.0, 20.0, 22.0, 15.0, 12.0, 3.0, 4.0, 4.0, 4.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.042999267578125, -0.041748046875, -0.040496826171875, -0.03924560546875, -0.037994384765625, -0.0367431640625, -0.035491943359375, -0.03424072265625, -0.032989501953125, -0.03173828125, -0.030487060546875, -0.02923583984375, -0.027984619140625, -0.0267333984375, -0.025482177734375, -0.02423095703125, -0.022979736328125, -0.021728515625, -0.020477294921875, -0.01922607421875, -0.017974853515625, -0.0167236328125, -0.015472412109375, -0.01422119140625, -0.012969970703125, -0.01171875, -0.010467529296875, -0.00921630859375, -0.007965087890625, -0.0067138671875, -0.005462646484375, -0.00421142578125, -0.002960205078125, -0.001708984375, -0.000457763671875, 0.00079345703125, 0.002044677734375, 0.0032958984375, 0.004547119140625, 0.00579833984375, 0.007049560546875, 0.00830078125, 0.009552001953125, 0.01080322265625, 0.012054443359375, 0.0133056640625, 0.014556884765625, 0.01580810546875, 0.017059326171875, 0.018310546875, 0.019561767578125, 0.02081298828125, 0.022064208984375, 0.0233154296875, 0.024566650390625, 0.02581787109375, 0.027069091796875, 0.0283203125, 0.029571533203125, 0.03082275390625, 0.032073974609375, 0.0333251953125, 0.034576416015625, 0.03582763671875, 0.037078857421875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 9.0, 42.0, 72.0, 138.0, 179.0, 187.0, 177.0, 98.0, 52.0, 23.0, 12.0, 8.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6950697302818298, -0.6665341258049011, -0.6379985213279724, -0.6094629764556885, -0.5809273719787598, -0.552391767501831, -0.5238561630249023, -0.49532055854797363, -0.4667849838733673, -0.4382493793964386, -0.4097138047218323, -0.38117820024490356, -0.35264259576797485, -0.32410702109336853, -0.2955714166164398, -0.2670358419418335, -0.23850023746490479, -0.20996464788913727, -0.18142905831336975, -0.15289345383644104, -0.12435786426067352, -0.095822274684906, -0.0672866702079773, -0.03875108063220978, -0.01021549105644226, 0.018320102244615555, 0.04685569554567337, 0.07539129257202148, 0.103926882147789, 0.13246247172355652, 0.16099807620048523, 0.18953366577625275, 0.21806931495666504, 0.24660490453243256, 0.2751404941082001, 0.3036760985851288, 0.3322116732597351, 0.3607472777366638, 0.38928288221359253, 0.41781848669052124, 0.44635406136512756, 0.4748896658420563, 0.5034252405166626, 0.5319608449935913, 0.56049644947052, 0.5890320539474487, 0.6175676584243774, 0.6461032032966614, 0.6746388077735901, 0.7031744122505188, 0.7317100167274475, 0.7602455615997314, 0.7887811660766602, 0.8173167705535889, 0.8458523750305176, 0.8743879795074463, 0.902923583984375, 0.9314591884613037, 0.9599947929382324, 0.9885303974151611, 1.0170660018920898, 1.0456016063690186, 1.0741372108459473, 1.1026726961135864, 1.1312083005905151]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 0.0, 1.0, 6.0, 6.0, 3.0, 6.0, 17.0, 19.0, 17.0, 19.0, 30.0, 30.0, 32.0, 39.0, 33.0, 47.0, 39.0, 52.0, 46.0, 60.0, 55.0, 50.0, 48.0, 57.0, 48.0, 38.0, 43.0, 36.0, 24.0, 27.0, 16.0, 15.0, 11.0, 10.0, 3.0, 8.0, 4.0, 7.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43116235733032227, -0.4161853790283203, -0.40120840072631836, -0.3862314224243164, -0.37125447392463684, -0.3562774956226349, -0.34130051732063293, -0.326323539018631, -0.3113465905189514, -0.29636961221694946, -0.2813926339149475, -0.26641565561294556, -0.251438707113266, -0.23646172881126404, -0.22148475050926208, -0.20650777220726013, -0.19153079390525818, -0.17655381560325623, -0.16157685220241547, -0.1465998739004135, -0.13162291049957275, -0.1166459321975708, -0.10166895389556885, -0.08669198304414749, -0.07171501219272614, -0.05673804134130478, -0.041761066764593124, -0.02678409218788147, -0.011807121336460114, 0.0031698495149612427, 0.018146827816963196, 0.03312379866838455, 0.04810076951980591, 0.06307774037122726, 0.07805471122264862, 0.09303168952465057, 0.10800866037607193, 0.12298563122749329, 0.13796260952949524, 0.1529395878314972, 0.16791655123233795, 0.1828935295343399, 0.19787049293518066, 0.21284747123718262, 0.22782444953918457, 0.24280141294002533, 0.2577784061431885, 0.27275535464286804, 0.28773233294487, 0.30270931124687195, 0.3176862895488739, 0.33266323804855347, 0.3476402163505554, 0.3626171946525574, 0.3775941729545593, 0.3925711512565613, 0.40754812955856323, 0.4225251078605652, 0.43750208616256714, 0.4524790644645691, 0.46745601296424866, 0.4824329912662506, 0.49740996956825256, 0.5123869180679321, 0.5273638963699341]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 5.0, 8.0, 8.0, 16.0, 26.0, 37.0, 53.0, 108.0, 158.0, 234.0, 397.0, 677.0, 1250.0, 2270.0, 4771.0, 11174.0, 29903.0, 112532.0, 3425749.0, 504155.0, 64729.0, 19988.0, 7844.0, 3713.0, 1841.0, 1062.0, 571.0, 362.0, 215.0, 137.0, 111.0, 58.0, 40.0, 28.0, 12.0, 9.0, 9.0, 6.0, 3.0, 5.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07421875, -0.07145118713378906, -0.06868362426757812, -0.06591606140136719, -0.06314849853515625, -0.06038093566894531, -0.057613372802734375, -0.05484580993652344, -0.0520782470703125, -0.04931068420410156, -0.046543121337890625, -0.04377555847167969, -0.04100799560546875, -0.03824043273925781, -0.035472869873046875, -0.03270530700683594, -0.029937744140625, -0.027170181274414062, -0.024402618408203125, -0.021635055541992188, -0.01886749267578125, -0.016099929809570312, -0.013332366943359375, -0.010564804077148438, -0.0077972412109375, -0.0050296783447265625, -0.002262115478515625, 0.0005054473876953125, 0.00327301025390625, 0.0060405731201171875, 0.008808135986328125, 0.011575698852539062, 0.01434326171875, 0.017110824584960938, 0.019878387451171875, 0.022645950317382812, 0.02541351318359375, 0.028181076049804688, 0.030948638916015625, 0.03371620178222656, 0.0364837646484375, 0.03925132751464844, 0.042018890380859375, 0.04478645324707031, 0.04755401611328125, 0.05032157897949219, 0.053089141845703125, 0.05585670471191406, 0.058624267578125, 0.06139183044433594, 0.06415939331054688, 0.06692695617675781, 0.06969451904296875, 0.07246208190917969, 0.07522964477539062, 0.07799720764160156, 0.0807647705078125, 0.08353233337402344, 0.08629989624023438, 0.08906745910644531, 0.09183502197265625, 0.09460258483886719, 0.09737014770507812, 0.10013771057128906, 0.1029052734375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 10.0, 4.0, 9.0, 9.0, 11.0, 18.0, 25.0, 43.0, 38.0, 48.0, 67.0, 57.0, 78.0, 53.0, 69.0, 72.0, 65.0, 64.0, 52.0, 44.0, 44.0, 29.0, 14.0, 32.0, 10.0, 11.0, 7.0, 2.0, 4.0, 6.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0169219970703125, -0.016196012496948242, -0.015470027923583984, -0.014744043350219727, -0.014018058776855469, -0.013292074203491211, -0.012566089630126953, -0.011840105056762695, -0.011114120483398438, -0.01038813591003418, -0.009662151336669922, -0.008936166763305664, -0.008210182189941406, -0.0074841976165771484, -0.006758213043212891, -0.006032228469848633, -0.005306243896484375, -0.004580259323120117, -0.0038542747497558594, -0.0031282901763916016, -0.0024023056030273438, -0.001676321029663086, -0.0009503364562988281, -0.0002243518829345703, 0.0005016326904296875, 0.0012276172637939453, 0.001953601837158203, 0.002679586410522461, 0.0034055709838867188, 0.0041315555572509766, 0.004857540130615234, 0.005583524703979492, 0.00630950927734375, 0.007035493850708008, 0.007761478424072266, 0.008487462997436523, 0.009213447570800781, 0.009939432144165039, 0.010665416717529297, 0.011391401290893555, 0.012117385864257812, 0.01284337043762207, 0.013569355010986328, 0.014295339584350586, 0.015021324157714844, 0.0157473087310791, 0.01647329330444336, 0.017199277877807617, 0.017925262451171875, 0.018651247024536133, 0.01937723159790039, 0.02010321617126465, 0.020829200744628906, 0.021555185317993164, 0.022281169891357422, 0.02300715446472168, 0.023733139038085938, 0.024459123611450195, 0.025185108184814453, 0.02591109275817871, 0.02663707733154297, 0.027363061904907227, 0.028089046478271484, 0.028815031051635742, 0.029541015625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 5.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 6.0, 13.0, 12.0, 23.0, 44.0, 46.0, 80.0, 100.0, 162.0, 235.0, 337.0, 501.0, 725.0, 1105.0, 1742.0, 2813.0, 4485.0, 7744.0, 13434.0, 25155.0, 52981.0, 135021.0, 644599.0, 2866360.0, 266990.0, 85334.0, 37628.0, 19226.0, 10745.0, 6177.0, 3777.0, 2313.0, 1460.0, 972.0, 580.0, 459.0, 287.0, 175.0, 111.0, 112.0, 80.0, 48.0, 20.0, 27.0, 16.0, 8.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.053863525390625, -0.05214071273803711, -0.05041790008544922, -0.04869508743286133, -0.04697227478027344, -0.04524946212768555, -0.043526649475097656, -0.041803836822509766, -0.040081024169921875, -0.038358211517333984, -0.036635398864746094, -0.0349125862121582, -0.03318977355957031, -0.03146696090698242, -0.02974414825439453, -0.02802133560180664, -0.02629852294921875, -0.02457571029663086, -0.02285289764404297, -0.021130084991455078, -0.019407272338867188, -0.017684459686279297, -0.015961647033691406, -0.014238834381103516, -0.012516021728515625, -0.010793209075927734, -0.009070396423339844, -0.007347583770751953, -0.0056247711181640625, -0.003901958465576172, -0.0021791458129882812, -0.0004563331604003906, 0.0012664794921875, 0.0029892921447753906, 0.004712104797363281, 0.006434917449951172, 0.008157730102539062, 0.009880542755126953, 0.011603355407714844, 0.013326168060302734, 0.015048980712890625, 0.016771793365478516, 0.018494606018066406, 0.020217418670654297, 0.021940231323242188, 0.023663043975830078, 0.02538585662841797, 0.02710866928100586, 0.02883148193359375, 0.03055429458618164, 0.03227710723876953, 0.03399991989135742, 0.03572273254394531, 0.0374455451965332, 0.039168357849121094, 0.040891170501708984, 0.042613983154296875, 0.044336795806884766, 0.046059608459472656, 0.04778242111206055, 0.04950523376464844, 0.05122804641723633, 0.05295085906982422, 0.05467367172241211, 0.056396484375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 6.0, 8.0, 10.0, 8.0, 17.0, 21.0, 19.0, 38.0, 64.0, 85.0, 168.0, 361.0, 1660.0, 849.0, 295.0, 138.0, 96.0, 56.0, 43.0, 32.0, 26.0, 20.0, 18.0, 9.0, 12.0, 5.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034942626953125, -0.03368806838989258, -0.032433509826660156, -0.031178951263427734, -0.029924392700195312, -0.02866983413696289, -0.02741527557373047, -0.026160717010498047, -0.024906158447265625, -0.023651599884033203, -0.02239704132080078, -0.02114248275756836, -0.019887924194335938, -0.018633365631103516, -0.017378807067871094, -0.016124248504638672, -0.01486968994140625, -0.013615131378173828, -0.012360572814941406, -0.011106014251708984, -0.009851455688476562, -0.00859689712524414, -0.007342338562011719, -0.006087779998779297, -0.004833221435546875, -0.003578662872314453, -0.0023241043090820312, -0.0010695457458496094, 0.0001850128173828125, 0.0014395713806152344, 0.0026941299438476562, 0.003948688507080078, 0.0052032470703125, 0.006457805633544922, 0.007712364196777344, 0.008966922760009766, 0.010221481323242188, 0.01147603988647461, 0.012730598449707031, 0.013985157012939453, 0.015239715576171875, 0.016494274139404297, 0.01774883270263672, 0.01900339126586914, 0.020257949829101562, 0.021512508392333984, 0.022767066955566406, 0.024021625518798828, 0.02527618408203125, 0.026530742645263672, 0.027785301208496094, 0.029039859771728516, 0.030294418334960938, 0.03154897689819336, 0.03280353546142578, 0.0340580940246582, 0.035312652587890625, 0.03656721115112305, 0.03782176971435547, 0.03907632827758789, 0.04033088684082031, 0.041585445404052734, 0.042840003967285156, 0.04409456253051758, 0.04534912109375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 11.0, 20.0, 37.0, 67.0, 115.0, 168.0, 169.0, 165.0, 110.0, 62.0, 34.0, 24.0, 14.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17778435349464417, -0.16735491156578064, -0.15692545473575592, -0.1464960128068924, -0.13606657087802887, -0.12563711404800415, -0.11520767211914062, -0.1047782301902771, -0.09434878081083298, -0.08391933143138885, -0.07348988950252533, -0.06306044012308121, -0.05263099446892738, -0.04220154881477356, -0.03177209943532944, -0.021342657506465912, -0.01091320812702179, -0.0004837615415453911, 0.009945685043931007, 0.02037513256072998, 0.030804578214883804, 0.04123402386903763, 0.05166347324848175, 0.062092915177345276, 0.0725223645567894, 0.08295181393623352, 0.09338125586509705, 0.10381070524454117, 0.11424015462398529, 0.12466959655284882, 0.13509905338287354, 0.14552849531173706, 0.15595793724060059, 0.1663873791694641, 0.17681683599948883, 0.18724627792835236, 0.19767571985721588, 0.2081051766872406, 0.21853461861610413, 0.22896406054496765, 0.23939350247383118, 0.2498229444026947, 0.2602523863315582, 0.27068185806274414, 0.28111129999160767, 0.2915407419204712, 0.3019701838493347, 0.31239962577819824, 0.32282906770706177, 0.3332585096359253, 0.3436879515647888, 0.35411739349365234, 0.36454686522483826, 0.3749763071537018, 0.3854057490825653, 0.39583519101142883, 0.40626466274261475, 0.41669410467147827, 0.4271235466003418, 0.4375529885292053, 0.44798246026039124, 0.45841190218925476, 0.4688413441181183, 0.4792707860469818, 0.48970022797584534]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 5.0, 5.0, 2.0, 10.0, 10.0, 7.0, 15.0, 11.0, 16.0, 14.0, 20.0, 20.0, 27.0, 27.0, 18.0, 39.0, 39.0, 27.0, 35.0, 29.0, 45.0, 25.0, 48.0, 48.0, 35.0, 47.0, 40.0, 35.0, 30.0, 37.0, 29.0, 32.0, 28.0, 14.0, 14.0, 18.0, 17.0, 10.0, 21.0, 11.0, 10.0, 8.0, 10.0, 3.0, 4.0, 3.0, 1.0, 1.0, 5.0, 2.0], "bins": [-0.1448119878768921, -0.14098496735095978, -0.13715794682502747, -0.13333092629909515, -0.12950390577316284, -0.12567687034606934, -0.12184984982013702, -0.11802282929420471, -0.1141958087682724, -0.11036878824234009, -0.10654176771640778, -0.10271473973989487, -0.09888771921396255, -0.09506069868803024, -0.09123367071151733, -0.08740665018558502, -0.08357962965965271, -0.0797526091337204, -0.07592558860778809, -0.07209856063127518, -0.06827154010534286, -0.06444451957941055, -0.06061749532818794, -0.05679047107696533, -0.05296345055103302, -0.04913643002510071, -0.0453094057738781, -0.04148238152265549, -0.037655360996723175, -0.03382834047079086, -0.030001316219568253, -0.02617429383099079, -0.02234727144241333, -0.01852024905383587, -0.014693226665258408, -0.010866204276680946, -0.007039181888103485, -0.003212159499526024, 0.0006148628890514374, 0.004441885277628899, 0.00826890766620636, 0.012095930054783821, 0.015922952443361282, 0.019749974831938744, 0.023576997220516205, 0.027404019609093666, 0.031231041997671127, 0.03505806624889374, 0.03888508677482605, 0.04271210730075836, 0.04653913155198097, 0.05036615580320358, 0.054193176329135895, 0.05802019685506821, 0.06184722110629082, 0.06567424535751343, 0.06950126588344574, 0.07332828640937805, 0.07715530693531036, 0.08098233491182327, 0.08480935543775558, 0.0886363759636879, 0.0924634039402008, 0.09629042446613312, 0.10011744499206543]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 8.0, 3.0, 5.0, 4.0, 9.0, 9.0, 18.0, 31.0, 47.0, 57.0, 72.0, 113.0, 145.0, 256.0, 374.0, 525.0, 851.0, 1359.0, 2296.0, 3776.0, 6470.0, 11826.0, 22424.0, 44515.0, 93869.0, 208800.0, 322422.0, 170001.0, 77334.0, 37447.0, 18991.0, 10211.0, 5571.0, 3276.0, 1976.0, 1232.0, 813.0, 482.0, 326.0, 207.0, 134.0, 84.0, 58.0, 42.0, 27.0, 24.0, 16.0, 8.0, 10.0, 2.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.056488037109375, -0.0545649528503418, -0.052641868591308594, -0.05071878433227539, -0.04879570007324219, -0.046872615814208984, -0.04494953155517578, -0.04302644729614258, -0.041103363037109375, -0.03918027877807617, -0.03725719451904297, -0.035334110260009766, -0.03341102600097656, -0.03148794174194336, -0.029564857482910156, -0.027641773223876953, -0.02571868896484375, -0.023795604705810547, -0.021872520446777344, -0.01994943618774414, -0.018026351928710938, -0.016103267669677734, -0.014180183410644531, -0.012257099151611328, -0.010334014892578125, -0.008410930633544922, -0.006487846374511719, -0.004564762115478516, -0.0026416778564453125, -0.0007185935974121094, 0.0012044906616210938, 0.003127574920654297, 0.0050506591796875, 0.006973743438720703, 0.008896827697753906, 0.01081991195678711, 0.012742996215820312, 0.014666080474853516, 0.01658916473388672, 0.018512248992919922, 0.020435333251953125, 0.022358417510986328, 0.02428150177001953, 0.026204586029052734, 0.028127670288085938, 0.03005075454711914, 0.031973838806152344, 0.03389692306518555, 0.03582000732421875, 0.03774309158325195, 0.039666175842285156, 0.04158926010131836, 0.04351234436035156, 0.045435428619384766, 0.04735851287841797, 0.04928159713745117, 0.051204681396484375, 0.05312776565551758, 0.05505084991455078, 0.056973934173583984, 0.05889701843261719, 0.06082010269165039, 0.0627431869506836, 0.0646662712097168, 0.06658935546875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 6.0, 5.0, 7.0, 2.0, 5.0, 8.0, 11.0, 5.0, 11.0, 26.0, 34.0, 37.0, 47.0, 41.0, 57.0, 55.0, 55.0, 58.0, 56.0, 62.0, 73.0, 83.0, 40.0, 31.0, 39.0, 33.0, 29.0, 18.0, 20.0, 12.0, 15.0, 6.0, 5.0, 7.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01824951171875, -0.01758432388305664, -0.01691913604736328, -0.016253948211669922, -0.015588760375976562, -0.014923572540283203, -0.014258384704589844, -0.013593196868896484, -0.012928009033203125, -0.012262821197509766, -0.011597633361816406, -0.010932445526123047, -0.010267257690429688, -0.009602069854736328, -0.008936882019042969, -0.00827169418334961, -0.00760650634765625, -0.006941318511962891, -0.006276130676269531, -0.005610942840576172, -0.0049457550048828125, -0.004280567169189453, -0.0036153793334960938, -0.0029501914978027344, -0.002285003662109375, -0.0016198158264160156, -0.0009546279907226562, -0.0002894401550292969, 0.0003757476806640625, 0.0010409355163574219, 0.0017061233520507812, 0.0023713111877441406, 0.0030364990234375, 0.0037016868591308594, 0.004366874694824219, 0.005032062530517578, 0.0056972503662109375, 0.006362438201904297, 0.007027626037597656, 0.007692813873291016, 0.008358001708984375, 0.009023189544677734, 0.009688377380371094, 0.010353565216064453, 0.011018753051757812, 0.011683940887451172, 0.012349128723144531, 0.01301431655883789, 0.01367950439453125, 0.01434469223022461, 0.015009880065917969, 0.015675067901611328, 0.016340255737304688, 0.017005443572998047, 0.017670631408691406, 0.018335819244384766, 0.019001007080078125, 0.019666194915771484, 0.020331382751464844, 0.020996570587158203, 0.021661758422851562, 0.022326946258544922, 0.02299213409423828, 0.02365732192993164, 0.024322509765625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 9.0, 5.0, 8.0, 7.0, 7.0, 23.0, 35.0, 42.0, 69.0, 89.0, 124.0, 159.0, 243.0, 421.0, 550.0, 1054.0, 2137.0, 5378.0, 13835.0, 41200.0, 130828.0, 391507.0, 313058.0, 97694.0, 31067.0, 10612.0, 4074.0, 1843.0, 953.0, 494.0, 312.0, 229.0, 139.0, 94.0, 58.0, 58.0, 38.0, 25.0, 23.0, 20.0, 16.0, 8.0, 4.0, 4.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0694580078125, -0.06713294982910156, -0.06480789184570312, -0.06248283386230469, -0.06015777587890625, -0.05783271789550781, -0.055507659912109375, -0.05318260192871094, -0.0508575439453125, -0.04853248596191406, -0.046207427978515625, -0.04388236999511719, -0.04155731201171875, -0.03923225402832031, -0.036907196044921875, -0.03458213806152344, -0.032257080078125, -0.029932022094726562, -0.027606964111328125, -0.025281906127929688, -0.02295684814453125, -0.020631790161132812, -0.018306732177734375, -0.015981674194335938, -0.0136566162109375, -0.011331558227539062, -0.009006500244140625, -0.0066814422607421875, -0.00435638427734375, -0.0020313262939453125, 0.000293731689453125, 0.0026187896728515625, 0.00494384765625, 0.0072689056396484375, 0.009593963623046875, 0.011919021606445312, 0.01424407958984375, 0.016569137573242188, 0.018894195556640625, 0.021219253540039062, 0.0235443115234375, 0.025869369506835938, 0.028194427490234375, 0.030519485473632812, 0.03284454345703125, 0.03516960144042969, 0.037494659423828125, 0.03981971740722656, 0.042144775390625, 0.04446983337402344, 0.046794891357421875, 0.04911994934082031, 0.05144500732421875, 0.05377006530761719, 0.056095123291015625, 0.05842018127441406, 0.0607452392578125, 0.06307029724121094, 0.06539535522460938, 0.06772041320800781, 0.07004547119140625, 0.07237052917480469, 0.07469558715820312, 0.07702064514160156, 0.079345703125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 5.0, 4.0, 3.0, 5.0, 9.0, 7.0, 13.0, 9.0, 16.0, 13.0, 16.0, 20.0, 27.0, 21.0, 32.0, 33.0, 32.0, 40.0, 32.0, 50.0, 38.0, 42.0, 40.0, 64.0, 26.0, 23.0, 34.0, 29.0, 42.0, 35.0, 31.0, 34.0, 25.0, 24.0, 24.0, 25.0, 18.0, 16.0, 9.0, 5.0, 7.0, 8.0, 5.0, 4.0, 5.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.06695556640625, -0.06477832794189453, -0.06260108947753906, -0.060423851013183594, -0.058246612548828125, -0.056069374084472656, -0.05389213562011719, -0.05171489715576172, -0.04953765869140625, -0.04736042022705078, -0.04518318176269531, -0.043005943298339844, -0.040828704833984375, -0.038651466369628906, -0.03647422790527344, -0.03429698944091797, -0.0321197509765625, -0.02994251251220703, -0.027765274047851562, -0.025588035583496094, -0.023410797119140625, -0.021233558654785156, -0.019056320190429688, -0.01687908172607422, -0.01470184326171875, -0.012524604797363281, -0.010347366333007812, -0.008170127868652344, -0.005992889404296875, -0.0038156509399414062, -0.0016384124755859375, 0.0005388259887695312, 0.002716064453125, 0.004893302917480469, 0.0070705413818359375, 0.009247779846191406, 0.011425018310546875, 0.013602256774902344, 0.015779495239257812, 0.01795673370361328, 0.02013397216796875, 0.02231121063232422, 0.024488449096679688, 0.026665687561035156, 0.028842926025390625, 0.031020164489746094, 0.03319740295410156, 0.03537464141845703, 0.0375518798828125, 0.03972911834716797, 0.04190635681152344, 0.044083595275878906, 0.046260833740234375, 0.048438072204589844, 0.05061531066894531, 0.05279254913330078, 0.05496978759765625, 0.05714702606201172, 0.05932426452636719, 0.061501502990722656, 0.06367874145507812, 0.0658559799194336, 0.06803321838378906, 0.07021045684814453, 0.0723876953125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 8.0, 12.0, 15.0, 21.0, 41.0, 52.0, 81.0, 135.0, 227.0, 387.0, 697.0, 1286.0, 2446.0, 5103.0, 11898.0, 30100.0, 87626.0, 286990.0, 408766.0, 137465.0, 44516.0, 16661.0, 7025.0, 3212.0, 1630.0, 874.0, 500.0, 289.0, 168.0, 106.0, 59.0, 53.0, 39.0, 17.0, 9.0, 9.0, 6.0, 10.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03887939453125, -0.03763294219970703, -0.03638648986816406, -0.035140037536621094, -0.033893585205078125, -0.032647132873535156, -0.03140068054199219, -0.03015422821044922, -0.02890777587890625, -0.02766132354736328, -0.026414871215820312, -0.025168418884277344, -0.023921966552734375, -0.022675514221191406, -0.021429061889648438, -0.02018260955810547, -0.0189361572265625, -0.01768970489501953, -0.016443252563476562, -0.015196800231933594, -0.013950347900390625, -0.012703895568847656, -0.011457443237304688, -0.010210990905761719, -0.00896453857421875, -0.007718086242675781, -0.0064716339111328125, -0.005225181579589844, -0.003978729248046875, -0.0027322769165039062, -0.0014858245849609375, -0.00023937225341796875, 0.001007080078125, 0.0022535324096679688, 0.0034999847412109375, 0.004746437072753906, 0.005992889404296875, 0.007239341735839844, 0.008485794067382812, 0.009732246398925781, 0.01097869873046875, 0.012225151062011719, 0.013471603393554688, 0.014718055725097656, 0.015964508056640625, 0.017210960388183594, 0.018457412719726562, 0.01970386505126953, 0.0209503173828125, 0.02219676971435547, 0.023443222045898438, 0.024689674377441406, 0.025936126708984375, 0.027182579040527344, 0.028429031372070312, 0.02967548370361328, 0.03092193603515625, 0.03216838836669922, 0.03341484069824219, 0.034661293029785156, 0.035907745361328125, 0.037154197692871094, 0.03840065002441406, 0.03964710235595703, 0.0408935546875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 6.0, 12.0, 12.0, 15.0, 24.0, 20.0, 46.0, 68.0, 67.0, 84.0, 96.0, 106.0, 91.0, 86.0, 65.0, 57.0, 36.0, 29.0, 26.0, 22.0, 5.0, 11.0, 1.0, 5.0, 8.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5822391510009766e-05, -3.46088781952858e-05, -3.339536488056183e-05, -3.218185156583786e-05, -3.096833825111389e-05, -2.9754824936389923e-05, -2.8541311621665955e-05, -2.7327798306941986e-05, -2.6114284992218018e-05, -2.490077167749405e-05, -2.368725836277008e-05, -2.2473745048046112e-05, -2.1260231733322144e-05, -2.0046718418598175e-05, -1.8833205103874207e-05, -1.7619691789150238e-05, -1.640617847442627e-05, -1.5192665159702301e-05, -1.3979151844978333e-05, -1.2765638530254364e-05, -1.1552125215530396e-05, -1.0338611900806427e-05, -9.125098586082458e-06, -7.91158527135849e-06, -6.6980719566345215e-06, -5.484558641910553e-06, -4.2710453271865845e-06, -3.057532012462616e-06, -1.8440186977386475e-06, -6.30505383014679e-07, 5.830079317092896e-07, 1.796521246433258e-06, 3.0100345611572266e-06, 4.223547875881195e-06, 5.4370611906051636e-06, 6.650574505329132e-06, 7.8640878200531e-06, 9.077601134777069e-06, 1.0291114449501038e-05, 1.1504627764225006e-05, 1.2718141078948975e-05, 1.3931654393672943e-05, 1.5145167708396912e-05, 1.635868102312088e-05, 1.757219433784485e-05, 1.8785707652568817e-05, 1.9999220967292786e-05, 2.1212734282016754e-05, 2.2426247596740723e-05, 2.363976091146469e-05, 2.485327422618866e-05, 2.6066787540912628e-05, 2.7280300855636597e-05, 2.8493814170360565e-05, 2.9707327485084534e-05, 3.09208407998085e-05, 3.213435411453247e-05, 3.334786742925644e-05, 3.456138074398041e-05, 3.5774894058704376e-05, 3.6988407373428345e-05, 3.820192068815231e-05, 3.941543400287628e-05, 4.062894731760025e-05, 4.184246063232422e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 4.0, 6.0, 10.0, 11.0, 18.0, 20.0, 37.0, 51.0, 77.0, 114.0, 160.0, 308.0, 547.0, 995.0, 2022.0, 4057.0, 8856.0, 21707.0, 63537.0, 225624.0, 474423.0, 164985.0, 48794.0, 17735.0, 7199.0, 3478.0, 1708.0, 819.0, 489.0, 279.0, 158.0, 106.0, 73.0, 35.0, 31.0, 21.0, 18.0, 20.0, 3.0, 7.0, 4.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.041229248046875, -0.03991556167602539, -0.03860187530517578, -0.03728818893432617, -0.03597450256347656, -0.03466081619262695, -0.033347129821777344, -0.032033443450927734, -0.030719757080078125, -0.029406070709228516, -0.028092384338378906, -0.026778697967529297, -0.025465011596679688, -0.024151325225830078, -0.02283763885498047, -0.02152395248413086, -0.02021026611328125, -0.01889657974243164, -0.01758289337158203, -0.016269207000732422, -0.014955520629882812, -0.013641834259033203, -0.012328147888183594, -0.011014461517333984, -0.009700775146484375, -0.008387088775634766, -0.007073402404785156, -0.005759716033935547, -0.0044460296630859375, -0.003132343292236328, -0.0018186569213867188, -0.0005049705505371094, 0.0008087158203125, 0.0021224021911621094, 0.0034360885620117188, 0.004749774932861328, 0.0060634613037109375, 0.007377147674560547, 0.008690834045410156, 0.010004520416259766, 0.011318206787109375, 0.012631893157958984, 0.013945579528808594, 0.015259265899658203, 0.016572952270507812, 0.017886638641357422, 0.01920032501220703, 0.02051401138305664, 0.02182769775390625, 0.02314138412475586, 0.02445507049560547, 0.025768756866455078, 0.027082443237304688, 0.028396129608154297, 0.029709815979003906, 0.031023502349853516, 0.032337188720703125, 0.033650875091552734, 0.034964561462402344, 0.03627824783325195, 0.03759193420410156, 0.03890562057495117, 0.04021930694580078, 0.04153299331665039, 0.0428466796875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 8.0, 13.0, 15.0, 21.0, 21.0, 21.0, 36.0, 36.0, 65.0, 72.0, 69.0, 103.0, 78.0, 75.0, 60.0, 52.0, 36.0, 52.0, 30.0, 24.0, 28.0, 13.0, 14.0, 7.0, 14.0, 9.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0297698974609375, -0.02870965003967285, -0.027649402618408203, -0.026589155197143555, -0.025528907775878906, -0.024468660354614258, -0.02340841293334961, -0.02234816551208496, -0.021287918090820312, -0.020227670669555664, -0.019167423248291016, -0.018107175827026367, -0.01704692840576172, -0.01598668098449707, -0.014926433563232422, -0.013866186141967773, -0.012805938720703125, -0.011745691299438477, -0.010685443878173828, -0.00962519645690918, -0.008564949035644531, -0.007504701614379883, -0.006444454193115234, -0.005384206771850586, -0.0043239593505859375, -0.003263711929321289, -0.0022034645080566406, -0.0011432170867919922, -8.296966552734375e-05, 0.0009772777557373047, 0.002037525177001953, 0.0030977725982666016, 0.00415802001953125, 0.0052182674407958984, 0.006278514862060547, 0.007338762283325195, 0.008399009704589844, 0.009459257125854492, 0.01051950454711914, 0.011579751968383789, 0.012639999389648438, 0.013700246810913086, 0.014760494232177734, 0.015820741653442383, 0.01688098907470703, 0.01794123649597168, 0.019001483917236328, 0.020061731338500977, 0.021121978759765625, 0.022182226181030273, 0.023242473602294922, 0.02430272102355957, 0.02536296844482422, 0.026423215866088867, 0.027483463287353516, 0.028543710708618164, 0.029603958129882812, 0.03066420555114746, 0.03172445297241211, 0.03278470039367676, 0.033844947814941406, 0.034905195236206055, 0.0359654426574707, 0.03702569007873535, 0.0380859375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 8.0, 12.0, 20.0, 48.0, 64.0, 115.0, 168.0, 183.0, 153.0, 113.0, 67.0, 34.0, 13.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8925408124923706, -0.8664276003837585, -0.8403143882751465, -0.8142011165618896, -0.7880879044532776, -0.7619746923446655, -0.7358614802360535, -0.7097482681274414, -0.6836349964141846, -0.6575217843055725, -0.6314085721969604, -0.6052953004837036, -0.5791820883750916, -0.5530688762664795, -0.5269556641578674, -0.5008424520492554, -0.4747292101383209, -0.44861599802970886, -0.4225027561187744, -0.39638954401016235, -0.3702763020992279, -0.34416308999061584, -0.3180498480796814, -0.29193663597106934, -0.2658234238624573, -0.23971019685268402, -0.21359696984291077, -0.1874837577342987, -0.16137051582336426, -0.1352573037147522, -0.10914407670497894, -0.08303084969520569, -0.05691760778427124, -0.030804382637143135, -0.00469115749001503, 0.021422065794467926, 0.04753529280424118, 0.07364851236343384, 0.09976173937320709, 0.12587496638298035, 0.1519881933927536, 0.17810142040252686, 0.2042146474123001, 0.23032787442207336, 0.2564410865306854, 0.2825543284416199, 0.30866754055023193, 0.334780752658844, 0.36089399456977844, 0.3870072066783905, 0.41312044858932495, 0.439233660697937, 0.46534690260887146, 0.4914601147174835, 0.517573356628418, 0.54368656873703, 0.5697997808456421, 0.5959129929542542, 0.6220262050628662, 0.648139476776123, 0.6742526888847351, 0.7003659009933472, 0.7264791131019592, 0.7525923252105713, 0.7787055969238281]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 9.0, 10.0, 6.0, 11.0, 9.0, 8.0, 21.0, 24.0, 20.0, 35.0, 33.0, 34.0, 53.0, 31.0, 45.0, 41.0, 48.0, 47.0, 57.0, 36.0, 51.0, 43.0, 56.0, 39.0, 46.0, 32.0, 21.0, 17.0, 24.0, 11.0, 14.0, 9.0, 9.0, 11.0, 11.0, 13.0, 3.0, 3.0, 2.0, 1.0, 1.0, 6.0, 4.0, 1.0], "bins": [-0.551406741142273, -0.5369205474853516, -0.5224342942237854, -0.507948100566864, -0.49346187710762024, -0.47897568345069885, -0.4644894599914551, -0.4500032663345337, -0.4355170428752899, -0.42103081941604614, -0.40654462575912476, -0.392058402299881, -0.3775721788406372, -0.3630859851837158, -0.34859976172447205, -0.33411353826522827, -0.3196273446083069, -0.3051411211490631, -0.2906549274921417, -0.27616870403289795, -0.2616824805736542, -0.2471962869167328, -0.232710063457489, -0.21822385489940643, -0.20373761653900146, -0.18925140798091888, -0.1747651845216751, -0.16027897596359253, -0.14579276740550995, -0.13130655884742737, -0.1168203353881836, -0.10233412683010101, -0.08784791827201843, -0.07336170226335526, -0.058875493705272675, -0.0443892776966095, -0.029903065413236618, -0.015416853129863739, -0.0009306371212005615, 0.013555571436882019, 0.028041787445545197, 0.042527999728918076, 0.057014212012290955, 0.07150042802095413, 0.08598664402961731, 0.10047285258769989, 0.11495906859636307, 0.12944528460502625, 0.14393149316310883, 0.1584177017211914, 0.17290392518043518, 0.18739013373851776, 0.20187634229660034, 0.21636256575584412, 0.2308487743139267, 0.24533498287200928, 0.25982120633125305, 0.2743074297904968, 0.2887936234474182, 0.303279846906662, 0.31776607036590576, 0.33225226402282715, 0.3467384874820709, 0.3612247109413147, 0.3757109045982361]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 6.0, 13.0, 15.0, 17.0, 27.0, 39.0, 50.0, 92.0, 150.0, 213.0, 375.0, 679.0, 1127.0, 2288.0, 4617.0, 10707.0, 29043.0, 108291.0, 2983123.0, 928258.0, 82833.0, 24093.0, 9256.0, 4139.0, 1983.0, 1134.0, 614.0, 397.0, 214.0, 154.0, 105.0, 76.0, 45.0, 40.0, 19.0, 17.0, 9.0, 8.0, 5.0, 2.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0782470703125, -0.07544422149658203, -0.07264137268066406, -0.0698385238647461, -0.06703567504882812, -0.06423282623291016, -0.06142997741699219, -0.05862712860107422, -0.05582427978515625, -0.05302143096923828, -0.05021858215332031, -0.047415733337402344, -0.044612884521484375, -0.041810035705566406, -0.03900718688964844, -0.03620433807373047, -0.0334014892578125, -0.03059864044189453, -0.027795791625976562, -0.024992942810058594, -0.022190093994140625, -0.019387245178222656, -0.016584396362304688, -0.013781547546386719, -0.01097869873046875, -0.008175849914550781, -0.0053730010986328125, -0.0025701522827148438, 0.000232696533203125, 0.0030355453491210938, 0.0058383941650390625, 0.008641242980957031, 0.011444091796875, 0.014246940612792969, 0.017049789428710938, 0.019852638244628906, 0.022655487060546875, 0.025458335876464844, 0.028261184692382812, 0.03106403350830078, 0.03386688232421875, 0.03666973114013672, 0.03947257995605469, 0.042275428771972656, 0.045078277587890625, 0.047881126403808594, 0.05068397521972656, 0.05348682403564453, 0.0562896728515625, 0.05909252166748047, 0.06189537048339844, 0.0646982192993164, 0.06750106811523438, 0.07030391693115234, 0.07310676574707031, 0.07590961456298828, 0.07871246337890625, 0.08151531219482422, 0.08431816101074219, 0.08712100982666016, 0.08992385864257812, 0.0927267074584961, 0.09552955627441406, 0.09833240509033203, 0.10113525390625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 4.0, 6.0, 5.0, 3.0, 4.0, 4.0, 7.0, 8.0, 13.0, 16.0, 25.0, 47.0, 43.0, 47.0, 63.0, 66.0, 49.0, 67.0, 77.0, 68.0, 65.0, 65.0, 64.0, 41.0, 25.0, 25.0, 21.0, 20.0, 17.0, 14.0, 8.0, 6.0, 3.0, 4.0, 6.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01751708984375, -0.016731739044189453, -0.015946388244628906, -0.01516103744506836, -0.014375686645507812, -0.013590335845947266, -0.012804985046386719, -0.012019634246826172, -0.011234283447265625, -0.010448932647705078, -0.009663581848144531, -0.008878231048583984, -0.008092880249023438, -0.007307529449462891, -0.006522178649902344, -0.005736827850341797, -0.00495147705078125, -0.004166126251220703, -0.0033807754516601562, -0.0025954246520996094, -0.0018100738525390625, -0.0010247230529785156, -0.00023937225341796875, 0.0005459785461425781, 0.001331329345703125, 0.002116680145263672, 0.0029020309448242188, 0.0036873817443847656, 0.0044727325439453125, 0.005258083343505859, 0.006043434143066406, 0.006828784942626953, 0.0076141357421875, 0.008399486541748047, 0.009184837341308594, 0.00997018814086914, 0.010755538940429688, 0.011540889739990234, 0.012326240539550781, 0.013111591339111328, 0.013896942138671875, 0.014682292938232422, 0.015467643737792969, 0.016252994537353516, 0.017038345336914062, 0.01782369613647461, 0.018609046936035156, 0.019394397735595703, 0.02017974853515625, 0.020965099334716797, 0.021750450134277344, 0.02253580093383789, 0.023321151733398438, 0.024106502532958984, 0.02489185333251953, 0.025677204132080078, 0.026462554931640625, 0.027247905731201172, 0.02803325653076172, 0.028818607330322266, 0.029603958129882812, 0.03038930892944336, 0.031174659729003906, 0.03196001052856445, 0.032745361328125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 9.0, 14.0, 20.0, 30.0, 41.0, 73.0, 118.0, 178.0, 305.0, 471.0, 970.0, 1748.0, 3324.0, 6416.0, 14026.0, 32387.0, 88407.0, 356761.0, 3100699.0, 425053.0, 98352.0, 35132.0, 15211.0, 6930.0, 3565.0, 1788.0, 919.0, 547.0, 313.0, 178.0, 100.0, 69.0, 42.0, 30.0, 18.0, 14.0, 10.0, 9.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.07757568359375, -0.0753931999206543, -0.0732107162475586, -0.07102823257446289, -0.06884574890136719, -0.06666326522827148, -0.06448078155517578, -0.06229829788208008, -0.060115814208984375, -0.05793333053588867, -0.05575084686279297, -0.053568363189697266, -0.05138587951660156, -0.04920339584350586, -0.047020912170410156, -0.04483842849731445, -0.04265594482421875, -0.04047346115112305, -0.038290977478027344, -0.03610849380493164, -0.03392601013183594, -0.031743526458740234, -0.02956104278564453, -0.027378559112548828, -0.025196075439453125, -0.023013591766357422, -0.02083110809326172, -0.018648624420166016, -0.016466140747070312, -0.01428365707397461, -0.012101173400878906, -0.009918689727783203, -0.0077362060546875, -0.005553722381591797, -0.0033712387084960938, -0.0011887550354003906, 0.0009937286376953125, 0.0031762123107910156, 0.005358695983886719, 0.007541179656982422, 0.009723663330078125, 0.011906147003173828, 0.014088630676269531, 0.016271114349365234, 0.018453598022460938, 0.02063608169555664, 0.022818565368652344, 0.025001049041748047, 0.02718353271484375, 0.029366016387939453, 0.031548500061035156, 0.03373098373413086, 0.03591346740722656, 0.038095951080322266, 0.04027843475341797, 0.04246091842651367, 0.044643402099609375, 0.04682588577270508, 0.04900836944580078, 0.051190853118896484, 0.05337333679199219, 0.05555582046508789, 0.057738304138183594, 0.0599207878112793, 0.062103271484375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 4.0, 8.0, 13.0, 14.0, 15.0, 23.0, 29.0, 43.0, 57.0, 84.0, 109.0, 209.0, 469.0, 1376.0, 793.0, 291.0, 170.0, 102.0, 72.0, 49.0, 33.0, 26.0, 19.0, 14.0, 17.0, 11.0, 9.0, 7.0, 4.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036590576171875, -0.035320281982421875, -0.03404998779296875, -0.032779693603515625, -0.0315093994140625, -0.030239105224609375, -0.02896881103515625, -0.027698516845703125, -0.02642822265625, -0.025157928466796875, -0.02388763427734375, -0.022617340087890625, -0.0213470458984375, -0.020076751708984375, -0.01880645751953125, -0.017536163330078125, -0.016265869140625, -0.014995574951171875, -0.01372528076171875, -0.012454986572265625, -0.0111846923828125, -0.009914398193359375, -0.00864410400390625, -0.007373809814453125, -0.006103515625, -0.004833221435546875, -0.00356292724609375, -0.002292633056640625, -0.0010223388671875, 0.000247955322265625, 0.00151824951171875, 0.002788543701171875, 0.004058837890625, 0.005329132080078125, 0.00659942626953125, 0.007869720458984375, 0.0091400146484375, 0.010410308837890625, 0.01168060302734375, 0.012950897216796875, 0.01422119140625, 0.015491485595703125, 0.01676177978515625, 0.018032073974609375, 0.0193023681640625, 0.020572662353515625, 0.02184295654296875, 0.023113250732421875, 0.024383544921875, 0.025653839111328125, 0.02692413330078125, 0.028194427490234375, 0.0294647216796875, 0.030735015869140625, 0.03200531005859375, 0.033275604248046875, 0.0345458984375, 0.035816192626953125, 0.03708648681640625, 0.038356781005859375, 0.0396270751953125, 0.040897369384765625, 0.04216766357421875, 0.043437957763671875, 0.044708251953125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 8.0, 11.0, 12.0, 31.0, 38.0, 104.0, 127.0, 167.0, 177.0, 128.0, 101.0, 53.0, 29.0, 11.0, 7.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3000304102897644, -0.28862038254737854, -0.2772103548049927, -0.2658003270626068, -0.25439029932022095, -0.24298027157783508, -0.23157022893428802, -0.22016020119190216, -0.2087501734495163, -0.19734014570713043, -0.18593011796474457, -0.1745200753211975, -0.16311004757881165, -0.15170001983642578, -0.14028999209403992, -0.12887996435165405, -0.11746993660926819, -0.10605990886688232, -0.09464988112449646, -0.08323984593153, -0.07182981818914413, -0.06041979044675827, -0.04900975525379181, -0.037599727511405945, -0.02618969976902008, -0.014779670163989067, -0.0033696405589580536, 0.008040390908718109, 0.019450418651103973, 0.030860446393489838, 0.0422704815864563, 0.05368050932884216, 0.06509053707122803, 0.07650056481361389, 0.08791059255599976, 0.09932062774896622, 0.11073065549135208, 0.12214068323373795, 0.1335507184267044, 0.14496074616909027, 0.15637077391147614, 0.167780801653862, 0.17919082939624786, 0.19060087203979492, 0.2020108997821808, 0.21342092752456665, 0.22483095526695251, 0.23624098300933838, 0.24765101075172424, 0.2590610384941101, 0.27047106623649597, 0.28188109397888184, 0.2932911217212677, 0.30470114946365356, 0.3161112070083618, 0.3275212049484253, 0.33893126249313354, 0.3503412902355194, 0.3617513179779053, 0.37316134572029114, 0.384571373462677, 0.39598140120506287, 0.40739142894744873, 0.418801486492157, 0.43021148443222046]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 6.0, 5.0, 4.0, 5.0, 5.0, 8.0, 4.0, 8.0, 17.0, 18.0, 10.0, 21.0, 21.0, 26.0, 23.0, 34.0, 41.0, 33.0, 37.0, 46.0, 46.0, 45.0, 48.0, 36.0, 30.0, 48.0, 38.0, 37.0, 35.0, 33.0, 21.0, 28.0, 21.0, 29.0, 18.0, 14.0, 13.0, 15.0, 23.0, 10.0, 15.0, 7.0, 9.0, 1.0, 1.0, 7.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.14985984563827515, -0.14571259915828705, -0.14156536757946014, -0.13741812109947205, -0.13327087461948395, -0.12912362813949585, -0.12497639656066895, -0.12082915008068085, -0.11668191105127335, -0.11253467202186584, -0.10838742554187775, -0.10424018651247025, -0.10009294748306274, -0.09594570100307465, -0.09179846197366714, -0.08765122294425964, -0.08350397646427155, -0.07935673743486404, -0.07520949095487595, -0.07106225192546844, -0.06691500544548035, -0.06276776641607285, -0.058620527386665344, -0.054473284631967545, -0.050326041877269745, -0.046178799122571945, -0.042031556367874146, -0.037884317338466644, -0.033737074583768845, -0.029589831829071045, -0.025442590937018394, -0.021295350044965744, -0.017148107290267944, -0.01300086546689272, -0.008853623643517494, -0.004706381820142269, -0.0005591399967670441, 0.0035881027579307556, 0.007735343649983406, 0.011882584542036057, 0.016029827296733856, 0.020177070051431656, 0.024324310943484306, 0.028471551835536957, 0.032618794590234756, 0.036766037344932556, 0.04091327637434006, 0.04506051912903786, 0.04920776188373566, 0.053355004638433456, 0.057502247393131256, 0.06164948642253876, 0.06579673290252686, 0.06994397193193436, 0.07409121096134186, 0.07823845744132996, 0.08238569647073746, 0.08653293550014496, 0.09068018198013306, 0.09482742100954056, 0.09897466003894806, 0.10312190651893616, 0.10726914554834366, 0.11141638457775116, 0.11556363105773926]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 5.0, 11.0, 7.0, 11.0, 7.0, 16.0, 31.0, 64.0, 90.0, 133.0, 213.0, 350.0, 653.0, 1030.0, 2004.0, 3648.0, 7365.0, 15371.0, 36325.0, 100324.0, 486710.0, 275957.0, 67270.0, 26595.0, 11870.0, 5724.0, 2996.0, 1606.0, 869.0, 519.0, 275.0, 179.0, 111.0, 70.0, 57.0, 28.0, 22.0, 17.0, 14.0, 3.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.076416015625, -0.07376480102539062, -0.07111358642578125, -0.06846237182617188, -0.0658111572265625, -0.06315994262695312, -0.06050872802734375, -0.057857513427734375, -0.055206298828125, -0.052555084228515625, -0.04990386962890625, -0.047252655029296875, -0.0446014404296875, -0.041950225830078125, -0.03929901123046875, -0.036647796630859375, -0.03399658203125, -0.031345367431640625, -0.02869415283203125, -0.026042938232421875, -0.0233917236328125, -0.020740509033203125, -0.01808929443359375, -0.015438079833984375, -0.012786865234375, -0.010135650634765625, -0.00748443603515625, -0.004833221435546875, -0.0021820068359375, 0.000469207763671875, 0.00312042236328125, 0.005771636962890625, 0.0084228515625, 0.011074066162109375, 0.01372528076171875, 0.016376495361328125, 0.0190277099609375, 0.021678924560546875, 0.02433013916015625, 0.026981353759765625, 0.029632568359375, 0.032283782958984375, 0.03493499755859375, 0.037586212158203125, 0.0402374267578125, 0.042888641357421875, 0.04553985595703125, 0.048191070556640625, 0.05084228515625, 0.053493499755859375, 0.05614471435546875, 0.058795928955078125, 0.0614471435546875, 0.06409835815429688, 0.06674957275390625, 0.06940078735351562, 0.072052001953125, 0.07470321655273438, 0.07735443115234375, 0.08000564575195312, 0.0826568603515625, 0.08530807495117188, 0.08795928955078125, 0.09061050415039062, 0.09326171875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 0.0, 5.0, 8.0, 2.0, 3.0, 6.0, 2.0, 5.0, 13.0, 11.0, 21.0, 24.0, 22.0, 34.0, 32.0, 39.0, 40.0, 47.0, 43.0, 52.0, 71.0, 49.0, 53.0, 47.0, 51.0, 53.0, 40.0, 32.0, 32.0, 28.0, 28.0, 20.0, 18.0, 23.0, 7.0, 8.0, 11.0, 3.0, 3.0, 5.0, 2.0, 5.0, 5.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0175628662109375, -0.01695084571838379, -0.016338825225830078, -0.015726804733276367, -0.015114784240722656, -0.014502763748168945, -0.013890743255615234, -0.013278722763061523, -0.012666702270507812, -0.012054681777954102, -0.01144266128540039, -0.01083064079284668, -0.010218620300292969, -0.009606599807739258, -0.008994579315185547, -0.008382558822631836, -0.007770538330078125, -0.007158517837524414, -0.006546497344970703, -0.005934476852416992, -0.005322456359863281, -0.00471043586730957, -0.004098415374755859, -0.0034863948822021484, -0.0028743743896484375, -0.0022623538970947266, -0.0016503334045410156, -0.0010383129119873047, -0.00042629241943359375, 0.0001857280731201172, 0.0007977485656738281, 0.001409769058227539, 0.00202178955078125, 0.002633810043334961, 0.003245830535888672, 0.003857851028442383, 0.004469871520996094, 0.005081892013549805, 0.005693912506103516, 0.0063059329986572266, 0.0069179534912109375, 0.0075299739837646484, 0.00814199447631836, 0.00875401496887207, 0.009366035461425781, 0.009978055953979492, 0.010590076446533203, 0.011202096939086914, 0.011814117431640625, 0.012426137924194336, 0.013038158416748047, 0.013650178909301758, 0.014262199401855469, 0.01487421989440918, 0.01548624038696289, 0.0160982608795166, 0.016710281372070312, 0.017322301864624023, 0.017934322357177734, 0.018546342849731445, 0.019158363342285156, 0.019770383834838867, 0.020382404327392578, 0.02099442481994629, 0.0216064453125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 11.0, 9.0, 22.0, 29.0, 29.0, 32.0, 57.0, 96.0, 109.0, 197.0, 307.0, 487.0, 828.0, 1702.0, 4010.0, 11796.0, 42259.0, 194815.0, 638600.0, 110886.0, 27962.0, 8250.0, 2926.0, 1366.0, 665.0, 407.0, 213.0, 135.0, 100.0, 67.0, 43.0, 51.0, 26.0, 16.0, 9.0, 12.0, 9.0, 7.0, 2.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.08184814453125, -0.07885456085205078, -0.07586097717285156, -0.07286739349365234, -0.06987380981445312, -0.0668802261352539, -0.06388664245605469, -0.06089305877685547, -0.05789947509765625, -0.05490589141845703, -0.05191230773925781, -0.048918724060058594, -0.045925140380859375, -0.042931556701660156, -0.03993797302246094, -0.03694438934326172, -0.0339508056640625, -0.03095722198486328, -0.027963638305664062, -0.024970054626464844, -0.021976470947265625, -0.018982887268066406, -0.015989303588867188, -0.012995719909667969, -0.01000213623046875, -0.007008552551269531, -0.0040149688720703125, -0.0010213851928710938, 0.001972198486328125, 0.004965782165527344, 0.007959365844726562, 0.010952949523925781, 0.013946533203125, 0.01694011688232422, 0.019933700561523438, 0.022927284240722656, 0.025920867919921875, 0.028914451599121094, 0.03190803527832031, 0.03490161895751953, 0.03789520263671875, 0.04088878631591797, 0.04388236999511719, 0.046875953674316406, 0.049869537353515625, 0.052863121032714844, 0.05585670471191406, 0.05885028839111328, 0.0618438720703125, 0.06483745574951172, 0.06783103942871094, 0.07082462310791016, 0.07381820678710938, 0.0768117904663086, 0.07980537414550781, 0.08279895782470703, 0.08579254150390625, 0.08878612518310547, 0.09177970886230469, 0.0947732925415039, 0.09776687622070312, 0.10076045989990234, 0.10375404357910156, 0.10674762725830078, 0.1097412109375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 9.0, 9.0, 5.0, 6.0, 16.0, 15.0, 27.0, 14.0, 18.0, 23.0, 33.0, 27.0, 37.0, 40.0, 37.0, 51.0, 48.0, 58.0, 56.0, 51.0, 52.0, 51.0, 37.0, 35.0, 33.0, 31.0, 26.0, 24.0, 20.0, 18.0, 22.0, 14.0, 11.0, 6.0, 11.0, 9.0, 1.0, 3.0, 6.0, 4.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07958984375, -0.07706356048583984, -0.07453727722167969, -0.07201099395751953, -0.06948471069335938, -0.06695842742919922, -0.06443214416503906, -0.061905860900878906, -0.05937957763671875, -0.056853294372558594, -0.05432701110839844, -0.05180072784423828, -0.049274444580078125, -0.04674816131591797, -0.04422187805175781, -0.041695594787597656, -0.0391693115234375, -0.036643028259277344, -0.03411674499511719, -0.03159046173095703, -0.029064178466796875, -0.02653789520263672, -0.024011611938476562, -0.021485328674316406, -0.01895904541015625, -0.016432762145996094, -0.013906478881835938, -0.011380195617675781, -0.008853912353515625, -0.006327629089355469, -0.0038013458251953125, -0.0012750625610351562, 0.001251220703125, 0.0037775039672851562, 0.0063037872314453125, 0.008830070495605469, 0.011356353759765625, 0.013882637023925781, 0.016408920288085938, 0.018935203552246094, 0.02146148681640625, 0.023987770080566406, 0.026514053344726562, 0.02904033660888672, 0.031566619873046875, 0.03409290313720703, 0.03661918640136719, 0.039145469665527344, 0.0416717529296875, 0.044198036193847656, 0.04672431945800781, 0.04925060272216797, 0.051776885986328125, 0.05430316925048828, 0.05682945251464844, 0.059355735778808594, 0.06188201904296875, 0.0644083023071289, 0.06693458557128906, 0.06946086883544922, 0.07198715209960938, 0.07451343536376953, 0.07703971862792969, 0.07956600189208984, 0.08209228515625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 4.0, 4.0, 12.0, 11.0, 16.0, 15.0, 18.0, 36.0, 50.0, 58.0, 102.0, 166.0, 262.0, 416.0, 648.0, 1165.0, 2013.0, 3953.0, 8286.0, 19796.0, 56535.0, 376594.0, 472795.0, 65050.0, 21838.0, 9149.0, 4285.0, 2154.0, 1213.0, 695.0, 419.0, 245.0, 188.0, 113.0, 60.0, 53.0, 39.0, 22.0, 16.0, 17.0, 13.0, 8.0, 2.0, 9.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.055938720703125, -0.05424642562866211, -0.05255413055419922, -0.05086183547973633, -0.04916954040527344, -0.04747724533081055, -0.045784950256347656, -0.044092655181884766, -0.042400360107421875, -0.040708065032958984, -0.039015769958496094, -0.0373234748840332, -0.03563117980957031, -0.03393888473510742, -0.03224658966064453, -0.03055429458618164, -0.02886199951171875, -0.02716970443725586, -0.02547740936279297, -0.023785114288330078, -0.022092819213867188, -0.020400524139404297, -0.018708229064941406, -0.017015933990478516, -0.015323638916015625, -0.013631343841552734, -0.011939048767089844, -0.010246753692626953, -0.008554458618164062, -0.006862163543701172, -0.005169868469238281, -0.0034775733947753906, -0.0017852783203125, -9.298324584960938e-05, 0.0015993118286132812, 0.003291606903076172, 0.0049839019775390625, 0.006676197052001953, 0.008368492126464844, 0.010060787200927734, 0.011753082275390625, 0.013445377349853516, 0.015137672424316406, 0.016829967498779297, 0.018522262573242188, 0.020214557647705078, 0.02190685272216797, 0.02359914779663086, 0.02529144287109375, 0.02698373794555664, 0.02867603302001953, 0.030368328094482422, 0.03206062316894531, 0.0337529182434082, 0.035445213317871094, 0.037137508392333984, 0.038829803466796875, 0.040522098541259766, 0.042214393615722656, 0.04390668869018555, 0.04559898376464844, 0.04729127883911133, 0.04898357391357422, 0.05067586898803711, 0.0523681640625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 11.0, 8.0, 16.0, 37.0, 51.0, 118.0, 169.0, 198.0, 170.0, 88.0, 63.0, 28.0, 22.0, 11.0, 6.0, 4.0, 6.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.159875869750977e-05, -7.935706526041031e-05, -7.711537182331085e-05, -7.48736783862114e-05, -7.263198494911194e-05, -7.039029151201248e-05, -6.814859807491302e-05, -6.590690463781357e-05, -6.366521120071411e-05, -6.142351776361465e-05, -5.91818243265152e-05, -5.694013088941574e-05, -5.4698437452316284e-05, -5.245674401521683e-05, -5.021505057811737e-05, -4.7973357141017914e-05, -4.573166370391846e-05, -4.3489970266819e-05, -4.1248276829719543e-05, -3.900658339262009e-05, -3.676488995552063e-05, -3.452319651842117e-05, -3.2281503081321716e-05, -3.003980964422226e-05, -2.7798116207122803e-05, -2.5556422770023346e-05, -2.331472933292389e-05, -2.1073035895824432e-05, -1.8831342458724976e-05, -1.658964902162552e-05, -1.4347955584526062e-05, -1.2106262147426605e-05, -9.864568710327148e-06, -7.622875273227692e-06, -5.381181836128235e-06, -3.139488399028778e-06, -8.977949619293213e-07, 1.3438984751701355e-06, 3.5855919122695923e-06, 5.827285349369049e-06, 8.068978786468506e-06, 1.0310672223567963e-05, 1.255236566066742e-05, 1.4794059097766876e-05, 1.7035752534866333e-05, 1.927744597196579e-05, 2.1519139409065247e-05, 2.3760832846164703e-05, 2.600252628326416e-05, 2.8244219720363617e-05, 3.0485913157463074e-05, 3.272760659456253e-05, 3.496930003166199e-05, 3.7210993468761444e-05, 3.94526869058609e-05, 4.169438034296036e-05, 4.3936073780059814e-05, 4.617776721715927e-05, 4.841946065425873e-05, 5.0661154091358185e-05, 5.290284752845764e-05, 5.51445409655571e-05, 5.7386234402656555e-05, 5.962792783975601e-05, 6.186962127685547e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 3.0, 6.0, 8.0, 9.0, 14.0, 20.0, 37.0, 39.0, 83.0, 118.0, 197.0, 289.0, 454.0, 804.0, 1510.0, 2779.0, 6218.0, 16559.0, 57549.0, 568942.0, 325672.0, 43194.0, 13305.0, 5161.0, 2416.0, 1252.0, 711.0, 436.0, 251.0, 164.0, 121.0, 73.0, 41.0, 32.0, 24.0, 16.0, 12.0, 11.0, 8.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0545654296875, -0.05260944366455078, -0.05065345764160156, -0.048697471618652344, -0.046741485595703125, -0.044785499572753906, -0.04282951354980469, -0.04087352752685547, -0.03891754150390625, -0.03696155548095703, -0.03500556945800781, -0.033049583435058594, -0.031093597412109375, -0.029137611389160156, -0.027181625366210938, -0.02522563934326172, -0.0232696533203125, -0.02131366729736328, -0.019357681274414062, -0.017401695251464844, -0.015445709228515625, -0.013489723205566406, -0.011533737182617188, -0.009577751159667969, -0.00762176513671875, -0.005665779113769531, -0.0037097930908203125, -0.0017538070678710938, 0.000202178955078125, 0.0021581649780273438, 0.0041141510009765625, 0.006070137023925781, 0.008026123046875, 0.009982109069824219, 0.011938095092773438, 0.013894081115722656, 0.015850067138671875, 0.017806053161621094, 0.019762039184570312, 0.02171802520751953, 0.02367401123046875, 0.02562999725341797, 0.027585983276367188, 0.029541969299316406, 0.031497955322265625, 0.033453941345214844, 0.03540992736816406, 0.03736591339111328, 0.0393218994140625, 0.04127788543701172, 0.04323387145996094, 0.045189857482910156, 0.047145843505859375, 0.049101829528808594, 0.05105781555175781, 0.05301380157470703, 0.05496978759765625, 0.05692577362060547, 0.05888175964355469, 0.060837745666503906, 0.06279373168945312, 0.06474971771240234, 0.06670570373535156, 0.06866168975830078, 0.07061767578125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 4.0, 8.0, 9.0, 7.0, 10.0, 12.0, 25.0, 23.0, 38.0, 46.0, 75.0, 127.0, 187.0, 131.0, 87.0, 48.0, 36.0, 29.0, 24.0, 10.0, 7.0, 9.0, 8.0, 10.0, 6.0, 2.0, 3.0, 1.0, 2.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.045379638671875, -0.0439448356628418, -0.042510032653808594, -0.04107522964477539, -0.03964042663574219, -0.038205623626708984, -0.03677082061767578, -0.03533601760864258, -0.033901214599609375, -0.03246641159057617, -0.03103160858154297, -0.029596805572509766, -0.028162002563476562, -0.02672719955444336, -0.025292396545410156, -0.023857593536376953, -0.02242279052734375, -0.020987987518310547, -0.019553184509277344, -0.01811838150024414, -0.016683578491210938, -0.015248775482177734, -0.013813972473144531, -0.012379169464111328, -0.010944366455078125, -0.009509563446044922, -0.008074760437011719, -0.006639957427978516, -0.0052051544189453125, -0.0037703514099121094, -0.0023355484008789062, -0.0009007453918457031, 0.0005340576171875, 0.001968860626220703, 0.0034036636352539062, 0.004838466644287109, 0.0062732696533203125, 0.007708072662353516, 0.009142875671386719, 0.010577678680419922, 0.012012481689453125, 0.013447284698486328, 0.014882087707519531, 0.016316890716552734, 0.017751693725585938, 0.01918649673461914, 0.020621299743652344, 0.022056102752685547, 0.02349090576171875, 0.024925708770751953, 0.026360511779785156, 0.02779531478881836, 0.029230117797851562, 0.030664920806884766, 0.03209972381591797, 0.03353452682495117, 0.034969329833984375, 0.03640413284301758, 0.03783893585205078, 0.039273738861083984, 0.04070854187011719, 0.04214334487915039, 0.043578147888183594, 0.0450129508972168, 0.04644775390625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 9.0, 9.0, 54.0, 154.0, 294.0, 287.0, 149.0, 39.0, 10.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.5535879135131836, -2.5014238357543945, -2.4492597579956055, -2.3970954418182373, -2.3449313640594482, -2.292767286300659, -2.24060320854187, -2.188438892364502, -2.136274814605713, -2.084110736846924, -2.0319466590881348, -1.9797824621200562, -1.9276182651519775, -1.8754541873931885, -1.8232901096343994, -1.7711259126663208, -1.7189618349075317, -1.6667977571487427, -1.614633560180664, -1.562469482421875, -1.5103052854537964, -1.4581412076950073, -1.4059770107269287, -1.3538129329681396, -1.3016488552093506, -1.2494847774505615, -1.197320580482483, -1.1451565027236938, -1.0929923057556152, -1.0408282279968262, -0.9886640906333923, -0.9364999532699585, -0.8843357563018799, -0.832171618938446, -0.7800074815750122, -0.7278434038162231, -0.6756792068481445, -0.6235151290893555, -0.5713509917259216, -0.5191868543624878, -0.46702271699905396, -0.4148585796356201, -0.3626944422721863, -0.31053033471107483, -0.258366197347641, -0.20620205998420715, -0.1540379524230957, -0.10187381505966187, -0.04970967769622803, 0.0024544522166252136, 0.054618582129478455, 0.1067827045917511, 0.15894684195518494, 0.21111097931861877, 0.2632750868797302, 0.31543922424316406, 0.3676033616065979, 0.41976749897003174, 0.4719316363334656, 0.5240957736968994, 0.5762598514556885, 0.6284240484237671, 0.6805881261825562, 0.73275226354599, 0.7849164009094238]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 1.0, 4.0, 6.0, 4.0, 8.0, 8.0, 16.0, 17.0, 20.0, 21.0, 18.0, 35.0, 21.0, 40.0, 41.0, 38.0, 41.0, 41.0, 36.0, 42.0, 35.0, 46.0, 41.0, 51.0, 55.0, 45.0, 35.0, 43.0, 27.0, 25.0, 19.0, 21.0, 15.0, 18.0, 14.0, 10.0, 13.0, 7.0, 7.0, 6.0, 4.0, 3.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36976349353790283, -0.3567947745323181, -0.3438260555267334, -0.3308573365211487, -0.31788861751556396, -0.30491989850997925, -0.29195117950439453, -0.2789824604988098, -0.2660137414932251, -0.2530450224876404, -0.24007630348205566, -0.22710758447647095, -0.21413886547088623, -0.2011701464653015, -0.1882014274597168, -0.17523270845413208, -0.16226397454738617, -0.14929525554180145, -0.13632653653621674, -0.12335781753063202, -0.1103890985250473, -0.09742037206888199, -0.08445165306329727, -0.07148293405771255, -0.05851421505212784, -0.04554549604654312, -0.032576777040958405, -0.01960805431008339, -0.0066393353044986725, 0.006329387426376343, 0.01929810643196106, 0.032266825437545776, 0.04523554444313049, 0.05820426344871521, 0.07117298245429993, 0.08414170145988464, 0.09711042046546936, 0.11007914692163467, 0.12304786592721939, 0.1360165774822235, 0.14898529648780823, 0.16195401549339294, 0.17492273449897766, 0.18789145350456238, 0.2008601725101471, 0.2138288915157318, 0.22679761052131653, 0.23976632952690125, 0.25273507833480835, 0.26570379734039307, 0.2786725163459778, 0.2916412353515625, 0.3046099543571472, 0.31757867336273193, 0.33054739236831665, 0.34351611137390137, 0.3564848303794861, 0.3694535493850708, 0.3824222683906555, 0.39539098739624023, 0.40835970640182495, 0.42132842540740967, 0.4342971444129944, 0.4472658634185791, 0.4602345824241638]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 7.0, 4.0, 12.0, 14.0, 24.0, 31.0, 58.0, 94.0, 110.0, 175.0, 302.0, 426.0, 725.0, 1201.0, 1877.0, 3351.0, 6361.0, 12574.0, 29478.0, 88837.0, 628344.0, 3208204.0, 137802.0, 40268.0, 15863.0, 7774.0, 4062.0, 2296.0, 1425.0, 878.0, 569.0, 378.0, 258.0, 144.0, 115.0, 72.0, 58.0, 31.0, 25.0, 17.0, 13.0, 7.0, 9.0, 6.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06707763671875, -0.06477737426757812, -0.06247711181640625, -0.060176849365234375, -0.0578765869140625, -0.055576324462890625, -0.05327606201171875, -0.050975799560546875, -0.048675537109375, -0.046375274658203125, -0.04407501220703125, -0.041774749755859375, -0.0394744873046875, -0.037174224853515625, -0.03487396240234375, -0.032573699951171875, -0.0302734375, -0.027973175048828125, -0.02567291259765625, -0.023372650146484375, -0.0210723876953125, -0.018772125244140625, -0.01647186279296875, -0.014171600341796875, -0.011871337890625, -0.009571075439453125, -0.00727081298828125, -0.004970550537109375, -0.0026702880859375, -0.000370025634765625, 0.00193023681640625, 0.004230499267578125, 0.00653076171875, 0.008831024169921875, 0.01113128662109375, 0.013431549072265625, 0.0157318115234375, 0.018032073974609375, 0.02033233642578125, 0.022632598876953125, 0.024932861328125, 0.027233123779296875, 0.02953338623046875, 0.031833648681640625, 0.0341339111328125, 0.036434173583984375, 0.03873443603515625, 0.041034698486328125, 0.0433349609375, 0.045635223388671875, 0.04793548583984375, 0.050235748291015625, 0.0525360107421875, 0.054836273193359375, 0.05713653564453125, 0.059436798095703125, 0.061737060546875, 0.06403732299804688, 0.06633758544921875, 0.06863784790039062, 0.0709381103515625, 0.07323837280273438, 0.07553863525390625, 0.07783889770507812, 0.08013916015625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 7.0, 2.0, 2.0, 7.0, 6.0, 8.0, 6.0, 17.0, 14.0, 21.0, 25.0, 41.0, 35.0, 39.0, 49.0, 61.0, 39.0, 56.0, 71.0, 54.0, 57.0, 45.0, 48.0, 52.0, 44.0, 33.0, 35.0, 28.0, 18.0, 23.0, 14.0, 12.0, 11.0, 4.0, 9.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015869140625, -0.015159845352172852, -0.014450550079345703, -0.013741254806518555, -0.013031959533691406, -0.012322664260864258, -0.01161336898803711, -0.010904073715209961, -0.010194778442382812, -0.009485483169555664, -0.008776187896728516, -0.008066892623901367, -0.007357597351074219, -0.00664830207824707, -0.005939006805419922, -0.0052297115325927734, -0.004520416259765625, -0.0038111209869384766, -0.003101825714111328, -0.0023925304412841797, -0.0016832351684570312, -0.0009739398956298828, -0.0002646446228027344, 0.00044465065002441406, 0.0011539459228515625, 0.001863241195678711, 0.0025725364685058594, 0.003281831741333008, 0.003991127014160156, 0.004700422286987305, 0.005409717559814453, 0.0061190128326416016, 0.00682830810546875, 0.0075376033782958984, 0.008246898651123047, 0.008956193923950195, 0.009665489196777344, 0.010374784469604492, 0.01108407974243164, 0.011793375015258789, 0.012502670288085938, 0.013211965560913086, 0.013921260833740234, 0.014630556106567383, 0.015339851379394531, 0.01604914665222168, 0.016758441925048828, 0.017467737197875977, 0.018177032470703125, 0.018886327743530273, 0.019595623016357422, 0.02030491828918457, 0.02101421356201172, 0.021723508834838867, 0.022432804107666016, 0.023142099380493164, 0.023851394653320312, 0.02456068992614746, 0.02526998519897461, 0.025979280471801758, 0.026688575744628906, 0.027397871017456055, 0.028107166290283203, 0.02881646156311035, 0.0295257568359375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 8.0, 9.0, 20.0, 14.0, 27.0, 44.0, 59.0, 133.0, 163.0, 257.0, 449.0, 749.0, 1354.0, 2465.0, 4679.0, 9077.0, 19332.0, 47862.0, 159069.0, 2491786.0, 1240920.0, 136003.0, 42958.0, 18162.0, 8776.0, 4342.0, 2344.0, 1294.0, 765.0, 429.0, 272.0, 190.0, 76.0, 66.0, 47.0, 29.0, 21.0, 15.0, 8.0, 7.0, 0.0, 5.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.063720703125, -0.061440467834472656, -0.05916023254394531, -0.05687999725341797, -0.054599761962890625, -0.05231952667236328, -0.05003929138183594, -0.047759056091308594, -0.04547882080078125, -0.043198585510253906, -0.04091835021972656, -0.03863811492919922, -0.036357879638671875, -0.03407764434814453, -0.03179740905761719, -0.029517173767089844, -0.0272369384765625, -0.024956703186035156, -0.022676467895507812, -0.02039623260498047, -0.018115997314453125, -0.01583576202392578, -0.013555526733398438, -0.011275291442871094, -0.00899505615234375, -0.006714820861816406, -0.0044345855712890625, -0.0021543502807617188, 0.000125885009765625, 0.0024061203002929688, 0.0046863555908203125, 0.006966590881347656, 0.009246826171875, 0.011527061462402344, 0.013807296752929688, 0.01608753204345703, 0.018367767333984375, 0.02064800262451172, 0.022928237915039062, 0.025208473205566406, 0.02748870849609375, 0.029768943786621094, 0.03204917907714844, 0.03432941436767578, 0.036609649658203125, 0.03888988494873047, 0.04117012023925781, 0.043450355529785156, 0.0457305908203125, 0.048010826110839844, 0.05029106140136719, 0.05257129669189453, 0.054851531982421875, 0.05713176727294922, 0.05941200256347656, 0.061692237854003906, 0.06397247314453125, 0.0662527084350586, 0.06853294372558594, 0.07081317901611328, 0.07309341430664062, 0.07537364959716797, 0.07765388488769531, 0.07993412017822266, 0.08221435546875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 7.0, 8.0, 13.0, 15.0, 24.0, 31.0, 43.0, 65.0, 123.0, 246.0, 690.0, 1881.0, 426.0, 193.0, 91.0, 66.0, 37.0, 30.0, 21.0, 15.0, 14.0, 12.0, 8.0, 6.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.047454833984375, -0.04602956771850586, -0.04460430145263672, -0.04317903518676758, -0.04175376892089844, -0.0403285026550293, -0.038903236389160156, -0.037477970123291016, -0.036052703857421875, -0.034627437591552734, -0.033202171325683594, -0.03177690505981445, -0.030351638793945312, -0.028926372528076172, -0.02750110626220703, -0.02607583999633789, -0.02465057373046875, -0.02322530746459961, -0.02180004119873047, -0.020374774932861328, -0.018949508666992188, -0.017524242401123047, -0.016098976135253906, -0.014673709869384766, -0.013248443603515625, -0.011823177337646484, -0.010397911071777344, -0.008972644805908203, -0.0075473785400390625, -0.006122112274169922, -0.004696846008300781, -0.0032715797424316406, -0.0018463134765625, -0.0004210472106933594, 0.0010042190551757812, 0.002429485321044922, 0.0038547515869140625, 0.005280017852783203, 0.006705284118652344, 0.008130550384521484, 0.009555816650390625, 0.010981082916259766, 0.012406349182128906, 0.013831615447998047, 0.015256881713867188, 0.016682147979736328, 0.01810741424560547, 0.01953268051147461, 0.02095794677734375, 0.02238321304321289, 0.02380847930908203, 0.025233745574951172, 0.026659011840820312, 0.028084278106689453, 0.029509544372558594, 0.030934810638427734, 0.032360076904296875, 0.033785343170166016, 0.035210609436035156, 0.0366358757019043, 0.03806114196777344, 0.03948640823364258, 0.04091167449951172, 0.04233694076538086, 0.04376220703125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 10.0, 10.0, 36.0, 70.0, 130.0, 181.0, 193.0, 153.0, 111.0, 61.0, 25.0, 17.0, 5.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.14869078993797302, -0.13735340535640717, -0.1260160207748413, -0.11467864364385605, -0.10334125906229019, -0.09200387448072433, -0.08066649734973907, -0.06932911276817322, -0.05799172818660736, -0.046654343605041504, -0.035316962748765945, -0.023979581892490387, -0.01264219731092453, -0.001304812729358673, 0.010032564401626587, 0.021369948983192444, 0.0327073335647583, 0.04404471814632416, 0.055382099002599716, 0.06671947985887527, 0.07805686444044113, 0.08939424902200699, 0.10073162615299225, 0.1120690107345581, 0.12340639531612396, 0.13474377989768982, 0.14608116447925568, 0.15741854906082153, 0.1687559187412262, 0.18009331822395325, 0.1914306879043579, 0.20276807248592377, 0.21410542726516724, 0.2254428118467331, 0.23678019642829895, 0.2481175661087036, 0.25945496559143066, 0.2707923352718353, 0.28212970495224, 0.29346710443496704, 0.3048045039176941, 0.31614187359809875, 0.3274792730808258, 0.33881664276123047, 0.3501540422439575, 0.3614914119243622, 0.37282878160476685, 0.3841661810874939, 0.39550355076789856, 0.4068409204483032, 0.4181783199310303, 0.42951568961143494, 0.440853089094162, 0.45219045877456665, 0.4635278582572937, 0.47486522793769836, 0.486202597618103, 0.4975399672985077, 0.5088773369789124, 0.5202147364616394, 0.5315521359443665, 0.5428895354270935, 0.5542268753051758, 0.5655642747879028, 0.5769016742706299]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 5.0, 7.0, 8.0, 11.0, 16.0, 27.0, 34.0, 29.0, 33.0, 28.0, 35.0, 36.0, 45.0, 35.0, 52.0, 55.0, 51.0, 53.0, 62.0, 44.0, 51.0, 42.0, 45.0, 32.0, 24.0, 28.0, 23.0, 28.0, 13.0, 16.0, 10.0, 7.0, 5.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11925679445266724, -0.11501452326774597, -0.11077225208282471, -0.10652998089790344, -0.10228770971298218, -0.09804543852806091, -0.09380317479372025, -0.08956090360879898, -0.08531863242387772, -0.08107636123895645, -0.07683409005403519, -0.07259181886911392, -0.06834955513477325, -0.06410728394985199, -0.059865012764930725, -0.05562274158000946, -0.051380470395088196, -0.04713819921016693, -0.042895928025245667, -0.0386536605656147, -0.034411389380693436, -0.03016911819577217, -0.025926848873496056, -0.02168457955121994, -0.017442308366298676, -0.013200038112699986, -0.008957767859101295, -0.0047154976055026054, -0.0004732273519039154, 0.0037690438330173492, 0.008011313155293465, 0.01225358247756958, 0.016495853662490845, 0.02073812484741211, 0.024980394169688225, 0.02922266349196434, 0.033464934676885605, 0.03770720586180687, 0.041949473321437836, 0.0461917445063591, 0.050434015691280365, 0.05467628687620163, 0.058918558061122894, 0.06316082924604416, 0.06740309298038483, 0.07164536416530609, 0.07588763535022736, 0.08012990653514862, 0.08437217772006989, 0.08861444890499115, 0.09285672008991241, 0.09709899127483368, 0.10134126245975494, 0.10558353364467621, 0.10982579737901688, 0.11406806856393814, 0.1183103397488594, 0.12255261093378067, 0.12679487466812134, 0.1310371458530426, 0.13527941703796387, 0.13952168822288513, 0.1437639594078064, 0.14800623059272766, 0.15224850177764893]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 1.0, 4.0, 7.0, 9.0, 17.0, 14.0, 38.0, 38.0, 65.0, 135.0, 237.0, 476.0, 1029.0, 2567.0, 6415.0, 17366.0, 50876.0, 229459.0, 577964.0, 110242.0, 32394.0, 11485.0, 4345.0, 1759.0, 778.0, 357.0, 183.0, 99.0, 63.0, 49.0, 32.0, 14.0, 15.0, 7.0, 4.0, 3.0, 8.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07135009765625, -0.06863689422607422, -0.06592369079589844, -0.06321048736572266, -0.060497283935546875, -0.057784080505371094, -0.05507087707519531, -0.05235767364501953, -0.04964447021484375, -0.04693126678466797, -0.04421806335449219, -0.041504859924316406, -0.038791656494140625, -0.036078453063964844, -0.03336524963378906, -0.03065204620361328, -0.0279388427734375, -0.02522563934326172, -0.022512435913085938, -0.019799232482910156, -0.017086029052734375, -0.014372825622558594, -0.011659622192382812, -0.008946418762207031, -0.00623321533203125, -0.0035200119018554688, -0.0008068084716796875, 0.0019063949584960938, 0.004619598388671875, 0.007332801818847656, 0.010046005249023438, 0.012759208679199219, 0.015472412109375, 0.01818561553955078, 0.020898818969726562, 0.023612022399902344, 0.026325225830078125, 0.029038429260253906, 0.03175163269042969, 0.03446483612060547, 0.03717803955078125, 0.03989124298095703, 0.04260444641113281, 0.045317649841308594, 0.048030853271484375, 0.050744056701660156, 0.05345726013183594, 0.05617046356201172, 0.0588836669921875, 0.06159687042236328, 0.06431007385253906, 0.06702327728271484, 0.06973648071289062, 0.0724496841430664, 0.07516288757324219, 0.07787609100341797, 0.08058929443359375, 0.08330249786376953, 0.08601570129394531, 0.0887289047241211, 0.09144210815429688, 0.09415531158447266, 0.09686851501464844, 0.09958171844482422, 0.102294921875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 7.0, 4.0, 4.0, 4.0, 6.0, 4.0, 11.0, 18.0, 24.0, 17.0, 37.0, 22.0, 26.0, 37.0, 46.0, 52.0, 38.0, 49.0, 67.0, 57.0, 49.0, 49.0, 49.0, 40.0, 46.0, 32.0, 38.0, 25.0, 28.0, 17.0, 22.0, 11.0, 10.0, 16.0, 8.0, 9.0, 5.0, 7.0, 4.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0184173583984375, -0.017778873443603516, -0.01714038848876953, -0.016501903533935547, -0.015863418579101562, -0.015224933624267578, -0.014586448669433594, -0.01394796371459961, -0.013309478759765625, -0.01267099380493164, -0.012032508850097656, -0.011394023895263672, -0.010755538940429688, -0.010117053985595703, -0.009478569030761719, -0.008840084075927734, -0.00820159912109375, -0.007563114166259766, -0.006924629211425781, -0.006286144256591797, -0.0056476593017578125, -0.005009174346923828, -0.004370689392089844, -0.0037322044372558594, -0.003093719482421875, -0.0024552345275878906, -0.0018167495727539062, -0.0011782646179199219, -0.0005397796630859375, 9.870529174804688e-05, 0.0007371902465820312, 0.0013756752014160156, 0.00201416015625, 0.0026526451110839844, 0.0032911300659179688, 0.003929615020751953, 0.0045680999755859375, 0.005206584930419922, 0.005845069885253906, 0.006483554840087891, 0.007122039794921875, 0.007760524749755859, 0.008399009704589844, 0.009037494659423828, 0.009675979614257812, 0.010314464569091797, 0.010952949523925781, 0.011591434478759766, 0.01222991943359375, 0.012868404388427734, 0.013506889343261719, 0.014145374298095703, 0.014783859252929688, 0.015422344207763672, 0.016060829162597656, 0.01669931411743164, 0.017337799072265625, 0.01797628402709961, 0.018614768981933594, 0.019253253936767578, 0.019891738891601562, 0.020530223846435547, 0.02116870880126953, 0.021807193756103516, 0.0224456787109375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 5.0, 3.0, 3.0, 4.0, 7.0, 5.0, 5.0, 14.0, 11.0, 16.0, 31.0, 37.0, 58.0, 93.0, 145.0, 256.0, 464.0, 844.0, 1947.0, 4356.0, 10931.0, 29395.0, 96361.0, 629253.0, 204077.0, 43211.0, 15706.0, 6100.0, 2628.0, 1132.0, 591.0, 321.0, 186.0, 112.0, 71.0, 55.0, 34.0, 21.0, 16.0, 15.0, 10.0, 11.0, 1.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.09130859375, -0.08859825134277344, -0.08588790893554688, -0.08317756652832031, -0.08046722412109375, -0.07775688171386719, -0.07504653930664062, -0.07233619689941406, -0.0696258544921875, -0.06691551208496094, -0.06420516967773438, -0.06149482727050781, -0.05878448486328125, -0.05607414245605469, -0.053363800048828125, -0.05065345764160156, -0.047943115234375, -0.04523277282714844, -0.042522430419921875, -0.03981208801269531, -0.03710174560546875, -0.03439140319824219, -0.031681060791015625, -0.028970718383789062, -0.0262603759765625, -0.023550033569335938, -0.020839691162109375, -0.018129348754882812, -0.01541900634765625, -0.012708663940429688, -0.009998321533203125, -0.0072879791259765625, -0.00457763671875, -0.0018672943115234375, 0.000843048095703125, 0.0035533905029296875, 0.00626373291015625, 0.008974075317382812, 0.011684417724609375, 0.014394760131835938, 0.0171051025390625, 0.019815444946289062, 0.022525787353515625, 0.025236129760742188, 0.02794647216796875, 0.030656814575195312, 0.033367156982421875, 0.03607749938964844, 0.038787841796875, 0.04149818420410156, 0.044208526611328125, 0.04691886901855469, 0.04962921142578125, 0.05233955383300781, 0.055049896240234375, 0.05776023864746094, 0.0604705810546875, 0.06318092346191406, 0.06589126586914062, 0.06860160827636719, 0.07131195068359375, 0.07402229309082031, 0.07673263549804688, 0.07944297790527344, 0.0821533203125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 6.0, 7.0, 5.0, 13.0, 8.0, 16.0, 19.0, 23.0, 31.0, 46.0, 58.0, 57.0, 58.0, 66.0, 68.0, 73.0, 45.0, 57.0, 61.0, 62.0, 37.0, 38.0, 30.0, 24.0, 15.0, 22.0, 12.0, 10.0, 10.0, 6.0, 4.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11737060546875, -0.1137704849243164, -0.11017036437988281, -0.10657024383544922, -0.10297012329101562, -0.09937000274658203, -0.09576988220214844, -0.09216976165771484, -0.08856964111328125, -0.08496952056884766, -0.08136940002441406, -0.07776927947998047, -0.07416915893554688, -0.07056903839111328, -0.06696891784667969, -0.0633687973022461, -0.0597686767578125, -0.056168556213378906, -0.05256843566894531, -0.04896831512451172, -0.045368194580078125, -0.04176807403564453, -0.03816795349121094, -0.034567832946777344, -0.03096771240234375, -0.027367591857910156, -0.023767471313476562, -0.02016735076904297, -0.016567230224609375, -0.012967109680175781, -0.009366989135742188, -0.005766868591308594, -0.002166748046875, 0.0014333724975585938, 0.0050334930419921875, 0.008633613586425781, 0.012233734130859375, 0.01583385467529297, 0.019433975219726562, 0.023034095764160156, 0.02663421630859375, 0.030234336853027344, 0.03383445739746094, 0.03743457794189453, 0.041034698486328125, 0.04463481903076172, 0.04823493957519531, 0.051835060119628906, 0.0554351806640625, 0.059035301208496094, 0.06263542175292969, 0.06623554229736328, 0.06983566284179688, 0.07343578338623047, 0.07703590393066406, 0.08063602447509766, 0.08423614501953125, 0.08783626556396484, 0.09143638610839844, 0.09503650665283203, 0.09863662719726562, 0.10223674774169922, 0.10583686828613281, 0.1094369888305664, 0.113037109375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 8.0, 5.0, 16.0, 14.0, 29.0, 31.0, 61.0, 67.0, 93.0, 128.0, 217.0, 301.0, 431.0, 752.0, 1166.0, 2052.0, 3795.0, 8838.0, 23927.0, 96725.0, 689110.0, 165999.0, 32836.0, 11130.0, 4804.0, 2371.0, 1335.0, 765.0, 559.0, 333.0, 188.0, 140.0, 106.0, 71.0, 44.0, 34.0, 30.0, 18.0, 10.0, 4.0, 2.0, 8.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048675537109375, -0.047086238861083984, -0.04549694061279297, -0.04390764236450195, -0.04231834411621094, -0.04072904586791992, -0.039139747619628906, -0.03755044937133789, -0.035961151123046875, -0.03437185287475586, -0.032782554626464844, -0.031193256378173828, -0.029603958129882812, -0.028014659881591797, -0.02642536163330078, -0.024836063385009766, -0.02324676513671875, -0.021657466888427734, -0.02006816864013672, -0.018478870391845703, -0.016889572143554688, -0.015300273895263672, -0.013710975646972656, -0.01212167739868164, -0.010532379150390625, -0.00894308090209961, -0.007353782653808594, -0.005764484405517578, -0.0041751861572265625, -0.002585887908935547, -0.0009965896606445312, 0.0005927085876464844, 0.0021820068359375, 0.0037713050842285156, 0.005360603332519531, 0.006949901580810547, 0.008539199829101562, 0.010128498077392578, 0.011717796325683594, 0.01330709457397461, 0.014896392822265625, 0.01648569107055664, 0.018074989318847656, 0.019664287567138672, 0.021253585815429688, 0.022842884063720703, 0.02443218231201172, 0.026021480560302734, 0.02761077880859375, 0.029200077056884766, 0.03078937530517578, 0.0323786735534668, 0.03396797180175781, 0.03555727005004883, 0.037146568298339844, 0.03873586654663086, 0.040325164794921875, 0.04191446304321289, 0.043503761291503906, 0.04509305953979492, 0.04668235778808594, 0.04827165603637695, 0.04986095428466797, 0.051450252532958984, 0.05303955078125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 8.0, 6.0, 13.0, 17.0, 29.0, 55.0, 77.0, 111.0, 177.0, 142.0, 143.0, 91.0, 55.0, 25.0, 15.0, 7.0, 11.0, 7.0, 8.0, 8.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.036592483520508e-05, -4.874635487794876e-05, -4.7126784920692444e-05, -4.550721496343613e-05, -4.388764500617981e-05, -4.226807504892349e-05, -4.0648505091667175e-05, -3.902893513441086e-05, -3.740936517715454e-05, -3.5789795219898224e-05, -3.417022526264191e-05, -3.255065530538559e-05, -3.093108534812927e-05, -2.9311515390872955e-05, -2.7691945433616638e-05, -2.607237547636032e-05, -2.4452805519104004e-05, -2.2833235561847687e-05, -2.121366560459137e-05, -1.9594095647335052e-05, -1.7974525690078735e-05, -1.6354955732822418e-05, -1.4735385775566101e-05, -1.3115815818309784e-05, -1.1496245861053467e-05, -9.87667590379715e-06, -8.257105946540833e-06, -6.637535989284515e-06, -5.017966032028198e-06, -3.398396074771881e-06, -1.778826117515564e-06, -1.5925616025924683e-07, 1.4603137969970703e-06, 3.0798837542533875e-06, 4.699453711509705e-06, 6.319023668766022e-06, 7.938593626022339e-06, 9.558163583278656e-06, 1.1177733540534973e-05, 1.279730349779129e-05, 1.4416873455047607e-05, 1.6036443412303925e-05, 1.7656013369560242e-05, 1.927558332681656e-05, 2.0895153284072876e-05, 2.2514723241329193e-05, 2.413429319858551e-05, 2.5753863155841827e-05, 2.7373433113098145e-05, 2.899300307035446e-05, 3.061257302761078e-05, 3.2232142984867096e-05, 3.385171294212341e-05, 3.547128289937973e-05, 3.709085285663605e-05, 3.8710422813892365e-05, 4.032999277114868e-05, 4.1949562728405e-05, 4.3569132685661316e-05, 4.518870264291763e-05, 4.680827260017395e-05, 4.842784255743027e-05, 5.0047412514686584e-05, 5.16669824719429e-05, 5.328655242919922e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 10.0, 5.0, 8.0, 17.0, 22.0, 23.0, 38.0, 79.0, 114.0, 207.0, 389.0, 902.0, 2444.0, 7322.0, 34522.0, 718804.0, 254899.0, 20190.0, 5154.0, 1879.0, 792.0, 325.0, 148.0, 91.0, 58.0, 39.0, 24.0, 21.0, 7.0, 13.0, 4.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08721923828125, -0.08448123931884766, -0.08174324035644531, -0.07900524139404297, -0.07626724243164062, -0.07352924346923828, -0.07079124450683594, -0.0680532455444336, -0.06531524658203125, -0.0625772476196289, -0.05983924865722656, -0.05710124969482422, -0.054363250732421875, -0.05162525177001953, -0.04888725280761719, -0.046149253845214844, -0.0434112548828125, -0.040673255920410156, -0.03793525695800781, -0.03519725799560547, -0.032459259033203125, -0.02972126007080078, -0.026983261108398438, -0.024245262145996094, -0.02150726318359375, -0.018769264221191406, -0.016031265258789062, -0.013293266296386719, -0.010555267333984375, -0.007817268371582031, -0.0050792694091796875, -0.0023412704467773438, 0.000396728515625, 0.0031347274780273438, 0.0058727264404296875, 0.008610725402832031, 0.011348724365234375, 0.014086723327636719, 0.016824722290039062, 0.019562721252441406, 0.02230072021484375, 0.025038719177246094, 0.027776718139648438, 0.03051471710205078, 0.033252716064453125, 0.03599071502685547, 0.03872871398925781, 0.041466712951660156, 0.0442047119140625, 0.046942710876464844, 0.04968070983886719, 0.05241870880126953, 0.055156707763671875, 0.05789470672607422, 0.06063270568847656, 0.0633707046508789, 0.06610870361328125, 0.0688467025756836, 0.07158470153808594, 0.07432270050048828, 0.07706069946289062, 0.07979869842529297, 0.08253669738769531, 0.08527469635009766, 0.0880126953125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 4.0, 4.0, 9.0, 6.0, 16.0, 14.0, 22.0, 47.0, 88.0, 147.0, 211.0, 172.0, 89.0, 67.0, 32.0, 15.0, 8.0, 11.0, 4.0, 6.0, 7.0, 5.0, 1.0, 1.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.072265625, -0.07039642333984375, -0.0685272216796875, -0.06665802001953125, -0.064788818359375, -0.06291961669921875, -0.0610504150390625, -0.05918121337890625, -0.05731201171875, -0.05544281005859375, -0.0535736083984375, -0.05170440673828125, -0.049835205078125, -0.04796600341796875, -0.0460968017578125, -0.04422760009765625, -0.0423583984375, -0.04048919677734375, -0.0386199951171875, -0.03675079345703125, -0.034881591796875, -0.03301239013671875, -0.0311431884765625, -0.02927398681640625, -0.02740478515625, -0.02553558349609375, -0.0236663818359375, -0.02179718017578125, -0.019927978515625, -0.01805877685546875, -0.0161895751953125, -0.01432037353515625, -0.012451171875, -0.01058197021484375, -0.0087127685546875, -0.00684356689453125, -0.004974365234375, -0.00310516357421875, -0.0012359619140625, 0.00063323974609375, 0.00250244140625, 0.00437164306640625, 0.0062408447265625, 0.00811004638671875, 0.009979248046875, 0.01184844970703125, 0.0137176513671875, 0.01558685302734375, 0.0174560546875, 0.01932525634765625, 0.0211944580078125, 0.02306365966796875, 0.024932861328125, 0.02680206298828125, 0.0286712646484375, 0.03054046630859375, 0.03240966796875, 0.03427886962890625, 0.0361480712890625, 0.03801727294921875, 0.039886474609375, 0.04175567626953125, 0.0436248779296875, 0.04549407958984375, 0.04736328125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 7.0, 28.0, 38.0, 87.0, 158.0, 237.0, 203.0, 113.0, 84.0, 33.0, 13.0, 6.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9615683555603027, -0.9269771575927734, -0.8923859596252441, -0.8577947616577148, -0.8232035636901855, -0.7886123657226562, -0.754021167755127, -0.7194299697875977, -0.6848387718200684, -0.6502475738525391, -0.6156563758850098, -0.5810651779174805, -0.5464739799499512, -0.5118827819824219, -0.4772915840148926, -0.4427003860473633, -0.408109188079834, -0.3735179901123047, -0.3389267921447754, -0.3043355941772461, -0.2697443962097168, -0.2351531982421875, -0.2005620002746582, -0.1659708023071289, -0.1313796043395996, -0.09678840637207031, -0.062197208404541016, -0.02760601043701172, 0.006985187530517578, 0.041576385498046875, 0.07616758346557617, 0.11075878143310547, 0.14534986019134521, 0.1799410581588745, 0.2145322561264038, 0.2491234540939331, 0.2837146520614624, 0.3183058500289917, 0.352897047996521, 0.3874882459640503, 0.4220794439315796, 0.4566706418991089, 0.4912618398666382, 0.5258530378341675, 0.5604442358016968, 0.5950354337692261, 0.6296266317367554, 0.6642178297042847, 0.698809027671814, 0.7334002256393433, 0.7679914236068726, 0.8025826215744019, 0.8371738195419312, 0.8717650175094604, 0.9063562154769897, 0.940947413444519, 0.9755386114120483, 1.0101298093795776, 1.044721007347107, 1.0793122053146362, 1.1139034032821655, 1.1484946012496948, 1.1830857992172241, 1.2176769971847534, 1.2522681951522827]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 4.0, 5.0, 2.0, 8.0, 9.0, 15.0, 10.0, 19.0, 9.0, 11.0, 21.0, 23.0, 23.0, 24.0, 24.0, 35.0, 32.0, 41.0, 34.0, 42.0, 40.0, 43.0, 34.0, 39.0, 47.0, 46.0, 33.0, 43.0, 34.0, 27.0, 25.0, 23.0, 22.0, 21.0, 20.0, 23.0, 13.0, 9.0, 15.0, 8.0, 8.0, 5.0, 9.0, 4.0, 6.0, 8.0, 3.0, 0.0, 1.0, 3.0, 3.0, 0.0, 2.0], "bins": [-0.3852055072784424, -0.37379270792007446, -0.36237990856170654, -0.350967139005661, -0.3395543396472931, -0.32814154028892517, -0.31672874093055725, -0.3053159713745117, -0.2939031720161438, -0.2824903726577759, -0.27107757329940796, -0.2596648037433624, -0.2482520043849945, -0.2368392050266266, -0.22542640566825867, -0.21401362121105194, -0.20260082185268402, -0.1911880224943161, -0.17977523803710938, -0.16836243867874146, -0.15694965422153473, -0.1455368548631668, -0.13412407040596008, -0.12271127104759216, -0.11129847913980484, -0.09988568723201752, -0.0884728953242302, -0.07706010341644287, -0.06564730405807495, -0.05423451587557793, -0.042821720242500305, -0.03140892833471298, -0.01999613642692566, -0.008583343587815762, 0.002829449251294136, 0.014242243021726608, 0.02565503492951393, 0.037067826837301254, 0.048480622470378876, 0.0598934143781662, 0.07130620628595352, 0.08271899819374084, 0.09413179010152817, 0.10554458200931549, 0.11695738136768341, 0.12837016582489014, 0.13978296518325806, 0.15119576454162598, 0.1626085489988327, 0.17402134835720062, 0.18543413281440735, 0.19684693217277527, 0.208259716629982, 0.21967251598834991, 0.23108530044555664, 0.24249809980392456, 0.2539108991622925, 0.2653236985206604, 0.2767364978790283, 0.28814926743507385, 0.2995620667934418, 0.3109748661518097, 0.3223876655101776, 0.33380043506622314, 0.34521323442459106]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 7.0, 5.0, 20.0, 23.0, 21.0, 48.0, 62.0, 92.0, 168.0, 223.0, 390.0, 722.0, 1101.0, 2141.0, 4268.0, 9189.0, 22546.0, 73230.0, 644900.0, 3277758.0, 106134.0, 28944.0, 11243.0, 5045.0, 2602.0, 1341.0, 789.0, 464.0, 255.0, 189.0, 113.0, 72.0, 53.0, 33.0, 24.0, 16.0, 13.0, 6.0, 8.0, 7.0, 6.0, 4.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10296630859375, -0.09954833984375, -0.09613037109375, -0.09271240234375, -0.08929443359375, -0.08587646484375, -0.08245849609375, -0.07904052734375, -0.07562255859375, -0.07220458984375, -0.06878662109375, -0.06536865234375, -0.06195068359375, -0.05853271484375, -0.05511474609375, -0.05169677734375, -0.04827880859375, -0.04486083984375, -0.04144287109375, -0.03802490234375, -0.03460693359375, -0.03118896484375, -0.02777099609375, -0.02435302734375, -0.02093505859375, -0.01751708984375, -0.01409912109375, -0.01068115234375, -0.00726318359375, -0.00384521484375, -0.00042724609375, 0.00299072265625, 0.00640869140625, 0.00982666015625, 0.01324462890625, 0.01666259765625, 0.02008056640625, 0.02349853515625, 0.02691650390625, 0.03033447265625, 0.03375244140625, 0.03717041015625, 0.04058837890625, 0.04400634765625, 0.04742431640625, 0.05084228515625, 0.05426025390625, 0.05767822265625, 0.06109619140625, 0.06451416015625, 0.06793212890625, 0.07135009765625, 0.07476806640625, 0.07818603515625, 0.08160400390625, 0.08502197265625, 0.08843994140625, 0.09185791015625, 0.09527587890625, 0.09869384765625, 0.10211181640625, 0.10552978515625, 0.10894775390625, 0.11236572265625, 0.11578369140625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 6.0, 3.0, 10.0, 8.0, 9.0, 16.0, 14.0, 26.0, 16.0, 33.0, 28.0, 35.0, 50.0, 44.0, 56.0, 49.0, 56.0, 62.0, 53.0, 61.0, 39.0, 53.0, 49.0, 35.0, 31.0, 32.0, 29.0, 14.0, 15.0, 18.0, 4.0, 10.0, 8.0, 10.0, 8.0, 2.0, 4.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0175933837890625, -0.016881942749023438, -0.016170501708984375, -0.015459060668945312, -0.01474761962890625, -0.014036178588867188, -0.013324737548828125, -0.012613296508789062, -0.01190185546875, -0.011190414428710938, -0.010478973388671875, -0.009767532348632812, -0.00905609130859375, -0.008344650268554688, -0.007633209228515625, -0.0069217681884765625, -0.0062103271484375, -0.0054988861083984375, -0.004787445068359375, -0.0040760040283203125, -0.00336456298828125, -0.0026531219482421875, -0.001941680908203125, -0.0012302398681640625, -0.000518798828125, 0.0001926422119140625, 0.000904083251953125, 0.0016155242919921875, 0.00232696533203125, 0.0030384063720703125, 0.003749847412109375, 0.0044612884521484375, 0.0051727294921875, 0.0058841705322265625, 0.006595611572265625, 0.0073070526123046875, 0.00801849365234375, 0.008729934692382812, 0.009441375732421875, 0.010152816772460938, 0.0108642578125, 0.011575698852539062, 0.012287139892578125, 0.012998580932617188, 0.01371002197265625, 0.014421463012695312, 0.015132904052734375, 0.015844345092773438, 0.0165557861328125, 0.017267227172851562, 0.017978668212890625, 0.018690109252929688, 0.01940155029296875, 0.020112991333007812, 0.020824432373046875, 0.021535873413085938, 0.022247314453125, 0.022958755493164062, 0.023670196533203125, 0.024381637573242188, 0.02509307861328125, 0.025804519653320312, 0.026515960693359375, 0.027227401733398438, 0.0279388427734375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 7.0, 2.0, 6.0, 6.0, 12.0, 14.0, 25.0, 25.0, 31.0, 55.0, 75.0, 106.0, 162.0, 226.0, 359.0, 638.0, 1054.0, 1990.0, 3982.0, 8114.0, 18702.0, 52059.0, 209444.0, 3370290.0, 405085.0, 75245.0, 25433.0, 10554.0, 4977.0, 2340.0, 1346.0, 731.0, 445.0, 253.0, 154.0, 104.0, 67.0, 48.0, 35.0, 27.0, 17.0, 8.0, 8.0, 8.0, 9.0, 4.0, 1.0, 4.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10577392578125, -0.10232353210449219, -0.09887313842773438, -0.09542274475097656, -0.09197235107421875, -0.08852195739746094, -0.08507156372070312, -0.08162117004394531, -0.0781707763671875, -0.07472038269042969, -0.07126998901367188, -0.06781959533691406, -0.06436920166015625, -0.06091880798339844, -0.057468414306640625, -0.05401802062988281, -0.050567626953125, -0.04711723327636719, -0.043666839599609375, -0.04021644592285156, -0.03676605224609375, -0.03331565856933594, -0.029865264892578125, -0.026414871215820312, -0.0229644775390625, -0.019514083862304688, -0.016063690185546875, -0.012613296508789062, -0.00916290283203125, -0.0057125091552734375, -0.002262115478515625, 0.0011882781982421875, 0.004638671875, 0.008089065551757812, 0.011539459228515625, 0.014989852905273438, 0.01844024658203125, 0.021890640258789062, 0.025341033935546875, 0.028791427612304688, 0.0322418212890625, 0.03569221496582031, 0.039142608642578125, 0.04259300231933594, 0.04604339599609375, 0.04949378967285156, 0.052944183349609375, 0.05639457702636719, 0.059844970703125, 0.06329536437988281, 0.06674575805664062, 0.07019615173339844, 0.07364654541015625, 0.07709693908691406, 0.08054733276367188, 0.08399772644042969, 0.0874481201171875, 0.09089851379394531, 0.09434890747070312, 0.09779930114746094, 0.10124969482421875, 0.10470008850097656, 0.10815048217773438, 0.11160087585449219, 0.11505126953125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 1.0, 4.0, 6.0, 10.0, 16.0, 19.0, 41.0, 38.0, 65.0, 83.0, 134.0, 301.0, 1821.0, 895.0, 245.0, 126.0, 71.0, 50.0, 50.0, 24.0, 18.0, 8.0, 10.0, 12.0, 7.0, 2.0, 6.0, 3.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049835205078125, -0.04822063446044922, -0.04660606384277344, -0.044991493225097656, -0.043376922607421875, -0.041762351989746094, -0.04014778137207031, -0.03853321075439453, -0.03691864013671875, -0.03530406951904297, -0.03368949890136719, -0.032074928283691406, -0.030460357666015625, -0.028845787048339844, -0.027231216430664062, -0.02561664581298828, -0.0240020751953125, -0.02238750457763672, -0.020772933959960938, -0.019158363342285156, -0.017543792724609375, -0.015929222106933594, -0.014314651489257812, -0.012700080871582031, -0.01108551025390625, -0.009470939636230469, -0.007856369018554688, -0.006241798400878906, -0.004627227783203125, -0.0030126571655273438, -0.0013980865478515625, 0.00021648406982421875, 0.0018310546875, 0.0034456253051757812, 0.0050601959228515625, 0.006674766540527344, 0.008289337158203125, 0.009903907775878906, 0.011518478393554688, 0.013133049011230469, 0.01474761962890625, 0.01636219024658203, 0.017976760864257812, 0.019591331481933594, 0.021205902099609375, 0.022820472717285156, 0.024435043334960938, 0.02604961395263672, 0.0276641845703125, 0.02927875518798828, 0.030893325805664062, 0.032507896423339844, 0.034122467041015625, 0.035737037658691406, 0.03735160827636719, 0.03896617889404297, 0.04058074951171875, 0.04219532012939453, 0.04380989074707031, 0.045424461364746094, 0.047039031982421875, 0.048653602600097656, 0.05026817321777344, 0.05188274383544922, 0.053497314453125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 7.0, 5.0, 7.0, 15.0, 20.0, 53.0, 63.0, 100.0, 124.0, 144.0, 125.0, 113.0, 96.0, 51.0, 36.0, 19.0, 9.0, 14.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34678295254707336, -0.33577069640159607, -0.3247584104537964, -0.3137461543083191, -0.3027338981628418, -0.2917216420173645, -0.2807093858718872, -0.2696970999240875, -0.25868484377861023, -0.24767258763313293, -0.23666031658649445, -0.22564804553985596, -0.21463578939437866, -0.20362353324890137, -0.19261126220226288, -0.1815989911556244, -0.1705867350101471, -0.1595744788646698, -0.1485622078180313, -0.13754993677139282, -0.12653768062591553, -0.11552541702985764, -0.10451315343379974, -0.09350088983774185, -0.08248862624168396, -0.07147636264562607, -0.060464099049568176, -0.049451835453510284, -0.03843957185745239, -0.0274273082613945, -0.01641504466533661, -0.005402781069278717, 0.0056095123291015625, 0.016621775925159454, 0.027634039521217346, 0.03864630311727524, 0.04965856671333313, 0.06067083030939102, 0.07168309390544891, 0.0826953575015068, 0.0937076210975647, 0.10471988469362259, 0.11573214828968048, 0.12674441933631897, 0.13775667548179626, 0.14876893162727356, 0.15978120267391205, 0.17079347372055054, 0.18180572986602783, 0.19281798601150513, 0.20383025705814362, 0.2148425281047821, 0.2258547842502594, 0.2368670403957367, 0.24787931144237518, 0.25889158248901367, 0.26990383863449097, 0.28091609477996826, 0.29192835092544556, 0.30294063687324524, 0.31395289301872253, 0.32496514916419983, 0.3359774351119995, 0.3469896912574768, 0.3580019474029541]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 8.0, 5.0, 11.0, 8.0, 12.0, 12.0, 15.0, 13.0, 27.0, 24.0, 22.0, 22.0, 28.0, 17.0, 40.0, 29.0, 35.0, 31.0, 50.0, 41.0, 46.0, 37.0, 49.0, 33.0, 36.0, 46.0, 35.0, 27.0, 26.0, 25.0, 26.0, 28.0, 24.0, 14.0, 14.0, 13.0, 6.0, 9.0, 11.0, 5.0, 8.0, 6.0, 7.0, 7.0, 7.0, 1.0, 4.0, 0.0, 2.0], "bins": [-0.155536949634552, -0.15125305950641632, -0.14696915447711945, -0.14268526434898376, -0.1384013593196869, -0.1341174691915512, -0.12983357906341553, -0.12554967403411865, -0.12126578390598297, -0.1169818863272667, -0.11269798874855042, -0.10841409862041473, -0.10413020104169846, -0.09984630346298218, -0.0955624133348465, -0.09127851575613022, -0.08699461817741394, -0.08271072059869766, -0.07842682301998138, -0.0741429328918457, -0.06985903531312943, -0.06557513773441315, -0.06129124388098717, -0.05700735002756119, -0.05272345244884491, -0.04843955487012863, -0.04415566101670265, -0.03987176716327667, -0.035587869584560394, -0.031303972005844116, -0.027020078152418137, -0.022736182436347008, -0.01845228672027588, -0.01416839100420475, -0.009884495288133621, -0.005600599572062492, -0.0013167038559913635, 0.0029671918600797653, 0.007251087576150894, 0.011534983292222023, 0.015818879008293152, 0.02010277472436428, 0.02438667044043541, 0.02867056615650654, 0.03295446187257767, 0.037238359451293945, 0.041522253304719925, 0.045806147158145905, 0.05009004473686218, 0.05437394231557846, 0.05865783616900444, 0.06294173002243042, 0.0672256276011467, 0.07150952517986298, 0.07579341530799866, 0.08007731288671494, 0.08436121046543121, 0.08864510804414749, 0.09292900562286377, 0.09721289575099945, 0.10149679332971573, 0.105780690908432, 0.11006458103656769, 0.11434847861528397, 0.11863237619400024]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 2.0, 7.0, 5.0, 17.0, 15.0, 17.0, 29.0, 58.0, 60.0, 114.0, 142.0, 247.0, 367.0, 634.0, 1094.0, 1857.0, 3454.0, 6297.0, 11836.0, 22768.0, 43621.0, 85845.0, 183577.0, 322907.0, 184358.0, 86831.0, 43383.0, 22349.0, 11887.0, 6429.0, 3556.0, 1921.0, 1166.0, 635.0, 375.0, 266.0, 131.0, 90.0, 62.0, 46.0, 26.0, 22.0, 20.0, 14.0, 5.0, 3.0, 6.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.065673828125, -0.06371355056762695, -0.061753273010253906, -0.05979299545288086, -0.05783271789550781, -0.055872440338134766, -0.05391216278076172, -0.05195188522338867, -0.049991607666015625, -0.04803133010864258, -0.04607105255126953, -0.044110774993896484, -0.04215049743652344, -0.04019021987915039, -0.038229942321777344, -0.0362696647644043, -0.03430938720703125, -0.0323491096496582, -0.030388832092285156, -0.02842855453491211, -0.026468276977539062, -0.024507999420166016, -0.02254772186279297, -0.020587444305419922, -0.018627166748046875, -0.016666889190673828, -0.014706611633300781, -0.012746334075927734, -0.010786056518554688, -0.00882577896118164, -0.006865501403808594, -0.004905223846435547, -0.0029449462890625, -0.0009846687316894531, 0.0009756088256835938, 0.0029358863830566406, 0.0048961639404296875, 0.006856441497802734, 0.008816719055175781, 0.010776996612548828, 0.012737274169921875, 0.014697551727294922, 0.01665782928466797, 0.018618106842041016, 0.020578384399414062, 0.02253866195678711, 0.024498939514160156, 0.026459217071533203, 0.02841949462890625, 0.030379772186279297, 0.032340049743652344, 0.03430032730102539, 0.03626060485839844, 0.038220882415771484, 0.04018115997314453, 0.04214143753051758, 0.044101715087890625, 0.04606199264526367, 0.04802227020263672, 0.049982547760009766, 0.05194282531738281, 0.05390310287475586, 0.055863380432128906, 0.05782365798950195, 0.059783935546875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 8.0, 6.0, 9.0, 7.0, 13.0, 9.0, 8.0, 16.0, 23.0, 21.0, 25.0, 16.0, 30.0, 28.0, 30.0, 42.0, 52.0, 48.0, 47.0, 36.0, 49.0, 42.0, 33.0, 41.0, 28.0, 45.0, 31.0, 33.0, 34.0, 21.0, 18.0, 24.0, 24.0, 19.0, 9.0, 11.0, 12.0, 10.0, 12.0, 6.0, 2.0, 3.0, 4.0, 3.0, 3.0, 3.0, 3.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.01678466796875, -0.016205310821533203, -0.015625953674316406, -0.01504659652709961, -0.014467239379882812, -0.013887882232666016, -0.013308525085449219, -0.012729167938232422, -0.012149810791015625, -0.011570453643798828, -0.010991096496582031, -0.010411739349365234, -0.009832382202148438, -0.00925302505493164, -0.008673667907714844, -0.008094310760498047, -0.00751495361328125, -0.006935596466064453, -0.006356239318847656, -0.005776882171630859, -0.0051975250244140625, -0.004618167877197266, -0.004038810729980469, -0.003459453582763672, -0.002880096435546875, -0.002300739288330078, -0.0017213821411132812, -0.0011420249938964844, -0.0005626678466796875, 1.6689300537109375e-05, 0.0005960464477539062, 0.0011754035949707031, 0.0017547607421875, 0.002334117889404297, 0.0029134750366210938, 0.0034928321838378906, 0.0040721893310546875, 0.004651546478271484, 0.005230903625488281, 0.005810260772705078, 0.006389617919921875, 0.006968975067138672, 0.007548332214355469, 0.008127689361572266, 0.008707046508789062, 0.00928640365600586, 0.009865760803222656, 0.010445117950439453, 0.01102447509765625, 0.011603832244873047, 0.012183189392089844, 0.01276254653930664, 0.013341903686523438, 0.013921260833740234, 0.014500617980957031, 0.015079975128173828, 0.015659332275390625, 0.016238689422607422, 0.01681804656982422, 0.017397403717041016, 0.017976760864257812, 0.01855611801147461, 0.019135475158691406, 0.019714832305908203, 0.020294189453125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 8.0, 9.0, 7.0, 14.0, 21.0, 18.0, 41.0, 62.0, 69.0, 94.0, 131.0, 160.0, 267.0, 379.0, 582.0, 1014.0, 1747.0, 3596.0, 8250.0, 20084.0, 52175.0, 142129.0, 438034.0, 244519.0, 80789.0, 30855.0, 12358.0, 5111.0, 2496.0, 1252.0, 741.0, 469.0, 285.0, 201.0, 161.0, 97.0, 95.0, 66.0, 49.0, 36.0, 16.0, 25.0, 11.0, 9.0, 6.0, 10.0, 0.0, 1.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.06939697265625, -0.06698131561279297, -0.06456565856933594, -0.062150001525878906, -0.059734344482421875, -0.057318687438964844, -0.05490303039550781, -0.05248737335205078, -0.05007171630859375, -0.04765605926513672, -0.04524040222167969, -0.042824745178222656, -0.040409088134765625, -0.037993431091308594, -0.03557777404785156, -0.03316211700439453, -0.0307464599609375, -0.02833080291748047, -0.025915145874023438, -0.023499488830566406, -0.021083831787109375, -0.018668174743652344, -0.016252517700195312, -0.013836860656738281, -0.01142120361328125, -0.009005546569824219, -0.0065898895263671875, -0.004174232482910156, -0.001758575439453125, 0.0006570816040039062, 0.0030727386474609375, 0.005488395690917969, 0.007904052734375, 0.010319709777832031, 0.012735366821289062, 0.015151023864746094, 0.017566680908203125, 0.019982337951660156, 0.022397994995117188, 0.02481365203857422, 0.02722930908203125, 0.02964496612548828, 0.03206062316894531, 0.034476280212402344, 0.036891937255859375, 0.039307594299316406, 0.04172325134277344, 0.04413890838623047, 0.0465545654296875, 0.04897022247314453, 0.05138587951660156, 0.053801536560058594, 0.056217193603515625, 0.058632850646972656, 0.06104850769042969, 0.06346416473388672, 0.06587982177734375, 0.06829547882080078, 0.07071113586425781, 0.07312679290771484, 0.07554244995117188, 0.0779581069946289, 0.08037376403808594, 0.08278942108154297, 0.085205078125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 3.0, 6.0, 6.0, 11.0, 12.0, 10.0, 8.0, 18.0, 18.0, 33.0, 39.0, 31.0, 46.0, 25.0, 44.0, 44.0, 37.0, 46.0, 44.0, 46.0, 38.0, 48.0, 54.0, 21.0, 46.0, 47.0, 39.0, 29.0, 20.0, 27.0, 17.0, 10.0, 13.0, 13.0, 14.0, 9.0, 4.0, 5.0, 7.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1044921875, -0.10136032104492188, -0.09822845458984375, -0.09509658813476562, -0.0919647216796875, -0.08883285522460938, -0.08570098876953125, -0.08256912231445312, -0.079437255859375, -0.07630538940429688, -0.07317352294921875, -0.07004165649414062, -0.0669097900390625, -0.06377792358398438, -0.06064605712890625, -0.057514190673828125, -0.05438232421875, -0.051250457763671875, -0.04811859130859375, -0.044986724853515625, -0.0418548583984375, -0.038722991943359375, -0.03559112548828125, -0.032459259033203125, -0.029327392578125, -0.026195526123046875, -0.02306365966796875, -0.019931793212890625, -0.0167999267578125, -0.013668060302734375, -0.01053619384765625, -0.007404327392578125, -0.0042724609375, -0.001140594482421875, 0.00199127197265625, 0.005123138427734375, 0.0082550048828125, 0.011386871337890625, 0.01451873779296875, 0.017650604248046875, 0.020782470703125, 0.023914337158203125, 0.02704620361328125, 0.030178070068359375, 0.0333099365234375, 0.036441802978515625, 0.03957366943359375, 0.042705535888671875, 0.04583740234375, 0.048969268798828125, 0.05210113525390625, 0.055233001708984375, 0.0583648681640625, 0.061496734619140625, 0.06462860107421875, 0.06776046752929688, 0.070892333984375, 0.07402420043945312, 0.07715606689453125, 0.08028793334960938, 0.0834197998046875, 0.08655166625976562, 0.08968353271484375, 0.09281539916992188, 0.095947265625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 5.0, 3.0, 6.0, 12.0, 13.0, 23.0, 33.0, 57.0, 109.0, 238.0, 507.0, 1266.0, 3743.0, 13626.0, 68414.0, 421708.0, 446997.0, 71331.0, 14383.0, 3790.0, 1331.0, 487.0, 220.0, 104.0, 69.0, 39.0, 20.0, 7.0, 9.0, 6.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07391357421875, -0.07160472869873047, -0.06929588317871094, -0.0669870376586914, -0.06467819213867188, -0.062369346618652344, -0.06006050109863281, -0.05775165557861328, -0.05544281005859375, -0.05313396453857422, -0.05082511901855469, -0.048516273498535156, -0.046207427978515625, -0.043898582458496094, -0.04158973693847656, -0.03928089141845703, -0.0369720458984375, -0.03466320037841797, -0.03235435485839844, -0.030045509338378906, -0.027736663818359375, -0.025427818298339844, -0.023118972778320312, -0.02081012725830078, -0.01850128173828125, -0.01619243621826172, -0.013883590698242188, -0.011574745178222656, -0.009265899658203125, -0.006957054138183594, -0.0046482086181640625, -0.0023393630981445312, -3.0517578125e-05, 0.0022783279418945312, 0.0045871734619140625, 0.006896018981933594, 0.009204864501953125, 0.011513710021972656, 0.013822555541992188, 0.01613140106201172, 0.01844024658203125, 0.02074909210205078, 0.023057937622070312, 0.025366783142089844, 0.027675628662109375, 0.029984474182128906, 0.03229331970214844, 0.03460216522216797, 0.0369110107421875, 0.03921985626220703, 0.04152870178222656, 0.043837547302246094, 0.046146392822265625, 0.048455238342285156, 0.05076408386230469, 0.05307292938232422, 0.05538177490234375, 0.05769062042236328, 0.05999946594238281, 0.062308311462402344, 0.06461715698242188, 0.0669260025024414, 0.06923484802246094, 0.07154369354248047, 0.0738525390625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 9.0, 11.0, 14.0, 20.0, 14.0, 21.0, 30.0, 37.0, 56.0, 68.0, 98.0, 91.0, 87.0, 94.0, 69.0, 61.0, 66.0, 36.0, 24.0, 22.0, 16.0, 14.0, 8.0, 9.0, 6.0, 9.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.170967102050781e-05, -3.06982547044754e-05, -2.9686838388442993e-05, -2.8675422072410583e-05, -2.7664005756378174e-05, -2.6652589440345764e-05, -2.5641173124313354e-05, -2.4629756808280945e-05, -2.3618340492248535e-05, -2.2606924176216125e-05, -2.1595507860183716e-05, -2.0584091544151306e-05, -1.9572675228118896e-05, -1.8561258912086487e-05, -1.7549842596054077e-05, -1.6538426280021667e-05, -1.5527009963989258e-05, -1.4515593647956848e-05, -1.3504177331924438e-05, -1.2492761015892029e-05, -1.1481344699859619e-05, -1.046992838382721e-05, -9.4585120677948e-06, -8.44709575176239e-06, -7.4356794357299805e-06, -6.424263119697571e-06, -5.412846803665161e-06, -4.4014304876327515e-06, -3.390014171600342e-06, -2.378597855567932e-06, -1.3671815395355225e-06, -3.557652235031128e-07, 6.556510925292969e-07, 1.6670674085617065e-06, 2.678483724594116e-06, 3.689900040626526e-06, 4.7013163566589355e-06, 5.712732672691345e-06, 6.724148988723755e-06, 7.735565304756165e-06, 8.746981620788574e-06, 9.758397936820984e-06, 1.0769814252853394e-05, 1.1781230568885803e-05, 1.2792646884918213e-05, 1.3804063200950623e-05, 1.4815479516983032e-05, 1.5826895833015442e-05, 1.683831214904785e-05, 1.784972846508026e-05, 1.886114478111267e-05, 1.987256109714508e-05, 2.088397741317749e-05, 2.18953937292099e-05, 2.290681004524231e-05, 2.391822636127472e-05, 2.492964267730713e-05, 2.594105899333954e-05, 2.6952475309371948e-05, 2.7963891625404358e-05, 2.8975307941436768e-05, 2.9986724257469177e-05, 3.099814057350159e-05, 3.2009556889533997e-05, 3.3020973205566406e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 6.0, 6.0, 9.0, 20.0, 42.0, 88.0, 210.0, 497.0, 1423.0, 5322.0, 36800.0, 470600.0, 487388.0, 38337.0, 5493.0, 1454.0, 502.0, 193.0, 74.0, 36.0, 21.0, 15.0, 9.0, 7.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12078857421875, -0.11733818054199219, -0.11388778686523438, -0.11043739318847656, -0.10698699951171875, -0.10353660583496094, -0.10008621215820312, -0.09663581848144531, -0.0931854248046875, -0.08973503112792969, -0.08628463745117188, -0.08283424377441406, -0.07938385009765625, -0.07593345642089844, -0.07248306274414062, -0.06903266906738281, -0.065582275390625, -0.06213188171386719, -0.058681488037109375, -0.05523109436035156, -0.05178070068359375, -0.04833030700683594, -0.044879913330078125, -0.04142951965332031, -0.0379791259765625, -0.03452873229980469, -0.031078338623046875, -0.027627944946289062, -0.02417755126953125, -0.020727157592773438, -0.017276763916015625, -0.013826370239257812, -0.0103759765625, -0.0069255828857421875, -0.003475189208984375, -2.47955322265625e-05, 0.00342559814453125, 0.0068759918212890625, 0.010326385498046875, 0.013776779174804688, 0.0172271728515625, 0.020677566528320312, 0.024127960205078125, 0.027578353881835938, 0.03102874755859375, 0.03447914123535156, 0.037929534912109375, 0.04137992858886719, 0.044830322265625, 0.04828071594238281, 0.051731109619140625, 0.05518150329589844, 0.05863189697265625, 0.06208229064941406, 0.06553268432617188, 0.06898307800292969, 0.0724334716796875, 0.07588386535644531, 0.07933425903320312, 0.08278465270996094, 0.08623504638671875, 0.08968544006347656, 0.09313583374023438, 0.09658622741699219, 0.10003662109375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 4.0, 5.0, 11.0, 8.0, 15.0, 17.0, 29.0, 30.0, 45.0, 48.0, 67.0, 98.0, 119.0, 132.0, 100.0, 55.0, 46.0, 43.0, 39.0, 22.0, 13.0, 13.0, 15.0, 13.0, 7.0, 3.0, 7.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.07861328125, -0.07664871215820312, -0.07468414306640625, -0.07271957397460938, -0.0707550048828125, -0.06879043579101562, -0.06682586669921875, -0.06486129760742188, -0.062896728515625, -0.060932159423828125, -0.05896759033203125, -0.057003021240234375, -0.0550384521484375, -0.053073883056640625, -0.05110931396484375, -0.049144744873046875, -0.04718017578125, -0.045215606689453125, -0.04325103759765625, -0.041286468505859375, -0.0393218994140625, -0.037357330322265625, -0.03539276123046875, -0.033428192138671875, -0.031463623046875, -0.029499053955078125, -0.02753448486328125, -0.025569915771484375, -0.0236053466796875, -0.021640777587890625, -0.01967620849609375, -0.017711639404296875, -0.0157470703125, -0.013782501220703125, -0.01181793212890625, -0.009853363037109375, -0.0078887939453125, -0.005924224853515625, -0.00395965576171875, -0.001995086669921875, -3.0517578125e-05, 0.001934051513671875, 0.00389862060546875, 0.005863189697265625, 0.0078277587890625, 0.009792327880859375, 0.01175689697265625, 0.013721466064453125, 0.01568603515625, 0.017650604248046875, 0.01961517333984375, 0.021579742431640625, 0.0235443115234375, 0.025508880615234375, 0.02747344970703125, 0.029438018798828125, 0.031402587890625, 0.033367156982421875, 0.03533172607421875, 0.037296295166015625, 0.0392608642578125, 0.041225433349609375, 0.04319000244140625, 0.045154571533203125, 0.047119140625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 16.0, 55.0, 169.0, 296.0, 288.0, 130.0, 39.0, 11.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9571785926818848, -2.8942370414733887, -2.8312954902648926, -2.7683537006378174, -2.7054121494293213, -2.642470598220825, -2.57952880859375, -2.516587257385254, -2.453645706176758, -2.3907041549682617, -2.3277626037597656, -2.2648208141326904, -2.2018792629241943, -2.1389377117156982, -2.075995922088623, -2.013054370880127, -1.9501128196716309, -1.8871712684631348, -1.8242295980453491, -1.7612879276275635, -1.6983463764190674, -1.6354048252105713, -1.5724631547927856, -1.509521484375, -1.446579933166504, -1.3836383819580078, -1.3206967115402222, -1.2577550411224365, -1.1948134899139404, -1.1318719387054443, -1.0689302682876587, -1.005988597869873, -0.9430468082427979, -0.880105197429657, -0.8171635866165161, -0.7542219758033752, -0.6912803649902344, -0.6283387541770935, -0.5653971433639526, -0.5024555325508118, -0.4395139217376709, -0.37657231092453003, -0.31363070011138916, -0.2506890892982483, -0.18774747848510742, -0.12480586767196655, -0.061864256858825684, 0.0010773539543151855, 0.06401896476745605, 0.12696057558059692, 0.1899021863937378, 0.25284379720687866, 0.31578540802001953, 0.3787270188331604, 0.44166862964630127, 0.5046102404594421, 0.567551851272583, 0.6304934620857239, 0.6934350728988647, 0.7563766837120056, 0.8193182945251465, 0.8822599053382874, 0.9452015161514282, 1.0081431865692139, 1.07108473777771]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 6.0, 9.0, 5.0, 14.0, 16.0, 14.0, 20.0, 19.0, 22.0, 31.0, 34.0, 38.0, 37.0, 23.0, 47.0, 40.0, 62.0, 64.0, 55.0, 30.0, 53.0, 41.0, 29.0, 38.0, 39.0, 28.0, 27.0, 24.0, 20.0, 13.0, 16.0, 13.0, 11.0, 12.0, 10.0, 6.0, 8.0, 4.0, 4.0, 6.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.5803826451301575, -0.5642767548561096, -0.548170804977417, -0.5320649147033691, -0.5159590244293213, -0.49985307455062866, -0.4837471842765808, -0.46764126420021057, -0.45153534412384033, -0.4354294240474701, -0.41932350397109985, -0.403217613697052, -0.38711169362068176, -0.3710057735443115, -0.35489988327026367, -0.33879396319389343, -0.3226880431175232, -0.30658212304115295, -0.2904762029647827, -0.27437031269073486, -0.2582643926143646, -0.24215847253799438, -0.22605256736278534, -0.2099466621875763, -0.19384074211120605, -0.17773482203483582, -0.16162891685962677, -0.14552301168441772, -0.12941709160804749, -0.11331117898225784, -0.0972052663564682, -0.08109935373067856, -0.06499338150024414, -0.0488874688744545, -0.032781556248664856, -0.016675643622875214, -0.0005697309970855713, 0.015536181628704071, 0.03164209425449371, 0.047748006880283356, 0.063853919506073, 0.07995983213186264, 0.09606574475765228, 0.11217165738344193, 0.12827757000923157, 0.1443834900856018, 0.16048939526081085, 0.1765953004360199, 0.19270122051239014, 0.20880714058876038, 0.22491304576396942, 0.24101895093917847, 0.2571248710155487, 0.27323079109191895, 0.2893366813659668, 0.30544260144233704, 0.3215485215187073, 0.3376544415950775, 0.35376036167144775, 0.3698662519454956, 0.38597217202186584, 0.4020780920982361, 0.41818398237228394, 0.4342899024486542, 0.4503958225250244]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 4.0, 6.0, 9.0, 13.0, 11.0, 18.0, 37.0, 54.0, 83.0, 122.0, 183.0, 295.0, 513.0, 961.0, 1773.0, 3700.0, 7951.0, 20058.0, 66287.0, 559884.0, 3360481.0, 120431.0, 29728.0, 11248.0, 5066.0, 2376.0, 1243.0, 664.0, 394.0, 228.0, 159.0, 78.0, 68.0, 54.0, 31.0, 15.0, 15.0, 10.0, 7.0, 7.0, 4.0, 4.0, 5.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.1329345703125, -0.12904644012451172, -0.12515830993652344, -0.12127017974853516, -0.11738204956054688, -0.1134939193725586, -0.10960578918457031, -0.10571765899658203, -0.10182952880859375, -0.09794139862060547, -0.09405326843261719, -0.0901651382446289, -0.08627700805664062, -0.08238887786865234, -0.07850074768066406, -0.07461261749267578, -0.0707244873046875, -0.06683635711669922, -0.06294822692871094, -0.059060096740722656, -0.055171966552734375, -0.051283836364746094, -0.04739570617675781, -0.04350757598876953, -0.03961944580078125, -0.03573131561279297, -0.03184318542480469, -0.027955055236816406, -0.024066925048828125, -0.020178794860839844, -0.016290664672851562, -0.012402534484863281, -0.008514404296875, -0.004626274108886719, -0.0007381439208984375, 0.0031499862670898438, 0.007038116455078125, 0.010926246643066406, 0.014814376831054688, 0.01870250701904297, 0.02259063720703125, 0.02647876739501953, 0.030366897583007812, 0.034255027770996094, 0.038143157958984375, 0.042031288146972656, 0.04591941833496094, 0.04980754852294922, 0.0536956787109375, 0.05758380889892578, 0.06147193908691406, 0.06536006927490234, 0.06924819946289062, 0.0731363296508789, 0.07702445983886719, 0.08091259002685547, 0.08480072021484375, 0.08868885040283203, 0.09257698059082031, 0.0964651107788086, 0.10035324096679688, 0.10424137115478516, 0.10812950134277344, 0.11201763153076172, 0.11590576171875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 6.0, 3.0, 1.0, 12.0, 7.0, 6.0, 14.0, 19.0, 19.0, 14.0, 19.0, 24.0, 26.0, 30.0, 29.0, 47.0, 40.0, 46.0, 46.0, 39.0, 46.0, 51.0, 46.0, 46.0, 49.0, 39.0, 36.0, 33.0, 28.0, 23.0, 19.0, 18.0, 22.0, 16.0, 15.0, 18.0, 10.0, 5.0, 11.0, 6.0, 6.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0202484130859375, -0.019598960876464844, -0.018949508666992188, -0.01830005645751953, -0.017650604248046875, -0.01700115203857422, -0.016351699829101562, -0.015702247619628906, -0.01505279541015625, -0.014403343200683594, -0.013753890991210938, -0.013104438781738281, -0.012454986572265625, -0.011805534362792969, -0.011156082153320312, -0.010506629943847656, -0.009857177734375, -0.009207725524902344, -0.008558273315429688, -0.007908821105957031, -0.007259368896484375, -0.006609916687011719, -0.0059604644775390625, -0.005311012268066406, -0.00466156005859375, -0.004012107849121094, -0.0033626556396484375, -0.0027132034301757812, -0.002063751220703125, -0.0014142990112304688, -0.0007648468017578125, -0.00011539459228515625, 0.0005340576171875, 0.0011835098266601562, 0.0018329620361328125, 0.0024824142456054688, 0.003131866455078125, 0.0037813186645507812, 0.0044307708740234375, 0.005080223083496094, 0.00572967529296875, 0.006379127502441406, 0.0070285797119140625, 0.007678031921386719, 0.008327484130859375, 0.008976936340332031, 0.009626388549804688, 0.010275840759277344, 0.01092529296875, 0.011574745178222656, 0.012224197387695312, 0.012873649597167969, 0.013523101806640625, 0.014172554016113281, 0.014822006225585938, 0.015471458435058594, 0.01612091064453125, 0.016770362854003906, 0.017419815063476562, 0.01806926727294922, 0.018718719482421875, 0.01936817169189453, 0.020017623901367188, 0.020667076110839844, 0.0213165283203125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 5.0, 4.0, 8.0, 8.0, 13.0, 11.0, 22.0, 30.0, 55.0, 84.0, 109.0, 167.0, 237.0, 383.0, 598.0, 929.0, 1514.0, 2777.0, 4890.0, 9556.0, 19342.0, 44536.0, 128447.0, 735094.0, 2885973.0, 235744.0, 68278.0, 27427.0, 12777.0, 6426.0, 3490.0, 2047.0, 1243.0, 689.0, 471.0, 296.0, 193.0, 139.0, 85.0, 70.0, 32.0, 29.0, 15.0, 15.0, 14.0, 4.0, 8.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.09649658203125, -0.09367656707763672, -0.09085655212402344, -0.08803653717041016, -0.08521652221679688, -0.0823965072631836, -0.07957649230957031, -0.07675647735595703, -0.07393646240234375, -0.07111644744873047, -0.06829643249511719, -0.0654764175415039, -0.06265640258789062, -0.059836387634277344, -0.05701637268066406, -0.05419635772705078, -0.0513763427734375, -0.04855632781982422, -0.04573631286621094, -0.042916297912597656, -0.040096282958984375, -0.037276268005371094, -0.03445625305175781, -0.03163623809814453, -0.02881622314453125, -0.02599620819091797, -0.023176193237304688, -0.020356178283691406, -0.017536163330078125, -0.014716148376464844, -0.011896133422851562, -0.009076118469238281, -0.006256103515625, -0.0034360885620117188, -0.0006160736083984375, 0.0022039413452148438, 0.005023956298828125, 0.007843971252441406, 0.010663986206054688, 0.013484001159667969, 0.01630401611328125, 0.01912403106689453, 0.021944046020507812, 0.024764060974121094, 0.027584075927734375, 0.030404090881347656, 0.03322410583496094, 0.03604412078857422, 0.0388641357421875, 0.04168415069580078, 0.04450416564941406, 0.047324180603027344, 0.050144195556640625, 0.052964210510253906, 0.05578422546386719, 0.05860424041748047, 0.06142425537109375, 0.06424427032470703, 0.06706428527832031, 0.0698843002319336, 0.07270431518554688, 0.07552433013916016, 0.07834434509277344, 0.08116436004638672, 0.083984375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 3.0, 10.0, 4.0, 11.0, 11.0, 16.0, 20.0, 25.0, 31.0, 44.0, 60.0, 100.0, 170.0, 296.0, 835.0, 1449.0, 369.0, 187.0, 121.0, 94.0, 53.0, 37.0, 30.0, 21.0, 12.0, 18.0, 7.0, 8.0, 6.0, 1.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.052764892578125, -0.05112457275390625, -0.0494842529296875, -0.04784393310546875, -0.04620361328125, -0.04456329345703125, -0.0429229736328125, -0.04128265380859375, -0.039642333984375, -0.03800201416015625, -0.0363616943359375, -0.03472137451171875, -0.0330810546875, -0.03144073486328125, -0.0298004150390625, -0.02816009521484375, -0.026519775390625, -0.02487945556640625, -0.0232391357421875, -0.02159881591796875, -0.01995849609375, -0.01831817626953125, -0.0166778564453125, -0.01503753662109375, -0.013397216796875, -0.01175689697265625, -0.0101165771484375, -0.00847625732421875, -0.0068359375, -0.00519561767578125, -0.0035552978515625, -0.00191497802734375, -0.000274658203125, 0.00136566162109375, 0.0030059814453125, 0.00464630126953125, 0.00628662109375, 0.00792694091796875, 0.0095672607421875, 0.01120758056640625, 0.012847900390625, 0.01448822021484375, 0.0161285400390625, 0.01776885986328125, 0.0194091796875, 0.02104949951171875, 0.0226898193359375, 0.02433013916015625, 0.025970458984375, 0.02761077880859375, 0.0292510986328125, 0.03089141845703125, 0.03253173828125, 0.03417205810546875, 0.0358123779296875, 0.03745269775390625, 0.039093017578125, 0.04073333740234375, 0.0423736572265625, 0.04401397705078125, 0.045654296875, 0.04729461669921875, 0.0489349365234375, 0.05057525634765625, 0.052215576171875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 6.0, 4.0, 10.0, 12.0, 25.0, 36.0, 32.0, 48.0, 65.0, 85.0, 98.0, 107.0, 90.0, 93.0, 76.0, 68.0, 51.0, 22.0, 20.0, 13.0, 13.0, 12.0, 7.0, 3.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34757858514785767, -0.33721330761909485, -0.32684803009033203, -0.3164827227592468, -0.306117445230484, -0.2957521677017212, -0.285386860370636, -0.27502158284187317, -0.26465630531311035, -0.25429102778434753, -0.24392573535442352, -0.2335604429244995, -0.2231951653957367, -0.21282988786697388, -0.20246459543704987, -0.19209930300712585, -0.18173402547836304, -0.17136874794960022, -0.1610034555196762, -0.1506381630897522, -0.14027288556098938, -0.12990760803222656, -0.11954231560230255, -0.10917703062295914, -0.09881174564361572, -0.08844646066427231, -0.0780811756849289, -0.06771589070558548, -0.057350605726242065, -0.04698532074689865, -0.03662003576755524, -0.026254750788211823, -0.015889465808868408, -0.005524180829524994, 0.00484110414981842, 0.015206389129161835, 0.02557167410850525, 0.03593695908784866, 0.04630224406719208, 0.05666752904653549, 0.0670328140258789, 0.07739809900522232, 0.08776338398456573, 0.09812866896390915, 0.10849395394325256, 0.11885923892259598, 0.1292245239019394, 0.1395898163318634, 0.14995509386062622, 0.16032037138938904, 0.17068566381931305, 0.18105095624923706, 0.19141623377799988, 0.2017815113067627, 0.2121468037366867, 0.22251209616661072, 0.23287737369537354, 0.24324265122413635, 0.25360792875289917, 0.2639732360839844, 0.2743385136127472, 0.28470379114151, 0.2950690984725952, 0.30543437600135803, 0.31579965353012085]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 5.0, 5.0, 8.0, 5.0, 14.0, 14.0, 13.0, 16.0, 18.0, 21.0, 21.0, 25.0, 23.0, 28.0, 43.0, 36.0, 43.0, 33.0, 48.0, 38.0, 45.0, 47.0, 46.0, 46.0, 40.0, 42.0, 38.0, 25.0, 41.0, 30.0, 23.0, 21.0, 27.0, 17.0, 11.0, 11.0, 7.0, 11.0, 9.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19329124689102173, -0.18715421855449677, -0.1810171753168106, -0.17488014698028564, -0.1687431037425995, -0.16260607540607452, -0.15646904706954956, -0.1503320038318634, -0.14419497549533844, -0.13805794715881348, -0.13192090392112732, -0.12578387558460236, -0.1196468397974968, -0.11350980401039124, -0.10737277567386627, -0.10123573988676071, -0.09509870409965515, -0.08896166831254959, -0.08282463252544403, -0.07668760418891907, -0.07055056840181351, -0.06441353261470795, -0.058276500552892685, -0.05213946849107742, -0.04600243270397186, -0.0398653969168663, -0.03372836485505104, -0.02759133093059063, -0.02145429700613022, -0.015317263081669807, -0.009180229157209396, -0.0030431970953941345, 0.0030938386917114258, 0.009230872616171837, 0.015367906540632248, 0.02150494046509266, 0.02764197438955307, 0.03377901017665863, 0.03991604223847389, 0.046053074300289154, 0.052190110087394714, 0.058327145874500275, 0.06446418166160583, 0.0706012099981308, 0.07673824578523636, 0.08287528157234192, 0.08901230990886688, 0.09514934569597244, 0.101286381483078, 0.10742341727018356, 0.11356045305728912, 0.11969748139381409, 0.12583452463150024, 0.1319715529680252, 0.13810858130455017, 0.14424562454223633, 0.1503826528787613, 0.15651968121528625, 0.1626567244529724, 0.16879375278949738, 0.17493078112602234, 0.1810678243637085, 0.18720485270023346, 0.19334188103675842, 0.19947892427444458]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 3.0, 11.0, 13.0, 21.0, 23.0, 32.0, 64.0, 55.0, 124.0, 178.0, 266.0, 336.0, 620.0, 957.0, 1557.0, 2701.0, 4777.0, 8416.0, 15406.0, 29094.0, 55342.0, 106444.0, 187080.0, 238217.0, 180998.0, 101298.0, 52842.0, 27695.0, 14829.0, 8051.0, 4467.0, 2536.0, 1538.0, 901.0, 555.0, 378.0, 241.0, 167.0, 101.0, 65.0, 50.0, 32.0, 30.0, 9.0, 8.0, 6.0, 7.0, 5.0, 4.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.051971435546875, -0.05026531219482422, -0.04855918884277344, -0.046853065490722656, -0.045146942138671875, -0.043440818786621094, -0.04173469543457031, -0.04002857208251953, -0.03832244873046875, -0.03661632537841797, -0.03491020202636719, -0.033204078674316406, -0.031497955322265625, -0.029791831970214844, -0.028085708618164062, -0.02637958526611328, -0.0246734619140625, -0.02296733856201172, -0.021261215209960938, -0.019555091857910156, -0.017848968505859375, -0.016142845153808594, -0.014436721801757812, -0.012730598449707031, -0.01102447509765625, -0.009318351745605469, -0.0076122283935546875, -0.005906105041503906, -0.004199981689453125, -0.0024938583374023438, -0.0007877349853515625, 0.0009183883666992188, 0.00262451171875, 0.004330635070800781, 0.0060367584228515625, 0.007742881774902344, 0.009449005126953125, 0.011155128479003906, 0.012861251831054688, 0.014567375183105469, 0.01627349853515625, 0.01797962188720703, 0.019685745239257812, 0.021391868591308594, 0.023097991943359375, 0.024804115295410156, 0.026510238647460938, 0.02821636199951172, 0.0299224853515625, 0.03162860870361328, 0.03333473205566406, 0.035040855407714844, 0.036746978759765625, 0.038453102111816406, 0.04015922546386719, 0.04186534881591797, 0.04357147216796875, 0.04527759552001953, 0.04698371887207031, 0.048689842224121094, 0.050395965576171875, 0.052102088928222656, 0.05380821228027344, 0.05551433563232422, 0.057220458984375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 3.0, 6.0, 15.0, 9.0, 13.0, 22.0, 13.0, 19.0, 24.0, 17.0, 34.0, 31.0, 37.0, 44.0, 44.0, 47.0, 35.0, 46.0, 43.0, 42.0, 51.0, 42.0, 49.0, 40.0, 51.0, 34.0, 25.0, 25.0, 22.0, 19.0, 15.0, 18.0, 16.0, 11.0, 16.0, 6.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0222930908203125, -0.021569252014160156, -0.020845413208007812, -0.02012157440185547, -0.019397735595703125, -0.01867389678955078, -0.017950057983398438, -0.017226219177246094, -0.01650238037109375, -0.015778541564941406, -0.015054702758789062, -0.014330863952636719, -0.013607025146484375, -0.012883186340332031, -0.012159347534179688, -0.011435508728027344, -0.010711669921875, -0.009987831115722656, -0.009263992309570312, -0.008540153503417969, -0.007816314697265625, -0.007092475891113281, -0.0063686370849609375, -0.005644798278808594, -0.00492095947265625, -0.004197120666503906, -0.0034732818603515625, -0.0027494430541992188, -0.002025604248046875, -0.0013017654418945312, -0.0005779266357421875, 0.00014591217041015625, 0.0008697509765625, 0.0015935897827148438, 0.0023174285888671875, 0.0030412673950195312, 0.003765106201171875, 0.004488945007324219, 0.0052127838134765625, 0.005936622619628906, 0.00666046142578125, 0.007384300231933594, 0.008108139038085938, 0.008831977844238281, 0.009555816650390625, 0.010279655456542969, 0.011003494262695312, 0.011727333068847656, 0.012451171875, 0.013175010681152344, 0.013898849487304688, 0.014622688293457031, 0.015346527099609375, 0.01607036590576172, 0.016794204711914062, 0.017518043518066406, 0.01824188232421875, 0.018965721130371094, 0.019689559936523438, 0.02041339874267578, 0.021137237548828125, 0.02186107635498047, 0.022584915161132812, 0.023308753967285156, 0.0240325927734375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 8.0, 5.0, 7.0, 8.0, 16.0, 17.0, 32.0, 35.0, 53.0, 114.0, 179.0, 321.0, 570.0, 1306.0, 3688.0, 14089.0, 67398.0, 371853.0, 471403.0, 91228.0, 18330.0, 4734.0, 1641.0, 695.0, 326.0, 190.0, 118.0, 72.0, 36.0, 39.0, 16.0, 12.0, 6.0, 7.0, 2.0, 6.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1307373046875, -0.1266632080078125, -0.122589111328125, -0.1185150146484375, -0.11444091796875, -0.1103668212890625, -0.106292724609375, -0.1022186279296875, -0.09814453125, -0.0940704345703125, -0.089996337890625, -0.0859222412109375, -0.08184814453125, -0.0777740478515625, -0.073699951171875, -0.0696258544921875, -0.0655517578125, -0.0614776611328125, -0.057403564453125, -0.0533294677734375, -0.04925537109375, -0.0451812744140625, -0.041107177734375, -0.0370330810546875, -0.032958984375, -0.0288848876953125, -0.024810791015625, -0.0207366943359375, -0.01666259765625, -0.0125885009765625, -0.008514404296875, -0.0044403076171875, -0.0003662109375, 0.0037078857421875, 0.007781982421875, 0.0118560791015625, 0.01593017578125, 0.0200042724609375, 0.024078369140625, 0.0281524658203125, 0.0322265625, 0.0363006591796875, 0.040374755859375, 0.0444488525390625, 0.04852294921875, 0.0525970458984375, 0.056671142578125, 0.0607452392578125, 0.0648193359375, 0.0688934326171875, 0.072967529296875, 0.0770416259765625, 0.08111572265625, 0.0851898193359375, 0.089263916015625, 0.0933380126953125, 0.097412109375, 0.1014862060546875, 0.105560302734375, 0.1096343994140625, 0.11370849609375, 0.1177825927734375, 0.121856689453125, 0.1259307861328125, 0.1300048828125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 7.0, 3.0, 7.0, 11.0, 17.0, 22.0, 18.0, 32.0, 29.0, 36.0, 35.0, 48.0, 42.0, 40.0, 46.0, 39.0, 53.0, 58.0, 52.0, 46.0, 37.0, 44.0, 43.0, 32.0, 26.0, 41.0, 22.0, 24.0, 20.0, 15.0, 15.0, 8.0, 8.0, 10.0, 5.0, 0.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1512451171875, -0.14704227447509766, -0.1428394317626953, -0.13863658905029297, -0.13443374633789062, -0.13023090362548828, -0.12602806091308594, -0.1218252182006836, -0.11762237548828125, -0.1134195327758789, -0.10921669006347656, -0.10501384735107422, -0.10081100463867188, -0.09660816192626953, -0.09240531921386719, -0.08820247650146484, -0.0839996337890625, -0.07979679107666016, -0.07559394836425781, -0.07139110565185547, -0.06718826293945312, -0.06298542022705078, -0.05878257751464844, -0.054579734802246094, -0.05037689208984375, -0.046174049377441406, -0.04197120666503906, -0.03776836395263672, -0.033565521240234375, -0.02936267852783203, -0.025159835815429688, -0.020956993103027344, -0.016754150390625, -0.012551307678222656, -0.008348464965820312, -0.004145622253417969, 5.7220458984375e-05, 0.004260063171386719, 0.008462905883789062, 0.012665748596191406, 0.01686859130859375, 0.021071434020996094, 0.025274276733398438, 0.02947711944580078, 0.033679962158203125, 0.03788280487060547, 0.04208564758300781, 0.046288490295410156, 0.0504913330078125, 0.054694175720214844, 0.05889701843261719, 0.06309986114501953, 0.06730270385742188, 0.07150554656982422, 0.07570838928222656, 0.0799112319946289, 0.08411407470703125, 0.0883169174194336, 0.09251976013183594, 0.09672260284423828, 0.10092544555664062, 0.10512828826904297, 0.10933113098144531, 0.11353397369384766, 0.11773681640625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 2.0, 6.0, 10.0, 12.0, 26.0, 40.0, 106.0, 189.0, 482.0, 1344.0, 4262.0, 18926.0, 134164.0, 658803.0, 196743.0, 25275.0, 5512.0, 1666.0, 562.0, 215.0, 103.0, 53.0, 23.0, 13.0, 10.0, 7.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07818603515625, -0.07535171508789062, -0.07251739501953125, -0.06968307495117188, -0.0668487548828125, -0.06401443481445312, -0.06118011474609375, -0.058345794677734375, -0.055511474609375, -0.052677154541015625, -0.04984283447265625, -0.047008514404296875, -0.0441741943359375, -0.041339874267578125, -0.03850555419921875, -0.035671234130859375, -0.0328369140625, -0.030002593994140625, -0.02716827392578125, -0.024333953857421875, -0.0214996337890625, -0.018665313720703125, -0.01583099365234375, -0.012996673583984375, -0.010162353515625, -0.007328033447265625, -0.00449371337890625, -0.001659393310546875, 0.0011749267578125, 0.004009246826171875, 0.00684356689453125, 0.009677886962890625, 0.01251220703125, 0.015346527099609375, 0.01818084716796875, 0.021015167236328125, 0.0238494873046875, 0.026683807373046875, 0.02951812744140625, 0.032352447509765625, 0.035186767578125, 0.038021087646484375, 0.04085540771484375, 0.043689727783203125, 0.0465240478515625, 0.049358367919921875, 0.05219268798828125, 0.055027008056640625, 0.057861328125, 0.060695648193359375, 0.06352996826171875, 0.06636428833007812, 0.0691986083984375, 0.07203292846679688, 0.07486724853515625, 0.07770156860351562, 0.080535888671875, 0.08337020874023438, 0.08620452880859375, 0.08903884887695312, 0.0918731689453125, 0.09470748901367188, 0.09754180908203125, 0.10037612915039062, 0.10321044921875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 12.0, 14.0, 7.0, 12.0, 16.0, 23.0, 23.0, 28.0, 35.0, 50.0, 47.0, 68.0, 54.0, 56.0, 71.0, 68.0, 77.0, 56.0, 38.0, 47.0, 41.0, 28.0, 21.0, 18.0, 19.0, 15.0, 14.0, 12.0, 14.0, 7.0, 3.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.9981136322021484e-05, -2.9064714908599854e-05, -2.8148293495178223e-05, -2.7231872081756592e-05, -2.631545066833496e-05, -2.539902925491333e-05, -2.44826078414917e-05, -2.356618642807007e-05, -2.2649765014648438e-05, -2.1733343601226807e-05, -2.0816922187805176e-05, -1.9900500774383545e-05, -1.8984079360961914e-05, -1.8067657947540283e-05, -1.7151236534118652e-05, -1.623481512069702e-05, -1.531839370727539e-05, -1.440197229385376e-05, -1.3485550880432129e-05, -1.2569129467010498e-05, -1.1652708053588867e-05, -1.0736286640167236e-05, -9.819865226745605e-06, -8.903443813323975e-06, -7.987022399902344e-06, -7.070600986480713e-06, -6.154179573059082e-06, -5.237758159637451e-06, -4.32133674621582e-06, -3.4049153327941895e-06, -2.4884939193725586e-06, -1.5720725059509277e-06, -6.556510925292969e-07, 2.60770320892334e-07, 1.1771917343139648e-06, 2.0936131477355957e-06, 3.0100345611572266e-06, 3.926455974578857e-06, 4.842877388000488e-06, 5.759298801422119e-06, 6.67572021484375e-06, 7.592141628265381e-06, 8.508563041687012e-06, 9.424984455108643e-06, 1.0341405868530273e-05, 1.1257827281951904e-05, 1.2174248695373535e-05, 1.3090670108795166e-05, 1.4007091522216797e-05, 1.4923512935638428e-05, 1.583993434906006e-05, 1.675635576248169e-05, 1.767277717590332e-05, 1.858919858932495e-05, 1.9505620002746582e-05, 2.0422041416168213e-05, 2.1338462829589844e-05, 2.2254884243011475e-05, 2.3171305656433105e-05, 2.4087727069854736e-05, 2.5004148483276367e-05, 2.5920569896697998e-05, 2.683699131011963e-05, 2.775341272354126e-05, 2.866983413696289e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 5.0, 8.0, 21.0, 18.0, 23.0, 40.0, 56.0, 97.0, 124.0, 181.0, 304.0, 492.0, 952.0, 1949.0, 4039.0, 8983.0, 23889.0, 74084.0, 245071.0, 416149.0, 184057.0, 55253.0, 18364.0, 7284.0, 3443.0, 1598.0, 791.0, 483.0, 270.0, 174.0, 106.0, 85.0, 49.0, 37.0, 28.0, 16.0, 10.0, 4.0, 7.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.04931640625, -0.04769277572631836, -0.04606914520263672, -0.04444551467895508, -0.04282188415527344, -0.0411982536315918, -0.039574623107910156, -0.037950992584228516, -0.036327362060546875, -0.034703731536865234, -0.033080101013183594, -0.03145647048950195, -0.029832839965820312, -0.028209209442138672, -0.02658557891845703, -0.02496194839477539, -0.02333831787109375, -0.02171468734741211, -0.02009105682373047, -0.018467426300048828, -0.016843795776367188, -0.015220165252685547, -0.013596534729003906, -0.011972904205322266, -0.010349273681640625, -0.008725643157958984, -0.007102012634277344, -0.005478382110595703, -0.0038547515869140625, -0.002231121063232422, -0.0006074905395507812, 0.0010161399841308594, 0.0026397705078125, 0.004263401031494141, 0.005887031555175781, 0.007510662078857422, 0.009134292602539062, 0.010757923126220703, 0.012381553649902344, 0.014005184173583984, 0.015628814697265625, 0.017252445220947266, 0.018876075744628906, 0.020499706268310547, 0.022123336791992188, 0.023746967315673828, 0.02537059783935547, 0.02699422836303711, 0.02861785888671875, 0.03024148941040039, 0.03186511993408203, 0.03348875045776367, 0.03511238098144531, 0.03673601150512695, 0.038359642028808594, 0.039983272552490234, 0.041606903076171875, 0.043230533599853516, 0.044854164123535156, 0.0464777946472168, 0.04810142517089844, 0.04972505569458008, 0.05134868621826172, 0.05297231674194336, 0.054595947265625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 9.0, 6.0, 6.0, 9.0, 15.0, 11.0, 17.0, 17.0, 26.0, 28.0, 36.0, 48.0, 57.0, 59.0, 69.0, 86.0, 64.0, 57.0, 54.0, 59.0, 38.0, 39.0, 35.0, 30.0, 21.0, 18.0, 13.0, 15.0, 17.0, 9.0, 6.0, 5.0, 5.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.046783447265625, -0.045366764068603516, -0.04395008087158203, -0.04253339767456055, -0.04111671447753906, -0.03970003128051758, -0.038283348083496094, -0.03686666488647461, -0.035449981689453125, -0.03403329849243164, -0.032616615295410156, -0.031199932098388672, -0.029783248901367188, -0.028366565704345703, -0.02694988250732422, -0.025533199310302734, -0.02411651611328125, -0.022699832916259766, -0.02128314971923828, -0.019866466522216797, -0.018449783325195312, -0.017033100128173828, -0.015616416931152344, -0.01419973373413086, -0.012783050537109375, -0.01136636734008789, -0.009949684143066406, -0.008533000946044922, -0.0071163177490234375, -0.005699634552001953, -0.004282951354980469, -0.0028662681579589844, -0.0014495849609375, -3.2901763916015625e-05, 0.0013837814331054688, 0.002800464630126953, 0.0042171478271484375, 0.005633831024169922, 0.007050514221191406, 0.00846719741821289, 0.009883880615234375, 0.01130056381225586, 0.012717247009277344, 0.014133930206298828, 0.015550613403320312, 0.016967296600341797, 0.01838397979736328, 0.019800662994384766, 0.02121734619140625, 0.022634029388427734, 0.02405071258544922, 0.025467395782470703, 0.026884078979492188, 0.028300762176513672, 0.029717445373535156, 0.03113412857055664, 0.032550811767578125, 0.03396749496459961, 0.035384178161621094, 0.03680086135864258, 0.03821754455566406, 0.03963422775268555, 0.04105091094970703, 0.042467594146728516, 0.04388427734375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 8.0, 9.0, 11.0, 21.0, 30.0, 41.0, 70.0, 87.0, 122.0, 131.0, 127.0, 109.0, 76.0, 61.0, 30.0, 26.0, 13.0, 12.0, 5.0, 6.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6081541776657104, -0.5803227424621582, -0.552491307258606, -0.5246598720550537, -0.49682846665382385, -0.4689970314502716, -0.44116559624671936, -0.4133341908454895, -0.38550275564193726, -0.357671320438385, -0.32983988523483276, -0.3020084500312805, -0.27417704463005066, -0.2463456094264984, -0.21851417422294617, -0.19068275392055511, -0.16285130381584167, -0.13501986861228943, -0.10718844830989838, -0.07935701310634613, -0.05152558535337448, -0.023694157600402832, 0.004137277603149414, 0.031968697905540466, 0.05980013310909271, 0.08763156086206436, 0.11546298861503601, 0.14329442381858826, 0.1711258590221405, 0.19895727932453156, 0.2267887145280838, 0.25462013483047485, 0.2824515700340271, 0.31028300523757935, 0.3381144404411316, 0.36594587564468384, 0.3937772810459137, 0.42160871624946594, 0.4494401514530182, 0.47727155685424805, 0.5051029920578003, 0.5329344272613525, 0.5607658624649048, 0.588597297668457, 0.6164287328720093, 0.6442601680755615, 0.6720916032791138, 0.6999229788780212, 0.7277544736862183, 0.7555859088897705, 0.7834173440933228, 0.811248779296875, 0.8390802145004272, 0.8669116497039795, 0.8947430849075317, 0.9225744605064392, 0.9504058957099915, 0.9782373309135437, 1.0060687065124512, 1.0339001417160034, 1.0617315769195557, 1.089563012123108, 1.1173944473266602, 1.1452258825302124, 1.1730573177337646]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 8.0, 10.0, 11.0, 6.0, 12.0, 8.0, 19.0, 23.0, 18.0, 18.0, 26.0, 19.0, 39.0, 29.0, 31.0, 29.0, 33.0, 46.0, 42.0, 44.0, 51.0, 50.0, 50.0, 29.0, 39.0, 37.0, 38.0, 35.0, 34.0, 30.0, 26.0, 24.0, 8.0, 16.0, 6.0, 13.0, 6.0, 9.0, 10.0, 7.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5535398125648499, -0.5352002382278442, -0.5168606638908386, -0.4985211193561554, -0.48018157482147217, -0.46184200048446655, -0.44350242614746094, -0.4251628816127777, -0.4068233370780945, -0.38848376274108887, -0.37014421820640564, -0.3518046438694, -0.3334650993347168, -0.3151255249977112, -0.29678595066070557, -0.27844640612602234, -0.2601068317890167, -0.2417672723531723, -0.22342771291732788, -0.20508813858032227, -0.18674859404563904, -0.16840901970863342, -0.150069460272789, -0.13172990083694458, -0.11339034140110016, -0.09505078196525574, -0.07671122252941132, -0.0583716556429863, -0.040032096207141876, -0.021692536771297455, -0.0033529698848724365, 0.014986589550971985, 0.033326148986816406, 0.05166570842266083, 0.07000526785850525, 0.08834483474493027, 0.10668439418077469, 0.1250239610671997, 0.14336352050304413, 0.16170307993888855, 0.18004263937473297, 0.1983821988105774, 0.21672175824642181, 0.23506131768226624, 0.25340089201927185, 0.2717404365539551, 0.2900800108909607, 0.3084195852279663, 0.32675912976264954, 0.34509870409965515, 0.3634382486343384, 0.381777822971344, 0.4001173675060272, 0.41845694184303284, 0.43679648637771606, 0.4551360607147217, 0.4734756350517273, 0.4918152093887329, 0.5101547837257385, 0.5284942984580994, 0.546833872795105, 0.5651734471321106, 0.5835130214691162, 0.601852536201477, 0.6201921105384827]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 3.0, 7.0, 7.0, 4.0, 8.0, 10.0, 11.0, 25.0, 23.0, 38.0, 37.0, 46.0, 59.0, 74.0, 111.0, 164.0, 212.0, 376.0, 455.0, 772.0, 1373.0, 2770.0, 7238.0, 32811.0, 4052784.0, 75945.0, 10715.0, 3601.0, 1727.0, 955.0, 600.0, 391.0, 253.0, 173.0, 123.0, 89.0, 74.0, 34.0, 34.0, 36.0, 29.0, 12.0, 7.0, 15.0, 10.0, 13.0, 7.0, 8.0, 3.0, 6.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.2086181640625, -0.20223236083984375, -0.1958465576171875, -0.18946075439453125, -0.183074951171875, -0.17668914794921875, -0.1703033447265625, -0.16391754150390625, -0.15753173828125, -0.15114593505859375, -0.1447601318359375, -0.13837432861328125, -0.131988525390625, -0.12560272216796875, -0.1192169189453125, -0.11283111572265625, -0.1064453125, -0.10005950927734375, -0.0936737060546875, -0.08728790283203125, -0.080902099609375, -0.07451629638671875, -0.0681304931640625, -0.06174468994140625, -0.05535888671875, -0.04897308349609375, -0.0425872802734375, -0.03620147705078125, -0.029815673828125, -0.02342987060546875, -0.0170440673828125, -0.01065826416015625, -0.0042724609375, 0.00211334228515625, 0.0084991455078125, 0.01488494873046875, 0.021270751953125, 0.02765655517578125, 0.0340423583984375, 0.04042816162109375, 0.04681396484375, 0.05319976806640625, 0.0595855712890625, 0.06597137451171875, 0.072357177734375, 0.07874298095703125, 0.0851287841796875, 0.09151458740234375, 0.097900390625, 0.10428619384765625, 0.1106719970703125, 0.11705780029296875, 0.123443603515625, 0.12982940673828125, 0.1362152099609375, 0.14260101318359375, 0.14898681640625, 0.15537261962890625, 0.1617584228515625, 0.16814422607421875, 0.174530029296875, 0.18091583251953125, 0.1873016357421875, 0.19368743896484375, 0.2000732421875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 2.0, 7.0, 1.0, 8.0, 14.0, 10.0, 6.0, 13.0, 17.0, 17.0, 22.0, 13.0, 27.0, 29.0, 32.0, 34.0, 37.0, 40.0, 42.0, 32.0, 44.0, 38.0, 40.0, 38.0, 43.0, 35.0, 39.0, 31.0, 36.0, 38.0, 32.0, 34.0, 21.0, 17.0, 25.0, 10.0, 11.0, 13.0, 11.0, 8.0, 2.0, 14.0, 5.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.022979736328125, -0.022265195846557617, -0.021550655364990234, -0.02083611488342285, -0.02012157440185547, -0.019407033920288086, -0.018692493438720703, -0.01797795295715332, -0.017263412475585938, -0.016548871994018555, -0.015834331512451172, -0.015119791030883789, -0.014405250549316406, -0.013690710067749023, -0.01297616958618164, -0.012261629104614258, -0.011547088623046875, -0.010832548141479492, -0.01011800765991211, -0.009403467178344727, -0.008688926696777344, -0.007974386215209961, -0.007259845733642578, -0.006545305252075195, -0.0058307647705078125, -0.00511622428894043, -0.004401683807373047, -0.003687143325805664, -0.0029726028442382812, -0.0022580623626708984, -0.0015435218811035156, -0.0008289813995361328, -0.00011444091796875, 0.0006000995635986328, 0.0013146400451660156, 0.0020291805267333984, 0.0027437210083007812, 0.003458261489868164, 0.004172801971435547, 0.00488734245300293, 0.0056018829345703125, 0.006316423416137695, 0.007030963897705078, 0.007745504379272461, 0.008460044860839844, 0.009174585342407227, 0.00988912582397461, 0.010603666305541992, 0.011318206787109375, 0.012032747268676758, 0.01274728775024414, 0.013461828231811523, 0.014176368713378906, 0.014890909194946289, 0.015605449676513672, 0.016319990158081055, 0.017034530639648438, 0.01774907112121582, 0.018463611602783203, 0.019178152084350586, 0.01989269256591797, 0.02060723304748535, 0.021321773529052734, 0.022036314010620117, 0.0227508544921875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 1.0, 4.0, 2.0, 9.0, 5.0, 10.0, 13.0, 11.0, 26.0, 35.0, 51.0, 57.0, 83.0, 112.0, 152.0, 209.0, 320.0, 501.0, 763.0, 1225.0, 2353.0, 5280.0, 15446.0, 130337.0, 3982670.0, 37652.0, 8778.0, 3605.0, 1799.0, 882.0, 630.0, 354.0, 255.0, 193.0, 132.0, 82.0, 62.0, 45.0, 48.0, 30.0, 15.0, 15.0, 11.0, 6.0, 7.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.25244140625, -0.2452831268310547, -0.23812484741210938, -0.23096656799316406, -0.22380828857421875, -0.21665000915527344, -0.20949172973632812, -0.2023334503173828, -0.1951751708984375, -0.1880168914794922, -0.18085861206054688, -0.17370033264160156, -0.16654205322265625, -0.15938377380371094, -0.15222549438476562, -0.1450672149658203, -0.137908935546875, -0.1307506561279297, -0.12359237670898438, -0.11643409729003906, -0.10927581787109375, -0.10211753845214844, -0.09495925903320312, -0.08780097961425781, -0.0806427001953125, -0.07348442077636719, -0.06632614135742188, -0.05916786193847656, -0.05200958251953125, -0.04485130310058594, -0.037693023681640625, -0.030534744262695312, -0.02337646484375, -0.016218185424804688, -0.009059906005859375, -0.0019016265869140625, 0.00525665283203125, 0.012414932250976562, 0.019573211669921875, 0.026731491088867188, 0.0338897705078125, 0.04104804992675781, 0.048206329345703125, 0.05536460876464844, 0.06252288818359375, 0.06968116760253906, 0.07683944702148438, 0.08399772644042969, 0.091156005859375, 0.09831428527832031, 0.10547256469726562, 0.11263084411621094, 0.11978912353515625, 0.12694740295410156, 0.13410568237304688, 0.1412639617919922, 0.1484222412109375, 0.1555805206298828, 0.16273880004882812, 0.16989707946777344, 0.17705535888671875, 0.18421363830566406, 0.19137191772460938, 0.1985301971435547, 0.2056884765625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 2.0, 5.0, 0.0, 12.0, 9.0, 14.0, 34.0, 81.0, 463.0, 3227.0, 123.0, 47.0, 24.0, 10.0, 4.0, 6.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049774169921875, -0.04822492599487305, -0.046675682067871094, -0.04512643814086914, -0.04357719421386719, -0.042027950286865234, -0.04047870635986328, -0.03892946243286133, -0.037380218505859375, -0.03583097457885742, -0.03428173065185547, -0.032732486724853516, -0.031183242797851562, -0.02963399887084961, -0.028084754943847656, -0.026535511016845703, -0.02498626708984375, -0.023437023162841797, -0.021887779235839844, -0.02033853530883789, -0.018789291381835938, -0.017240047454833984, -0.01569080352783203, -0.014141559600830078, -0.012592315673828125, -0.011043071746826172, -0.009493827819824219, -0.007944583892822266, -0.0063953399658203125, -0.004846096038818359, -0.0032968521118164062, -0.0017476081848144531, -0.0001983642578125, 0.0013508796691894531, 0.0029001235961914062, 0.004449367523193359, 0.0059986114501953125, 0.007547855377197266, 0.009097099304199219, 0.010646343231201172, 0.012195587158203125, 0.013744831085205078, 0.015294075012207031, 0.016843318939208984, 0.018392562866210938, 0.01994180679321289, 0.021491050720214844, 0.023040294647216797, 0.02458953857421875, 0.026138782501220703, 0.027688026428222656, 0.02923727035522461, 0.030786514282226562, 0.032335758209228516, 0.03388500213623047, 0.03543424606323242, 0.036983489990234375, 0.03853273391723633, 0.04008197784423828, 0.041631221771240234, 0.04318046569824219, 0.04472970962524414, 0.046278953552246094, 0.04782819747924805, 0.04937744140625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 1.0, 4.0, 4.0, 13.0, 9.0, 12.0, 19.0, 36.0, 38.0, 69.0, 87.0, 101.0, 118.0, 110.0, 109.0, 71.0, 60.0, 59.0, 27.0, 22.0, 15.0, 8.0, 3.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14739945530891418, -0.14217491447925568, -0.13695037364959717, -0.13172583281993866, -0.12650129199028015, -0.12127675861120224, -0.11605222523212433, -0.11082768440246582, -0.10560314357280731, -0.1003786027431488, -0.0951540619134903, -0.08992952853441238, -0.08470498770475388, -0.07948044687509537, -0.07425591349601746, -0.06903137266635895, -0.06380683183670044, -0.05858229100704193, -0.05335775390267372, -0.04813321679830551, -0.042908675968647, -0.037684135138988495, -0.032459598034620285, -0.027235060930252075, -0.022010520100593567, -0.016785981133580208, -0.011561442166566849, -0.00633690319955349, -0.0011123642325401306, 0.0041121747344732285, 0.009336713701486588, 0.014561250805854797, 0.019785791635513306, 0.025010330602526665, 0.030234869569540024, 0.035459406673908234, 0.04068394750356674, 0.04590848833322525, 0.05113302543759346, 0.05635756254196167, 0.06158210337162018, 0.06680664420127869, 0.0720311850309372, 0.0772557184100151, 0.08248025923967361, 0.08770480006933212, 0.09292933344841003, 0.09815387427806854, 0.10337841510772705, 0.10860295593738556, 0.11382749676704407, 0.11905203014612198, 0.12427657097578049, 0.1295011043548584, 0.1347256451845169, 0.13995018601417542, 0.14517472684383392, 0.15039926767349243, 0.15562380850315094, 0.16084834933280945, 0.16607287526130676, 0.17129741609096527, 0.17652195692062378, 0.1817464977502823, 0.1869710385799408]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 6.0, 10.0, 6.0, 5.0, 4.0, 13.0, 15.0, 24.0, 13.0, 23.0, 28.0, 18.0, 26.0, 31.0, 47.0, 43.0, 44.0, 47.0, 50.0, 59.0, 53.0, 49.0, 35.0, 36.0, 52.0, 34.0, 34.0, 26.0, 33.0, 26.0, 26.0, 18.0, 14.0, 11.0, 9.0, 14.0, 10.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.08530747890472412, -0.08259212970733643, -0.07987678050994873, -0.07716142386198044, -0.07444607466459274, -0.07173072546720505, -0.06901536881923676, -0.06630001962184906, -0.06358467042446136, -0.06086932122707367, -0.058153968304395676, -0.05543861538171768, -0.05272326618432999, -0.05000791698694229, -0.0472925640642643, -0.044577211141586304, -0.04186186194419861, -0.03914651274681091, -0.03643115982413292, -0.033715806901454926, -0.03100045770406723, -0.028285106644034386, -0.02556975558400154, -0.022854404523968697, -0.020139053463935852, -0.017423702403903008, -0.014708351343870163, -0.011993000283837318, -0.009277649223804474, -0.006562298163771629, -0.003846947103738785, -0.0011315960437059402, 0.0015837550163269043, 0.004299106076359749, 0.007014457136392593, 0.009729808196425438, 0.012445159256458282, 0.015160510316491127, 0.01787586137652397, 0.020591212436556816, 0.02330656349658966, 0.026021914556622505, 0.02873726561665535, 0.031452618539333344, 0.03416796773672104, 0.036883316934108734, 0.03959866985678673, 0.04231402277946472, 0.04502937197685242, 0.04774472117424011, 0.050460074096918106, 0.0531754270195961, 0.055890776216983795, 0.05860612541437149, 0.061321478337049484, 0.06403683125972748, 0.06675218045711517, 0.06946752965450287, 0.07218287885189056, 0.07489823549985886, 0.07761358469724655, 0.08032893389463425, 0.08304429054260254, 0.08575963973999023, 0.08847498893737793]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 9.0, 11.0, 15.0, 26.0, 37.0, 45.0, 67.0, 102.0, 130.0, 252.0, 356.0, 521.0, 901.0, 1495.0, 2569.0, 4578.0, 8540.0, 16754.0, 34574.0, 71812.0, 147712.0, 249193.0, 239987.0, 137511.0, 66006.0, 31437.0, 15572.0, 7879.0, 4211.0, 2433.0, 1419.0, 868.0, 555.0, 328.0, 212.0, 142.0, 87.0, 66.0, 42.0, 26.0, 20.0, 20.0, 13.0, 3.0, 9.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052032470703125, -0.0501704216003418, -0.048308372497558594, -0.04644632339477539, -0.04458427429199219, -0.042722225189208984, -0.04086017608642578, -0.03899812698364258, -0.037136077880859375, -0.03527402877807617, -0.03341197967529297, -0.031549930572509766, -0.029687881469726562, -0.02782583236694336, -0.025963783264160156, -0.024101734161376953, -0.02223968505859375, -0.020377635955810547, -0.018515586853027344, -0.01665353775024414, -0.014791488647460938, -0.012929439544677734, -0.011067390441894531, -0.009205341339111328, -0.007343292236328125, -0.005481243133544922, -0.0036191940307617188, -0.0017571449279785156, 0.0001049041748046875, 0.0019669532775878906, 0.0038290023803710938, 0.005691051483154297, 0.0075531005859375, 0.009415149688720703, 0.011277198791503906, 0.01313924789428711, 0.015001296997070312, 0.016863346099853516, 0.01872539520263672, 0.020587444305419922, 0.022449493408203125, 0.024311542510986328, 0.02617359161376953, 0.028035640716552734, 0.029897689819335938, 0.03175973892211914, 0.033621788024902344, 0.03548383712768555, 0.03734588623046875, 0.03920793533325195, 0.041069984436035156, 0.04293203353881836, 0.04479408264160156, 0.046656131744384766, 0.04851818084716797, 0.05038022994995117, 0.052242279052734375, 0.05410432815551758, 0.05596637725830078, 0.057828426361083984, 0.05969047546386719, 0.06155252456665039, 0.0634145736694336, 0.0652766227722168, 0.067138671875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 0.0, 6.0, 11.0, 8.0, 6.0, 17.0, 16.0, 13.0, 25.0, 18.0, 21.0, 28.0, 20.0, 30.0, 34.0, 36.0, 38.0, 36.0, 38.0, 44.0, 46.0, 44.0, 53.0, 46.0, 42.0, 38.0, 44.0, 33.0, 27.0, 31.0, 32.0, 18.0, 24.0, 18.0, 15.0, 6.0, 7.0, 12.0, 5.0, 9.0, 6.0, 4.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.021697998046875, -0.020832061767578125, -0.01996612548828125, -0.019100189208984375, -0.0182342529296875, -0.017368316650390625, -0.01650238037109375, -0.015636444091796875, -0.0147705078125, -0.013904571533203125, -0.01303863525390625, -0.012172698974609375, -0.0113067626953125, -0.010440826416015625, -0.00957489013671875, -0.008708953857421875, -0.007843017578125, -0.006977081298828125, -0.00611114501953125, -0.005245208740234375, -0.0043792724609375, -0.003513336181640625, -0.00264739990234375, -0.001781463623046875, -0.00091552734375, -4.9591064453125e-05, 0.00081634521484375, 0.001682281494140625, 0.0025482177734375, 0.003414154052734375, 0.00428009033203125, 0.005146026611328125, 0.006011962890625, 0.006877899169921875, 0.00774383544921875, 0.008609771728515625, 0.0094757080078125, 0.010341644287109375, 0.01120758056640625, 0.012073516845703125, 0.012939453125, 0.013805389404296875, 0.01467132568359375, 0.015537261962890625, 0.0164031982421875, 0.017269134521484375, 0.01813507080078125, 0.019001007080078125, 0.019866943359375, 0.020732879638671875, 0.02159881591796875, 0.022464752197265625, 0.0233306884765625, 0.024196624755859375, 0.02506256103515625, 0.025928497314453125, 0.02679443359375, 0.027660369873046875, 0.02852630615234375, 0.029392242431640625, 0.0302581787109375, 0.031124114990234375, 0.03199005126953125, 0.032855987548828125, 0.033721923828125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 16.0, 8.0, 17.0, 26.0, 46.0, 87.0, 97.0, 175.0, 325.0, 559.0, 1076.0, 2345.0, 6668.0, 24314.0, 124864.0, 585610.0, 243485.0, 42056.0, 10336.0, 3379.0, 1413.0, 718.0, 363.0, 215.0, 126.0, 94.0, 50.0, 30.0, 19.0, 20.0, 8.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.15283203125, -0.14877605438232422, -0.14472007751464844, -0.14066410064697266, -0.13660812377929688, -0.1325521469116211, -0.1284961700439453, -0.12444019317626953, -0.12038421630859375, -0.11632823944091797, -0.11227226257324219, -0.1082162857055664, -0.10416030883789062, -0.10010433197021484, -0.09604835510253906, -0.09199237823486328, -0.0879364013671875, -0.08388042449951172, -0.07982444763183594, -0.07576847076416016, -0.07171249389648438, -0.0676565170288086, -0.06360054016113281, -0.05954456329345703, -0.05548858642578125, -0.05143260955810547, -0.04737663269042969, -0.043320655822753906, -0.039264678955078125, -0.035208702087402344, -0.031152725219726562, -0.02709674835205078, -0.023040771484375, -0.01898479461669922, -0.014928817749023438, -0.010872840881347656, -0.006816864013671875, -0.0027608871459960938, 0.0012950897216796875, 0.005351066589355469, 0.00940704345703125, 0.013463020324707031, 0.017518997192382812, 0.021574974060058594, 0.025630950927734375, 0.029686927795410156, 0.03374290466308594, 0.03779888153076172, 0.0418548583984375, 0.04591083526611328, 0.04996681213378906, 0.054022789001464844, 0.058078765869140625, 0.062134742736816406, 0.06619071960449219, 0.07024669647216797, 0.07430267333984375, 0.07835865020751953, 0.08241462707519531, 0.0864706039428711, 0.09052658081054688, 0.09458255767822266, 0.09863853454589844, 0.10269451141357422, 0.10675048828125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 6.0, 2.0, 6.0, 7.0, 8.0, 10.0, 9.0, 10.0, 10.0, 21.0, 17.0, 22.0, 18.0, 35.0, 33.0, 31.0, 39.0, 31.0, 41.0, 44.0, 51.0, 43.0, 39.0, 48.0, 38.0, 43.0, 33.0, 41.0, 30.0, 30.0, 30.0, 31.0, 19.0, 25.0, 16.0, 13.0, 15.0, 11.0, 8.0, 10.0, 5.0, 7.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.1290283203125, -0.12491607666015625, -0.1208038330078125, -0.11669158935546875, -0.112579345703125, -0.10846710205078125, -0.1043548583984375, -0.10024261474609375, -0.09613037109375, -0.09201812744140625, -0.0879058837890625, -0.08379364013671875, -0.079681396484375, -0.07556915283203125, -0.0714569091796875, -0.06734466552734375, -0.063232421875, -0.05912017822265625, -0.0550079345703125, -0.05089569091796875, -0.046783447265625, -0.04267120361328125, -0.0385589599609375, -0.03444671630859375, -0.03033447265625, -0.02622222900390625, -0.0221099853515625, -0.01799774169921875, -0.013885498046875, -0.00977325439453125, -0.0056610107421875, -0.00154876708984375, 0.0025634765625, 0.00667572021484375, 0.0107879638671875, 0.01490020751953125, 0.019012451171875, 0.02312469482421875, 0.0272369384765625, 0.03134918212890625, 0.03546142578125, 0.03957366943359375, 0.0436859130859375, 0.04779815673828125, 0.051910400390625, 0.05602264404296875, 0.0601348876953125, 0.06424713134765625, 0.068359375, 0.07247161865234375, 0.0765838623046875, 0.08069610595703125, 0.084808349609375, 0.08892059326171875, 0.0930328369140625, 0.09714508056640625, 0.10125732421875, 0.10536956787109375, 0.1094818115234375, 0.11359405517578125, 0.117706298828125, 0.12181854248046875, 0.1259307861328125, 0.13004302978515625, 0.1341552734375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 5.0, 4.0, 4.0, 26.0, 28.0, 40.0, 62.0, 91.0, 231.0, 525.0, 1617.0, 6515.0, 116863.0, 898852.0, 18976.0, 3064.0, 950.0, 320.0, 145.0, 92.0, 48.0, 22.0, 29.0, 12.0, 7.0, 10.0, 7.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.29150390625, -0.28426170349121094, -0.2770195007324219, -0.2697772979736328, -0.26253509521484375, -0.2552928924560547, -0.24805068969726562, -0.24080848693847656, -0.2335662841796875, -0.22632408142089844, -0.21908187866210938, -0.2118396759033203, -0.20459747314453125, -0.1973552703857422, -0.19011306762695312, -0.18287086486816406, -0.175628662109375, -0.16838645935058594, -0.16114425659179688, -0.1539020538330078, -0.14665985107421875, -0.1394176483154297, -0.13217544555664062, -0.12493324279785156, -0.1176910400390625, -0.11044883728027344, -0.10320663452148438, -0.09596443176269531, -0.08872222900390625, -0.08148002624511719, -0.07423782348632812, -0.06699562072753906, -0.05975341796875, -0.05251121520996094, -0.045269012451171875, -0.03802680969238281, -0.03078460693359375, -0.023542404174804688, -0.016300201416015625, -0.009057998657226562, -0.0018157958984375, 0.0054264068603515625, 0.012668609619140625, 0.019910812377929688, 0.02715301513671875, 0.03439521789550781, 0.041637420654296875, 0.04887962341308594, 0.056121826171875, 0.06336402893066406, 0.07060623168945312, 0.07784843444824219, 0.08509063720703125, 0.09233283996582031, 0.09957504272460938, 0.10681724548339844, 0.1140594482421875, 0.12130165100097656, 0.12854385375976562, 0.1357860565185547, 0.14302825927734375, 0.1502704620361328, 0.15751266479492188, 0.16475486755371094, 0.1719970703125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 7.0, 11.0, 12.0, 24.0, 33.0, 56.0, 57.0, 72.0, 101.0, 122.0, 109.0, 94.0, 75.0, 56.0, 48.0, 47.0, 27.0, 22.0, 10.0, 7.0, 5.0, 3.0, 5.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-5.835294723510742e-05, -5.705840885639191e-05, -5.576387047767639e-05, -5.4469332098960876e-05, -5.317479372024536e-05, -5.1880255341529846e-05, -5.058571696281433e-05, -4.9291178584098816e-05, -4.79966402053833e-05, -4.6702101826667786e-05, -4.540756344795227e-05, -4.4113025069236755e-05, -4.281848669052124e-05, -4.1523948311805725e-05, -4.022940993309021e-05, -3.8934871554374695e-05, -3.764033317565918e-05, -3.6345794796943665e-05, -3.505125641822815e-05, -3.3756718039512634e-05, -3.246217966079712e-05, -3.1167641282081604e-05, -2.987310290336609e-05, -2.8578564524650574e-05, -2.728402614593506e-05, -2.5989487767219543e-05, -2.469494938850403e-05, -2.3400411009788513e-05, -2.2105872631072998e-05, -2.0811334252357483e-05, -1.9516795873641968e-05, -1.8222257494926453e-05, -1.6927719116210938e-05, -1.5633180737495422e-05, -1.4338642358779907e-05, -1.3044103980064392e-05, -1.1749565601348877e-05, -1.0455027222633362e-05, -9.160488843917847e-06, -7.865950465202332e-06, -6.571412086486816e-06, -5.276873707771301e-06, -3.982335329055786e-06, -2.687796950340271e-06, -1.3932585716247559e-06, -9.872019290924072e-08, 1.1958181858062744e-06, 2.4903565645217896e-06, 3.7848949432373047e-06, 5.07943332195282e-06, 6.373971700668335e-06, 7.66851007938385e-06, 8.963048458099365e-06, 1.025758683681488e-05, 1.1552125215530396e-05, 1.284666359424591e-05, 1.4141201972961426e-05, 1.543574035167694e-05, 1.6730278730392456e-05, 1.802481710910797e-05, 1.9319355487823486e-05, 2.0613893866539e-05, 2.1908432245254517e-05, 2.3202970623970032e-05, 2.4497509002685547e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 4.0, 7.0, 4.0, 12.0, 17.0, 28.0, 25.0, 52.0, 73.0, 101.0, 153.0, 280.0, 398.0, 742.0, 1358.0, 2971.0, 8143.0, 35933.0, 418088.0, 521092.0, 43359.0, 8981.0, 3221.0, 1498.0, 789.0, 464.0, 256.0, 183.0, 93.0, 61.0, 51.0, 38.0, 32.0, 18.0, 7.0, 6.0, 4.0, 4.0, 1.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1060791015625, -0.1027688980102539, -0.09945869445800781, -0.09614849090576172, -0.09283828735351562, -0.08952808380126953, -0.08621788024902344, -0.08290767669677734, -0.07959747314453125, -0.07628726959228516, -0.07297706604003906, -0.06966686248779297, -0.06635665893554688, -0.06304645538330078, -0.05973625183105469, -0.056426048278808594, -0.0531158447265625, -0.049805641174316406, -0.04649543762207031, -0.04318523406982422, -0.039875030517578125, -0.03656482696533203, -0.03325462341308594, -0.029944419860839844, -0.02663421630859375, -0.023324012756347656, -0.020013809204101562, -0.01670360565185547, -0.013393402099609375, -0.010083198547363281, -0.0067729949951171875, -0.0034627914428710938, -0.000152587890625, 0.0031576156616210938, 0.0064678192138671875, 0.009778022766113281, 0.013088226318359375, 0.01639842987060547, 0.019708633422851562, 0.023018836975097656, 0.02632904052734375, 0.029639244079589844, 0.03294944763183594, 0.03625965118408203, 0.039569854736328125, 0.04288005828857422, 0.04619026184082031, 0.049500465393066406, 0.0528106689453125, 0.056120872497558594, 0.05943107604980469, 0.06274127960205078, 0.06605148315429688, 0.06936168670654297, 0.07267189025878906, 0.07598209381103516, 0.07929229736328125, 0.08260250091552734, 0.08591270446777344, 0.08922290802001953, 0.09253311157226562, 0.09584331512451172, 0.09915351867675781, 0.1024637222290039, 0.10577392578125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 0.0, 2.0, 3.0, 5.0, 9.0, 8.0, 13.0, 5.0, 17.0, 27.0, 26.0, 41.0, 45.0, 66.0, 90.0, 78.0, 84.0, 106.0, 89.0, 67.0, 48.0, 35.0, 33.0, 25.0, 19.0, 15.0, 17.0, 12.0, 5.0, 3.0, 1.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06634521484375, -0.06403923034667969, -0.061733245849609375, -0.05942726135253906, -0.05712127685546875, -0.05481529235839844, -0.052509307861328125, -0.05020332336425781, -0.0478973388671875, -0.04559135437011719, -0.043285369873046875, -0.04097938537597656, -0.03867340087890625, -0.03636741638183594, -0.034061431884765625, -0.03175544738769531, -0.029449462890625, -0.027143478393554688, -0.024837493896484375, -0.022531509399414062, -0.02022552490234375, -0.017919540405273438, -0.015613555908203125, -0.013307571411132812, -0.0110015869140625, -0.008695602416992188, -0.006389617919921875, -0.0040836334228515625, -0.00177764892578125, 0.0005283355712890625, 0.002834320068359375, 0.0051403045654296875, 0.0074462890625, 0.009752273559570312, 0.012058258056640625, 0.014364242553710938, 0.01667022705078125, 0.018976211547851562, 0.021282196044921875, 0.023588180541992188, 0.0258941650390625, 0.028200149536132812, 0.030506134033203125, 0.03281211853027344, 0.03511810302734375, 0.03742408752441406, 0.039730072021484375, 0.04203605651855469, 0.044342041015625, 0.04664802551269531, 0.048954010009765625, 0.05125999450683594, 0.05356597900390625, 0.05587196350097656, 0.058177947998046875, 0.06048393249511719, 0.0627899169921875, 0.06509590148925781, 0.06740188598632812, 0.06970787048339844, 0.07201385498046875, 0.07431983947753906, 0.07662582397460938, 0.07893180847167969, 0.08123779296875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 10.0, 10.0, 21.0, 46.0, 80.0, 117.0, 148.0, 149.0, 141.0, 110.0, 77.0, 45.0, 20.0, 13.0, 11.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0901665687561035, -1.0443147420883179, -0.9984630346298218, -0.9526112079620361, -0.9067594408988953, -0.8609076738357544, -0.8150558471679688, -0.7692040801048279, -0.723352313041687, -0.6775005459785461, -0.6316487789154053, -0.5857969522476196, -0.5399451851844788, -0.4940934181213379, -0.44824162125587463, -0.4023898243904114, -0.3565380573272705, -0.31068629026412964, -0.2648344933986664, -0.21898271143436432, -0.17313092947006226, -0.1272791475057602, -0.08142736554145813, -0.03557556867599487, 0.010276198387145996, 0.05612798035144806, 0.10197976231575012, 0.14783154428005219, 0.19368332624435425, 0.2395351082086563, 0.2853868901729584, 0.33123868703842163, 0.3770904541015625, 0.42294222116470337, 0.4687940180301666, 0.5146458148956299, 0.5604975819587708, 0.6063493490219116, 0.6522011756896973, 0.6980529427528381, 0.743904709815979, 0.7897564768791199, 0.8356082439422607, 0.8814600706100464, 0.9273118376731873, 0.9731636047363281, 1.0190154314041138, 1.0648672580718994, 1.1107189655303955, 1.1565707921981812, 1.2024224996566772, 1.248274326324463, 1.294126033782959, 1.3399778604507446, 1.3858296871185303, 1.4316813945770264, 1.477533221244812, 1.5233850479125977, 1.5692367553710938, 1.6150885820388794, 1.660940408706665, 1.7067921161651611, 1.7526439428329468, 1.7984957695007324, 1.8443474769592285]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 7.0, 8.0, 11.0, 9.0, 11.0, 14.0, 15.0, 30.0, 28.0, 28.0, 32.0, 54.0, 48.0, 52.0, 47.0, 61.0, 56.0, 66.0, 67.0, 49.0, 45.0, 37.0, 36.0, 30.0, 32.0, 26.0, 14.0, 18.0, 21.0, 15.0, 7.0, 17.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.1282103061676025, -1.0989480018615723, -1.0696858167648315, -1.0404235124588013, -1.0111613273620605, -0.9818990230560303, -0.9526367783546448, -0.9233745336532593, -0.894112229347229, -0.8648499846458435, -0.835587739944458, -0.8063254356384277, -0.7770631909370422, -0.7478009462356567, -0.7185387015342712, -0.6892764568328857, -0.6600141525268555, -0.63075190782547, -0.6014896631240845, -0.5722273588180542, -0.5429651141166687, -0.5137028694152832, -0.4844406247138977, -0.4551783502101898, -0.4259161353111267, -0.3966538906097412, -0.3673916161060333, -0.3381293714046478, -0.30886709690093994, -0.27960485219955444, -0.25034260749816895, -0.22108033299446106, -0.19181805849075317, -0.16255579888820648, -0.1332935392856598, -0.1040312871336937, -0.074769027531147, -0.04550677537918091, -0.016244515776634216, 0.013017743825912476, 0.04228000342845917, 0.07154226303100586, 0.10080452263355255, 0.13006678223609924, 0.15932902693748474, 0.18859128654003143, 0.21785354614257812, 0.24711580574512482, 0.2763780653476715, 0.305640310049057, 0.3349025845527649, 0.3641648292541504, 0.3934271037578583, 0.4226893484592438, 0.45195162296295166, 0.48121386766433716, 0.5104761123657227, 0.5397383570671082, 0.5690006017684937, 0.5982629060745239, 0.6275251507759094, 0.6567873954772949, 0.6860496401786804, 0.7153118848800659, 0.7445741891860962]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 12.0, 8.0, 9.0, 10.0, 23.0, 30.0, 46.0, 47.0, 76.0, 118.0, 167.0, 254.0, 401.0, 786.0, 1629.0, 4176.0, 18943.0, 4070729.0, 83403.0, 8365.0, 2461.0, 1055.0, 548.0, 346.0, 206.0, 128.0, 86.0, 66.0, 44.0, 31.0, 20.0, 17.0, 12.0, 9.0, 4.0, 5.0, 6.0, 2.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.315185546875, -0.30556488037109375, -0.2959442138671875, -0.28632354736328125, -0.276702880859375, -0.26708221435546875, -0.2574615478515625, -0.24784088134765625, -0.23822021484375, -0.22859954833984375, -0.2189788818359375, -0.20935821533203125, -0.199737548828125, -0.19011688232421875, -0.1804962158203125, -0.17087554931640625, -0.1612548828125, -0.15163421630859375, -0.1420135498046875, -0.13239288330078125, -0.122772216796875, -0.11315155029296875, -0.1035308837890625, -0.09391021728515625, -0.08428955078125, -0.07466888427734375, -0.0650482177734375, -0.05542755126953125, -0.045806884765625, -0.03618621826171875, -0.0265655517578125, -0.01694488525390625, -0.00732421875, 0.00229644775390625, 0.0119171142578125, 0.02153778076171875, 0.031158447265625, 0.04077911376953125, 0.0503997802734375, 0.06002044677734375, 0.06964111328125, 0.07926177978515625, 0.0888824462890625, 0.09850311279296875, 0.108123779296875, 0.11774444580078125, 0.1273651123046875, 0.13698577880859375, 0.1466064453125, 0.15622711181640625, 0.1658477783203125, 0.17546844482421875, 0.185089111328125, 0.19470977783203125, 0.2043304443359375, 0.21395111083984375, 0.22357177734375, 0.23319244384765625, 0.2428131103515625, 0.25243377685546875, 0.262054443359375, 0.27167510986328125, 0.2812957763671875, 0.29091644287109375, 0.300537109375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 6.0, 4.0, 5.0, 3.0, 8.0, 9.0, 13.0, 11.0, 25.0, 16.0, 26.0, 30.0, 43.0, 27.0, 41.0, 50.0, 53.0, 54.0, 46.0, 65.0, 57.0, 50.0, 43.0, 45.0, 43.0, 29.0, 41.0, 38.0, 20.0, 20.0, 18.0, 15.0, 13.0, 11.0, 10.0, 4.0, 5.0, 5.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.038726806640625, -0.037693023681640625, -0.03665924072265625, -0.035625457763671875, -0.0345916748046875, -0.033557891845703125, -0.03252410888671875, -0.031490325927734375, -0.03045654296875, -0.029422760009765625, -0.02838897705078125, -0.027355194091796875, -0.0263214111328125, -0.025287628173828125, -0.02425384521484375, -0.023220062255859375, -0.022186279296875, -0.021152496337890625, -0.02011871337890625, -0.019084930419921875, -0.0180511474609375, -0.017017364501953125, -0.01598358154296875, -0.014949798583984375, -0.013916015625, -0.012882232666015625, -0.01184844970703125, -0.010814666748046875, -0.0097808837890625, -0.008747100830078125, -0.00771331787109375, -0.006679534912109375, -0.005645751953125, -0.004611968994140625, -0.00357818603515625, -0.002544403076171875, -0.0015106201171875, -0.000476837158203125, 0.00055694580078125, 0.001590728759765625, 0.00262451171875, 0.003658294677734375, 0.00469207763671875, 0.005725860595703125, 0.0067596435546875, 0.007793426513671875, 0.00882720947265625, 0.009860992431640625, 0.010894775390625, 0.011928558349609375, 0.01296234130859375, 0.013996124267578125, 0.0150299072265625, 0.016063690185546875, 0.01709747314453125, 0.018131256103515625, 0.0191650390625, 0.020198822021484375, 0.02123260498046875, 0.022266387939453125, 0.0233001708984375, 0.024333953857421875, 0.02536773681640625, 0.026401519775390625, 0.027435302734375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 8.0, 9.0, 8.0, 10.0, 17.0, 20.0, 28.0, 42.0, 70.0, 98.0, 106.0, 133.0, 197.0, 328.0, 529.0, 832.0, 1451.0, 3059.0, 8172.0, 36818.0, 4028192.0, 93184.0, 12246.0, 4097.0, 1800.0, 963.0, 597.0, 372.0, 260.0, 185.0, 120.0, 83.0, 90.0, 60.0, 20.0, 21.0, 18.0, 17.0, 3.0, 8.0, 5.0, 5.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.270751953125, -0.261627197265625, -0.25250244140625, -0.243377685546875, -0.2342529296875, -0.225128173828125, -0.21600341796875, -0.206878662109375, -0.19775390625, -0.188629150390625, -0.17950439453125, -0.170379638671875, -0.1612548828125, -0.152130126953125, -0.14300537109375, -0.133880615234375, -0.124755859375, -0.115631103515625, -0.10650634765625, -0.097381591796875, -0.0882568359375, -0.079132080078125, -0.07000732421875, -0.060882568359375, -0.0517578125, -0.042633056640625, -0.03350830078125, -0.024383544921875, -0.0152587890625, -0.006134033203125, 0.00299072265625, 0.012115478515625, 0.021240234375, 0.030364990234375, 0.03948974609375, 0.048614501953125, 0.0577392578125, 0.066864013671875, 0.07598876953125, 0.085113525390625, 0.09423828125, 0.103363037109375, 0.11248779296875, 0.121612548828125, 0.1307373046875, 0.139862060546875, 0.14898681640625, 0.158111572265625, 0.167236328125, 0.176361083984375, 0.18548583984375, 0.194610595703125, 0.2037353515625, 0.212860107421875, 0.22198486328125, 0.231109619140625, 0.240234375, 0.249359130859375, 0.25848388671875, 0.267608642578125, 0.2767333984375, 0.285858154296875, 0.29498291015625, 0.304107666015625, 0.313232421875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 9.0, 2.0, 8.0, 13.0, 39.0, 95.0, 3152.0, 589.0, 77.0, 34.0, 15.0, 14.0, 11.0, 3.0, 3.0, 5.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0899658203125, -0.08759450912475586, -0.08522319793701172, -0.08285188674926758, -0.08048057556152344, -0.0781092643737793, -0.07573795318603516, -0.07336664199829102, -0.07099533081054688, -0.06862401962280273, -0.0662527084350586, -0.06388139724731445, -0.06151008605957031, -0.05913877487182617, -0.05676746368408203, -0.05439615249633789, -0.05202484130859375, -0.04965353012084961, -0.04728221893310547, -0.04491090774536133, -0.04253959655761719, -0.04016828536987305, -0.037796974182128906, -0.035425662994384766, -0.033054351806640625, -0.030683040618896484, -0.028311729431152344, -0.025940418243408203, -0.023569107055664062, -0.021197795867919922, -0.01882648468017578, -0.01645517349243164, -0.0140838623046875, -0.01171255111694336, -0.009341239929199219, -0.006969928741455078, -0.0045986175537109375, -0.002227306365966797, 0.00014400482177734375, 0.0025153160095214844, 0.004886627197265625, 0.007257938385009766, 0.009629249572753906, 0.012000560760498047, 0.014371871948242188, 0.016743183135986328, 0.01911449432373047, 0.02148580551147461, 0.02385711669921875, 0.02622842788696289, 0.02859973907470703, 0.030971050262451172, 0.03334236145019531, 0.03571367263793945, 0.038084983825683594, 0.040456295013427734, 0.042827606201171875, 0.045198917388916016, 0.047570228576660156, 0.0499415397644043, 0.05231285095214844, 0.05468416213989258, 0.05705547332763672, 0.05942678451538086, 0.061798095703125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 7.0, 10.0, 14.0, 18.0, 30.0, 43.0, 74.0, 103.0, 116.0, 143.0, 133.0, 84.0, 79.0, 49.0, 29.0, 29.0, 11.0, 7.0, 8.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18322843313217163, -0.17545722424983978, -0.16768601536750793, -0.15991482138633728, -0.15214361250400543, -0.14437240362167358, -0.13660119473934174, -0.1288299858570099, -0.12105877697467804, -0.11328756809234619, -0.10551636666059494, -0.09774515777826309, -0.08997394889593124, -0.08220274746417999, -0.07443153858184814, -0.0666603296995163, -0.058889128267765045, -0.051117923110723495, -0.04334671422839165, -0.0355755090713501, -0.0278043020516634, -0.0200330950319767, -0.01226188987493515, -0.004490680992603302, 0.0032805241644382477, 0.011051731184124947, 0.018822938203811646, 0.026594143360853195, 0.034365348517894745, 0.04213655740022659, 0.04990776255726814, 0.05767897143959999, 0.06545017659664154, 0.07322138547897339, 0.08099258691072464, 0.08876379579305649, 0.09653500467538834, 0.10430620610713959, 0.11207741498947144, 0.11984862387180328, 0.12761983275413513, 0.13539104163646698, 0.14316225051879883, 0.15093344449996948, 0.15870465338230133, 0.16647586226463318, 0.17424707114696503, 0.18201828002929688, 0.18978947401046753, 0.19756068289279938, 0.20533189177513123, 0.21310308575630188, 0.22087429463863373, 0.22864550352096558, 0.23641671240329742, 0.24418792128562927, 0.2519591450691223, 0.25973033905029297, 0.267501562833786, 0.27527275681495667, 0.2830439805984497, 0.29081517457962036, 0.298586368560791, 0.30635759234428406, 0.3141287863254547]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 11.0, 7.0, 12.0, 8.0, 13.0, 19.0, 18.0, 17.0, 19.0, 27.0, 28.0, 29.0, 33.0, 28.0, 34.0, 31.0, 41.0, 37.0, 36.0, 51.0, 40.0, 29.0, 33.0, 31.0, 31.0, 36.0, 35.0, 34.0, 29.0, 23.0, 23.0, 25.0, 21.0, 20.0, 14.0, 12.0, 16.0, 11.0, 6.0, 6.0, 6.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09320485591888428, -0.08998407423496246, -0.08676329255104065, -0.08354251086711884, -0.08032172918319702, -0.07710094749927521, -0.0738801583647728, -0.07065937668085098, -0.06743859499692917, -0.06421781331300735, -0.06099703162908554, -0.05777624621987343, -0.054555464535951614, -0.0513346828520298, -0.04811389744281769, -0.044893115758895874, -0.04167233407497406, -0.038451552391052246, -0.03523077070713043, -0.03200998529791832, -0.028789203613996506, -0.025568421930074692, -0.02234763838350773, -0.019126854836940765, -0.01590607315301895, -0.012685290537774563, -0.009464507922530174, -0.006243725307285786, -0.003022942692041397, 0.00019783899188041687, 0.00341862253844738, 0.006639406085014343, 0.009860187768936157, 0.013080970384180546, 0.016301752999424934, 0.019522536545991898, 0.02274331822991371, 0.025964099913835526, 0.02918488346040249, 0.03240566700696945, 0.035626448690891266, 0.03884723037481308, 0.042068012058734894, 0.045288797467947006, 0.04850957915186882, 0.051730360835790634, 0.05495114624500275, 0.05817192792892456, 0.061392709612846375, 0.06461349129676819, 0.06783427298069, 0.07105505466461182, 0.07427583634853363, 0.07749661803245544, 0.08071740716695786, 0.08393818885087967, 0.08715897053480148, 0.0903797522187233, 0.09360053390264511, 0.09682131558656693, 0.10004210472106934, 0.10326288640499115, 0.10648366808891296, 0.10970444977283478, 0.11292523145675659]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 4.0, 6.0, 3.0, 9.0, 14.0, 17.0, 31.0, 53.0, 69.0, 111.0, 220.0, 274.0, 510.0, 860.0, 1686.0, 3472.0, 6996.0, 15422.0, 34762.0, 81852.0, 181734.0, 294416.0, 229716.0, 110074.0, 47607.0, 20221.0, 9254.0, 4292.0, 2162.0, 1162.0, 582.0, 369.0, 207.0, 140.0, 89.0, 56.0, 37.0, 29.0, 5.0, 17.0, 10.0, 4.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0704345703125, -0.0683431625366211, -0.06625175476074219, -0.06416034698486328, -0.062068939208984375, -0.05997753143310547, -0.05788612365722656, -0.055794715881347656, -0.05370330810546875, -0.051611900329589844, -0.04952049255371094, -0.04742908477783203, -0.045337677001953125, -0.04324626922607422, -0.04115486145019531, -0.039063453674316406, -0.0369720458984375, -0.034880638122558594, -0.03278923034667969, -0.03069782257080078, -0.028606414794921875, -0.02651500701904297, -0.024423599243164062, -0.022332191467285156, -0.02024078369140625, -0.018149375915527344, -0.016057968139648438, -0.013966560363769531, -0.011875152587890625, -0.009783744812011719, -0.0076923370361328125, -0.005600929260253906, -0.003509521484375, -0.0014181137084960938, 0.0006732940673828125, 0.0027647018432617188, 0.004856109619140625, 0.006947517395019531, 0.009038925170898438, 0.011130332946777344, 0.01322174072265625, 0.015313148498535156, 0.017404556274414062, 0.01949596405029297, 0.021587371826171875, 0.02367877960205078, 0.025770187377929688, 0.027861595153808594, 0.0299530029296875, 0.032044410705566406, 0.03413581848144531, 0.03622722625732422, 0.038318634033203125, 0.04041004180908203, 0.04250144958496094, 0.044592857360839844, 0.04668426513671875, 0.048775672912597656, 0.05086708068847656, 0.05295848846435547, 0.055049896240234375, 0.05714130401611328, 0.05923271179199219, 0.061324119567871094, 0.06341552734375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 5.0, 11.0, 6.0, 16.0, 11.0, 15.0, 18.0, 14.0, 14.0, 18.0, 32.0, 32.0, 41.0, 28.0, 40.0, 48.0, 41.0, 59.0, 44.0, 38.0, 33.0, 39.0, 50.0, 42.0, 40.0, 43.0, 30.0, 27.0, 26.0, 31.0, 16.0, 13.0, 13.0, 18.0, 10.0, 10.0, 4.0, 2.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0290374755859375, -0.028041601181030273, -0.027045726776123047, -0.02604985237121582, -0.025053977966308594, -0.024058103561401367, -0.02306222915649414, -0.022066354751586914, -0.021070480346679688, -0.02007460594177246, -0.019078731536865234, -0.018082857131958008, -0.01708698272705078, -0.016091108322143555, -0.015095233917236328, -0.014099359512329102, -0.013103485107421875, -0.012107610702514648, -0.011111736297607422, -0.010115861892700195, -0.009119987487792969, -0.008124113082885742, -0.007128238677978516, -0.006132364273071289, -0.0051364898681640625, -0.004140615463256836, -0.0031447410583496094, -0.002148866653442383, -0.0011529922485351562, -0.0001571178436279297, 0.0008387565612792969, 0.0018346309661865234, 0.00283050537109375, 0.0038263797760009766, 0.004822254180908203, 0.00581812858581543, 0.006814002990722656, 0.007809877395629883, 0.00880575180053711, 0.009801626205444336, 0.010797500610351562, 0.011793375015258789, 0.012789249420166016, 0.013785123825073242, 0.014780998229980469, 0.015776872634887695, 0.016772747039794922, 0.01776862144470215, 0.018764495849609375, 0.0197603702545166, 0.020756244659423828, 0.021752119064331055, 0.02274799346923828, 0.023743867874145508, 0.024739742279052734, 0.02573561668395996, 0.026731491088867188, 0.027727365493774414, 0.02872323989868164, 0.029719114303588867, 0.030714988708496094, 0.03171086311340332, 0.03270673751831055, 0.03370261192321777, 0.034698486328125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 2.0, 2.0, 5.0, 6.0, 3.0, 7.0, 13.0, 15.0, 28.0, 30.0, 73.0, 79.0, 133.0, 191.0, 297.0, 473.0, 921.0, 1932.0, 5059.0, 17124.0, 83425.0, 495341.0, 364175.0, 58743.0, 12624.0, 4112.0, 1655.0, 800.0, 442.0, 272.0, 188.0, 101.0, 89.0, 49.0, 33.0, 28.0, 25.0, 12.0, 20.0, 7.0, 5.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.141357421875, -0.1374197006225586, -0.1334819793701172, -0.12954425811767578, -0.12560653686523438, -0.12166881561279297, -0.11773109436035156, -0.11379337310791016, -0.10985565185546875, -0.10591793060302734, -0.10198020935058594, -0.09804248809814453, -0.09410476684570312, -0.09016704559326172, -0.08622932434082031, -0.0822916030883789, -0.0783538818359375, -0.0744161605834961, -0.07047843933105469, -0.06654071807861328, -0.06260299682617188, -0.05866527557373047, -0.05472755432128906, -0.050789833068847656, -0.04685211181640625, -0.042914390563964844, -0.03897666931152344, -0.03503894805908203, -0.031101226806640625, -0.02716350555419922, -0.023225784301757812, -0.019288063049316406, -0.015350341796875, -0.011412620544433594, -0.0074748992919921875, -0.0035371780395507812, 0.000400543212890625, 0.004338264465332031, 0.008275985717773438, 0.012213706970214844, 0.01615142822265625, 0.020089149475097656, 0.024026870727539062, 0.02796459197998047, 0.031902313232421875, 0.03584003448486328, 0.03977775573730469, 0.043715476989746094, 0.0476531982421875, 0.051590919494628906, 0.05552864074707031, 0.05946636199951172, 0.06340408325195312, 0.06734180450439453, 0.07127952575683594, 0.07521724700927734, 0.07915496826171875, 0.08309268951416016, 0.08703041076660156, 0.09096813201904297, 0.09490585327148438, 0.09884357452392578, 0.10278129577636719, 0.1067190170288086, 0.11065673828125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 2.0, 6.0, 3.0, 8.0, 3.0, 12.0, 10.0, 13.0, 14.0, 13.0, 22.0, 33.0, 28.0, 32.0, 21.0, 34.0, 47.0, 31.0, 48.0, 60.0, 60.0, 50.0, 45.0, 58.0, 36.0, 35.0, 23.0, 33.0, 31.0, 32.0, 25.0, 29.0, 18.0, 15.0, 17.0, 12.0, 13.0, 9.0, 4.0, 5.0, 4.0, 5.0, 2.0, 1.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1376953125, -0.13295745849609375, -0.1282196044921875, -0.12348175048828125, -0.118743896484375, -0.11400604248046875, -0.1092681884765625, -0.10453033447265625, -0.09979248046875, -0.09505462646484375, -0.0903167724609375, -0.08557891845703125, -0.080841064453125, -0.07610321044921875, -0.0713653564453125, -0.06662750244140625, -0.0618896484375, -0.05715179443359375, -0.0524139404296875, -0.04767608642578125, -0.042938232421875, -0.03820037841796875, -0.0334625244140625, -0.02872467041015625, -0.02398681640625, -0.01924896240234375, -0.0145111083984375, -0.00977325439453125, -0.005035400390625, -0.00029754638671875, 0.0044403076171875, 0.00917816162109375, 0.013916015625, 0.01865386962890625, 0.0233917236328125, 0.02812957763671875, 0.032867431640625, 0.03760528564453125, 0.0423431396484375, 0.04708099365234375, 0.05181884765625, 0.05655670166015625, 0.0612945556640625, 0.06603240966796875, 0.070770263671875, 0.07550811767578125, 0.0802459716796875, 0.08498382568359375, 0.0897216796875, 0.09445953369140625, 0.0991973876953125, 0.10393524169921875, 0.108673095703125, 0.11341094970703125, 0.1181488037109375, 0.12288665771484375, 0.12762451171875, 0.13236236572265625, 0.1371002197265625, 0.14183807373046875, 0.146575927734375, 0.15131378173828125, 0.1560516357421875, 0.16078948974609375, 0.16552734375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 6.0, 3.0, 5.0, 9.0, 9.0, 15.0, 20.0, 28.0, 48.0, 74.0, 149.0, 301.0, 781.0, 3271.0, 27469.0, 858417.0, 148013.0, 7556.0, 1449.0, 439.0, 213.0, 112.0, 53.0, 29.0, 21.0, 13.0, 13.0, 8.0, 5.0, 4.0, 9.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1849365234375, -0.1801614761352539, -0.1753864288330078, -0.17061138153076172, -0.16583633422851562, -0.16106128692626953, -0.15628623962402344, -0.15151119232177734, -0.14673614501953125, -0.14196109771728516, -0.13718605041503906, -0.13241100311279297, -0.12763595581054688, -0.12286090850830078, -0.11808586120605469, -0.1133108139038086, -0.1085357666015625, -0.1037607192993164, -0.09898567199707031, -0.09421062469482422, -0.08943557739257812, -0.08466053009033203, -0.07988548278808594, -0.07511043548583984, -0.07033538818359375, -0.06556034088134766, -0.06078529357910156, -0.05601024627685547, -0.051235198974609375, -0.04646015167236328, -0.04168510437011719, -0.036910057067871094, -0.032135009765625, -0.027359962463378906, -0.022584915161132812, -0.01780986785888672, -0.013034820556640625, -0.008259773254394531, -0.0034847259521484375, 0.0012903213500976562, 0.00606536865234375, 0.010840415954589844, 0.015615463256835938, 0.02039051055908203, 0.025165557861328125, 0.02994060516357422, 0.03471565246582031, 0.039490699768066406, 0.0442657470703125, 0.049040794372558594, 0.05381584167480469, 0.05859088897705078, 0.06336593627929688, 0.06814098358154297, 0.07291603088378906, 0.07769107818603516, 0.08246612548828125, 0.08724117279052734, 0.09201622009277344, 0.09679126739501953, 0.10156631469726562, 0.10634136199951172, 0.11111640930175781, 0.1158914566040039, 0.12066650390625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 7.0, 16.0, 13.0, 24.0, 29.0, 26.0, 50.0, 51.0, 77.0, 73.0, 93.0, 76.0, 78.0, 67.0, 69.0, 39.0, 34.0, 37.0, 22.0, 24.0, 13.0, 25.0, 11.0, 13.0, 9.0, 3.0, 5.0, 5.0, 2.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.300739288330078e-05, -2.2184103727340698e-05, -2.1360814571380615e-05, -2.0537525415420532e-05, -1.971423625946045e-05, -1.8890947103500366e-05, -1.8067657947540283e-05, -1.72443687915802e-05, -1.6421079635620117e-05, -1.5597790479660034e-05, -1.4774501323699951e-05, -1.3951212167739868e-05, -1.3127923011779785e-05, -1.2304633855819702e-05, -1.1481344699859619e-05, -1.0658055543899536e-05, -9.834766387939453e-06, -9.01147723197937e-06, -8.188188076019287e-06, -7.364898920059204e-06, -6.541609764099121e-06, -5.718320608139038e-06, -4.895031452178955e-06, -4.071742296218872e-06, -3.248453140258789e-06, -2.425163984298706e-06, -1.601874828338623e-06, -7.7858567237854e-07, 4.470348358154297e-08, 8.67992639541626e-07, 1.691281795501709e-06, 2.514570951461792e-06, 3.337860107421875e-06, 4.161149263381958e-06, 4.984438419342041e-06, 5.807727575302124e-06, 6.631016731262207e-06, 7.45430588722229e-06, 8.277595043182373e-06, 9.100884199142456e-06, 9.924173355102539e-06, 1.0747462511062622e-05, 1.1570751667022705e-05, 1.2394040822982788e-05, 1.3217329978942871e-05, 1.4040619134902954e-05, 1.4863908290863037e-05, 1.568719744682312e-05, 1.6510486602783203e-05, 1.7333775758743286e-05, 1.815706491470337e-05, 1.8980354070663452e-05, 1.9803643226623535e-05, 2.0626932382583618e-05, 2.14502215385437e-05, 2.2273510694503784e-05, 2.3096799850463867e-05, 2.392008900642395e-05, 2.4743378162384033e-05, 2.5566667318344116e-05, 2.63899564743042e-05, 2.7213245630264282e-05, 2.8036534786224365e-05, 2.8859823942184448e-05, 2.968311309814453e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 7.0, 6.0, 7.0, 8.0, 19.0, 28.0, 30.0, 38.0, 76.0, 135.0, 202.0, 345.0, 725.0, 1524.0, 3858.0, 12858.0, 83399.0, 687958.0, 223287.0, 23869.0, 5943.0, 2121.0, 974.0, 470.0, 234.0, 126.0, 90.0, 78.0, 33.0, 31.0, 16.0, 8.0, 17.0, 8.0, 7.0, 5.0, 4.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.08917236328125, -0.08635902404785156, -0.08354568481445312, -0.08073234558105469, -0.07791900634765625, -0.07510566711425781, -0.07229232788085938, -0.06947898864746094, -0.0666656494140625, -0.06385231018066406, -0.061038970947265625, -0.05822563171386719, -0.05541229248046875, -0.05259895324707031, -0.049785614013671875, -0.04697227478027344, -0.044158935546875, -0.04134559631347656, -0.038532257080078125, -0.03571891784667969, -0.03290557861328125, -0.030092239379882812, -0.027278900146484375, -0.024465560913085938, -0.0216522216796875, -0.018838882446289062, -0.016025543212890625, -0.013212203979492188, -0.01039886474609375, -0.0075855255126953125, -0.004772186279296875, -0.0019588470458984375, 0.0008544921875, 0.0036678314208984375, 0.006481170654296875, 0.009294509887695312, 0.01210784912109375, 0.014921188354492188, 0.017734527587890625, 0.020547866821289062, 0.0233612060546875, 0.026174545288085938, 0.028987884521484375, 0.03180122375488281, 0.03461456298828125, 0.03742790222167969, 0.040241241455078125, 0.04305458068847656, 0.045867919921875, 0.04868125915527344, 0.051494598388671875, 0.05430793762207031, 0.05712127685546875, 0.05993461608886719, 0.06274795532226562, 0.06556129455566406, 0.0683746337890625, 0.07118797302246094, 0.07400131225585938, 0.07681465148925781, 0.07962799072265625, 0.08244132995605469, 0.08525466918945312, 0.08806800842285156, 0.09088134765625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 1.0, 3.0, 5.0, 6.0, 7.0, 9.0, 23.0, 36.0, 67.0, 116.0, 134.0, 150.0, 162.0, 104.0, 69.0, 45.0, 27.0, 13.0, 12.0, 7.0, 3.0, 5.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1597900390625, -0.15594959259033203, -0.15210914611816406, -0.1482686996459961, -0.14442825317382812, -0.14058780670166016, -0.1367473602294922, -0.13290691375732422, -0.12906646728515625, -0.12522602081298828, -0.12138557434082031, -0.11754512786865234, -0.11370468139648438, -0.1098642349243164, -0.10602378845214844, -0.10218334197998047, -0.0983428955078125, -0.09450244903564453, -0.09066200256347656, -0.0868215560913086, -0.08298110961914062, -0.07914066314697266, -0.07530021667480469, -0.07145977020263672, -0.06761932373046875, -0.06377887725830078, -0.05993843078613281, -0.056097984313964844, -0.052257537841796875, -0.048417091369628906, -0.04457664489746094, -0.04073619842529297, -0.036895751953125, -0.03305530548095703, -0.029214859008789062, -0.025374412536621094, -0.021533966064453125, -0.017693519592285156, -0.013853073120117188, -0.010012626647949219, -0.00617218017578125, -0.0023317337036132812, 0.0015087127685546875, 0.005349159240722656, 0.009189605712890625, 0.013030052185058594, 0.016870498657226562, 0.02071094512939453, 0.0245513916015625, 0.02839183807373047, 0.03223228454589844, 0.036072731018066406, 0.039913177490234375, 0.043753623962402344, 0.04759407043457031, 0.05143451690673828, 0.05527496337890625, 0.05911540985107422, 0.06295585632324219, 0.06679630279541016, 0.07063674926757812, 0.0744771957397461, 0.07831764221191406, 0.08215808868408203, 0.08599853515625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 7.0, 25.0, 60.0, 186.0, 271.0, 257.0, 143.0, 31.0, 15.0, 6.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0014524459838867, -0.9235528111457825, -0.8456531763076782, -0.7677536010742188, -0.6898539662361145, -0.6119543313980103, -0.5340547561645508, -0.45615512132644653, -0.3782554864883423, -0.30035585165023804, -0.22245624661445618, -0.14455662667751312, -0.06665700674057007, 0.01124262809753418, 0.08914223313331604, 0.1670418381690979, 0.24494147300720215, 0.3228411078453064, 0.40074071288108826, 0.4786403179168701, 0.5565399527549744, 0.6344395875930786, 0.7123391628265381, 0.7902387976646423, 0.8681384325027466, 0.9460380673408508, 1.023937702178955, 1.1018372774124146, 1.179736852645874, 1.257636547088623, 1.3355361223220825, 1.413435697555542, 1.491335153579712, 1.5692347288131714, 1.6471344232559204, 1.7250339984893799, 1.802933692932129, 1.8808332681655884, 1.9587328433990479, 2.036632537841797, 2.114531993865967, 2.192431688308716, 2.2703311443328857, 2.3482308387756348, 2.426130533218384, 2.504030227661133, 2.5819296836853027, 2.6598293781280518, 2.737729072570801, 2.81562876701355, 2.8935282230377197, 2.9714279174804688, 3.0493276119232178, 3.127227306365967, 3.2051267623901367, 3.2830264568328857, 3.3609261512756348, 3.438825845718384, 3.5167253017425537, 3.5946249961853027, 3.6725246906280518, 3.750424385070801, 3.8283238410949707, 3.9062235355377197, 3.9841229915618896]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 7.0, 11.0, 8.0, 13.0, 13.0, 14.0, 15.0, 22.0, 32.0, 34.0, 32.0, 34.0, 42.0, 42.0, 47.0, 55.0, 59.0, 49.0, 44.0, 48.0, 55.0, 38.0, 38.0, 41.0, 34.0, 33.0, 33.0, 13.0, 18.0, 11.0, 19.0, 9.0, 9.0, 8.0, 7.0, 6.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8185887336730957, -0.794086217880249, -0.7695837616920471, -0.7450812458992004, -0.7205787897109985, -0.6960762739181519, -0.6715737581253052, -0.6470712423324585, -0.6225687861442566, -0.5980662703514099, -0.573563814163208, -0.5490612983703613, -0.5245587825775146, -0.5000563263893127, -0.47555381059646606, -0.4510513246059418, -0.4265488386154175, -0.4020463526248932, -0.3775438666343689, -0.3530413508415222, -0.3285388648509979, -0.30403637886047363, -0.27953386306762695, -0.25503137707710266, -0.23052889108657837, -0.20602640509605408, -0.1815239042043686, -0.1570214033126831, -0.1325189173221588, -0.10801642388105392, -0.08351393043994904, -0.05901142954826355, -0.03450888395309448, -0.010006390511989594, 0.014496102929115295, 0.038998596370220184, 0.06350108981132507, 0.08800358325242996, 0.11250607669353485, 0.13700857758522034, 0.16151106357574463, 0.18601354956626892, 0.2105160504579544, 0.2350185513496399, 0.2595210373401642, 0.2840235233306885, 0.30852603912353516, 0.33302852511405945, 0.35753101110458374, 0.38203349709510803, 0.4065359830856323, 0.431038498878479, 0.4555409848690033, 0.4800434708595276, 0.5045459866523743, 0.5290484428405762, 0.5535509586334229, 0.5780534744262695, 0.6025559306144714, 0.6270584464073181, 0.65156090259552, 0.6760634183883667, 0.7005659341812134, 0.7250684499740601, 0.749570906162262]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 2.0, 6.0, 5.0, 5.0, 8.0, 23.0, 29.0, 50.0, 49.0, 104.0, 150.0, 274.0, 354.0, 684.0, 1150.0, 2496.0, 6454.0, 44672.0, 4113567.0, 15875.0, 4160.0, 1798.0, 940.0, 526.0, 332.0, 174.0, 120.0, 105.0, 61.0, 42.0, 24.0, 12.0, 11.0, 10.0, 7.0, 7.0, 5.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.185546875, -0.17722702026367188, -0.16890716552734375, -0.16058731079101562, -0.1522674560546875, -0.14394760131835938, -0.13562774658203125, -0.12730789184570312, -0.118988037109375, -0.11066818237304688, -0.10234832763671875, -0.09402847290039062, -0.0857086181640625, -0.07738876342773438, -0.06906890869140625, -0.060749053955078125, -0.05242919921875, -0.044109344482421875, -0.03578948974609375, -0.027469635009765625, -0.0191497802734375, -0.010829925537109375, -0.00251007080078125, 0.005809783935546875, 0.014129638671875, 0.022449493408203125, 0.03076934814453125, 0.039089202880859375, 0.0474090576171875, 0.055728912353515625, 0.06404876708984375, 0.07236862182617188, 0.0806884765625, 0.08900833129882812, 0.09732818603515625, 0.10564804077148438, 0.1139678955078125, 0.12228775024414062, 0.13060760498046875, 0.13892745971679688, 0.147247314453125, 0.15556716918945312, 0.16388702392578125, 0.17220687866210938, 0.1805267333984375, 0.18884658813476562, 0.19716644287109375, 0.20548629760742188, 0.21380615234375, 0.22212600708007812, 0.23044586181640625, 0.23876571655273438, 0.2470855712890625, 0.2554054260253906, 0.26372528076171875, 0.2720451354980469, 0.280364990234375, 0.2886848449707031, 0.29700469970703125, 0.3053245544433594, 0.3136444091796875, 0.3219642639160156, 0.33028411865234375, 0.3386039733886719, 0.346923828125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 7.0, 10.0, 15.0, 15.0, 21.0, 23.0, 27.0, 35.0, 31.0, 33.0, 39.0, 42.0, 54.0, 48.0, 45.0, 44.0, 49.0, 40.0, 49.0, 49.0, 46.0, 36.0, 34.0, 34.0, 30.0, 26.0, 22.0, 10.0, 12.0, 9.0, 18.0, 7.0, 6.0, 6.0, 9.0, 0.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.038330078125, -0.03719615936279297, -0.03606224060058594, -0.034928321838378906, -0.033794403076171875, -0.032660484313964844, -0.03152656555175781, -0.03039264678955078, -0.02925872802734375, -0.02812480926513672, -0.026990890502929688, -0.025856971740722656, -0.024723052978515625, -0.023589134216308594, -0.022455215454101562, -0.02132129669189453, -0.0201873779296875, -0.01905345916748047, -0.017919540405273438, -0.016785621643066406, -0.015651702880859375, -0.014517784118652344, -0.013383865356445312, -0.012249946594238281, -0.01111602783203125, -0.009982109069824219, -0.008848190307617188, -0.007714271545410156, -0.006580352783203125, -0.005446434020996094, -0.0043125152587890625, -0.0031785964965820312, -0.002044677734375, -0.0009107589721679688, 0.0002231597900390625, 0.0013570785522460938, 0.002490997314453125, 0.0036249160766601562, 0.0047588348388671875, 0.005892753601074219, 0.00702667236328125, 0.008160591125488281, 0.009294509887695312, 0.010428428649902344, 0.011562347412109375, 0.012696266174316406, 0.013830184936523438, 0.014964103698730469, 0.0160980224609375, 0.01723194122314453, 0.018365859985351562, 0.019499778747558594, 0.020633697509765625, 0.021767616271972656, 0.022901535034179688, 0.02403545379638672, 0.02516937255859375, 0.02630329132080078, 0.027437210083007812, 0.028571128845214844, 0.029705047607421875, 0.030838966369628906, 0.03197288513183594, 0.03310680389404297, 0.03424072265625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 5.0, 8.0, 7.0, 6.0, 9.0, 12.0, 27.0, 20.0, 22.0, 42.0, 61.0, 80.0, 110.0, 143.0, 180.0, 308.0, 546.0, 998.0, 3132.0, 100561.0, 4081016.0, 4114.0, 1182.0, 603.0, 315.0, 223.0, 148.0, 101.0, 76.0, 60.0, 36.0, 42.0, 23.0, 14.0, 8.0, 9.0, 10.0, 9.0, 2.0, 2.0, 2.0, 1.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.79296875, -0.7697067260742188, -0.7464447021484375, -0.7231826782226562, -0.699920654296875, -0.6766586303710938, -0.6533966064453125, -0.6301345825195312, -0.60687255859375, -0.5836105346679688, -0.5603485107421875, -0.5370864868164062, -0.513824462890625, -0.49056243896484375, -0.4673004150390625, -0.44403839111328125, -0.4207763671875, -0.39751434326171875, -0.3742523193359375, -0.35099029541015625, -0.327728271484375, -0.30446624755859375, -0.2812042236328125, -0.25794219970703125, -0.23468017578125, -0.21141815185546875, -0.1881561279296875, -0.16489410400390625, -0.141632080078125, -0.11837005615234375, -0.0951080322265625, -0.07184600830078125, -0.048583984375, -0.02532196044921875, -0.0020599365234375, 0.02120208740234375, 0.044464111328125, 0.06772613525390625, 0.0909881591796875, 0.11425018310546875, 0.13751220703125, 0.16077423095703125, 0.1840362548828125, 0.20729827880859375, 0.230560302734375, 0.25382232666015625, 0.2770843505859375, 0.30034637451171875, 0.3236083984375, 0.34687042236328125, 0.3701324462890625, 0.39339447021484375, 0.416656494140625, 0.43991851806640625, 0.4631805419921875, 0.48644256591796875, 0.50970458984375, 0.5329666137695312, 0.5562286376953125, 0.5794906616210938, 0.602752685546875, 0.6260147094726562, 0.6492767333984375, 0.6725387573242188, 0.69580078125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 8.0, 15.0, 102.0, 3884.0, 52.0, 11.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.169921875, -0.16414642333984375, -0.1583709716796875, -0.15259552001953125, -0.146820068359375, -0.14104461669921875, -0.1352691650390625, -0.12949371337890625, -0.12371826171875, -0.11794281005859375, -0.1121673583984375, -0.10639190673828125, -0.100616455078125, -0.09484100341796875, -0.0890655517578125, -0.08329010009765625, -0.0775146484375, -0.07173919677734375, -0.0659637451171875, -0.06018829345703125, -0.054412841796875, -0.04863739013671875, -0.0428619384765625, -0.03708648681640625, -0.03131103515625, -0.02553558349609375, -0.0197601318359375, -0.01398468017578125, -0.008209228515625, -0.00243377685546875, 0.0033416748046875, 0.00911712646484375, 0.014892578125, 0.02066802978515625, 0.0264434814453125, 0.03221893310546875, 0.037994384765625, 0.04376983642578125, 0.0495452880859375, 0.05532073974609375, 0.06109619140625, 0.06687164306640625, 0.0726470947265625, 0.07842254638671875, 0.084197998046875, 0.08997344970703125, 0.0957489013671875, 0.10152435302734375, 0.1072998046875, 0.11307525634765625, 0.1188507080078125, 0.12462615966796875, 0.130401611328125, 0.13617706298828125, 0.1419525146484375, 0.14772796630859375, 0.15350341796875, 0.15927886962890625, 0.1650543212890625, 0.17082977294921875, 0.176605224609375, 0.18238067626953125, 0.1881561279296875, 0.19393157958984375, 0.19970703125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 6.0, 8.0, 13.0, 20.0, 19.0, 19.0, 36.0, 53.0, 76.0, 81.0, 108.0, 108.0, 102.0, 96.0, 75.0, 47.0, 31.0, 29.0, 22.0, 14.0, 6.0, 10.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2450229972600937, -0.23755328357219696, -0.23008356988430023, -0.2226138710975647, -0.21514415740966797, -0.20767444372177124, -0.2002047300338745, -0.19273501634597778, -0.18526530265808105, -0.17779558897018433, -0.1703258752822876, -0.16285616159439087, -0.15538646280765533, -0.1479167491197586, -0.14044703543186188, -0.13297732174396515, -0.12550762295722961, -0.11803790926933289, -0.11056820303201675, -0.10309848934412003, -0.0956287831068039, -0.08815906941890717, -0.08068935573101044, -0.07321964204311371, -0.06574993580579758, -0.05828022584319115, -0.05081051588058472, -0.04334080219268799, -0.03587109223008156, -0.028401382267475128, -0.0209316685795784, -0.01346195861697197, -0.005992233753204346, 0.001477477140724659, 0.008947188034653664, 0.016416899859905243, 0.023886609822511673, 0.0313563197851181, 0.03882603347301483, 0.04629574343562126, 0.05376545339822769, 0.06123516336083412, 0.06870487332344055, 0.07617458701133728, 0.08364430069923401, 0.09111400693655014, 0.09858372062444687, 0.106053426861763, 0.11352314054965973, 0.12099285423755646, 0.12846256792545319, 0.13593226671218872, 0.14340198040008545, 0.15087169408798218, 0.1583414077758789, 0.16581112146377563, 0.17328083515167236, 0.1807505488395691, 0.18822026252746582, 0.19568997621536255, 0.20315967500209808, 0.2106293886899948, 0.21809910237789154, 0.22556881606578827, 0.2330385148525238]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 4.0, 2.0, 3.0, 4.0, 9.0, 7.0, 9.0, 10.0, 13.0, 18.0, 17.0, 20.0, 22.0, 28.0, 27.0, 28.0, 34.0, 33.0, 39.0, 41.0, 30.0, 34.0, 50.0, 36.0, 37.0, 44.0, 25.0, 33.0, 28.0, 43.0, 34.0, 27.0, 45.0, 17.0, 14.0, 15.0, 23.0, 19.0, 16.0, 15.0, 11.0, 6.0, 7.0, 5.0, 4.0, 5.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.1370716094970703, -0.1327364295721054, -0.1284012496471405, -0.1240660548210144, -0.1197308748960495, -0.1153956949710846, -0.11106050759553909, -0.10672532021999359, -0.10239014029502869, -0.09805496037006378, -0.09371977299451828, -0.08938458561897278, -0.08504940569400787, -0.08071422576904297, -0.07637903839349747, -0.07204385101795197, -0.06770867109298706, -0.06337349116802216, -0.059038303792476654, -0.05470312014222145, -0.05036793649196625, -0.046032752841711044, -0.04169756919145584, -0.03736238554120064, -0.033027201890945435, -0.02869201824069023, -0.024356834590435028, -0.020021650940179825, -0.01568646728992462, -0.011351283639669418, -0.007016099989414215, -0.002680916339159012, 0.0016542673110961914, 0.005989450961351395, 0.010324634611606598, 0.014659818261861801, 0.018995001912117004, 0.023330185562372208, 0.02766536921262741, 0.032000552862882614, 0.03633573651313782, 0.04067092016339302, 0.045006103813648224, 0.04934128746390343, 0.05367647111415863, 0.058011654764413834, 0.06234683841466904, 0.06668202579021454, 0.07101720571517944, 0.07535238564014435, 0.07968757301568985, 0.08402276039123535, 0.08835794031620026, 0.09269312024116516, 0.09702830761671066, 0.10136349499225616, 0.10569867491722107, 0.11003385484218597, 0.11436904221773148, 0.11870422959327698, 0.12303940951824188, 0.1273745894432068, 0.13170978426933289, 0.1360449641942978, 0.1403801441192627]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 9.0, 7.0, 4.0, 12.0, 10.0, 16.0, 30.0, 27.0, 41.0, 68.0, 100.0, 111.0, 227.0, 307.0, 444.0, 737.0, 1164.0, 2096.0, 3855.0, 7274.0, 15459.0, 35350.0, 88218.0, 227783.0, 354865.0, 183161.0, 70951.0, 29045.0, 12859.0, 6291.0, 3163.0, 1853.0, 1048.0, 693.0, 416.0, 284.0, 167.0, 109.0, 77.0, 56.0, 50.0, 30.0, 33.0, 16.0, 7.0, 8.0, 7.0, 2.0, 3.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 3.0], "bins": [-0.07763671875, -0.07516288757324219, -0.07268905639648438, -0.07021522521972656, -0.06774139404296875, -0.06526756286621094, -0.06279373168945312, -0.06031990051269531, -0.0578460693359375, -0.05537223815917969, -0.052898406982421875, -0.05042457580566406, -0.04795074462890625, -0.04547691345214844, -0.043003082275390625, -0.04052925109863281, -0.038055419921875, -0.03558158874511719, -0.033107757568359375, -0.030633926391601562, -0.02816009521484375, -0.025686264038085938, -0.023212432861328125, -0.020738601684570312, -0.0182647705078125, -0.015790939331054688, -0.013317108154296875, -0.010843276977539062, -0.00836944580078125, -0.0058956146240234375, -0.003421783447265625, -0.0009479522705078125, 0.00152587890625, 0.0039997100830078125, 0.006473541259765625, 0.008947372436523438, 0.01142120361328125, 0.013895034790039062, 0.016368865966796875, 0.018842697143554688, 0.0213165283203125, 0.023790359497070312, 0.026264190673828125, 0.028738021850585938, 0.03121185302734375, 0.03368568420410156, 0.036159515380859375, 0.03863334655761719, 0.041107177734375, 0.04358100891113281, 0.046054840087890625, 0.04852867126464844, 0.05100250244140625, 0.05347633361816406, 0.055950164794921875, 0.05842399597167969, 0.0608978271484375, 0.06337165832519531, 0.06584548950195312, 0.06831932067871094, 0.07079315185546875, 0.07326698303222656, 0.07574081420898438, 0.07821464538574219, 0.0806884765625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 7.0, 0.0, 6.0, 6.0, 5.0, 6.0, 9.0, 15.0, 15.0, 12.0, 16.0, 16.0, 20.0, 12.0, 28.0, 36.0, 41.0, 33.0, 32.0, 39.0, 29.0, 49.0, 47.0, 31.0, 53.0, 46.0, 49.0, 43.0, 46.0, 35.0, 28.0, 23.0, 27.0, 19.0, 16.0, 19.0, 12.0, 12.0, 14.0, 12.0, 10.0, 9.0, 4.0, 8.0, 4.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.040313720703125, -0.03911113739013672, -0.03790855407714844, -0.036705970764160156, -0.035503387451171875, -0.034300804138183594, -0.03309822082519531, -0.03189563751220703, -0.03069305419921875, -0.02949047088623047, -0.028287887573242188, -0.027085304260253906, -0.025882720947265625, -0.024680137634277344, -0.023477554321289062, -0.02227497100830078, -0.0210723876953125, -0.01986980438232422, -0.018667221069335938, -0.017464637756347656, -0.016262054443359375, -0.015059471130371094, -0.013856887817382812, -0.012654304504394531, -0.01145172119140625, -0.010249137878417969, -0.009046554565429688, -0.007843971252441406, -0.006641387939453125, -0.005438804626464844, -0.0042362213134765625, -0.0030336380004882812, -0.0018310546875, -0.0006284713745117188, 0.0005741119384765625, 0.0017766952514648438, 0.002979278564453125, 0.004181861877441406, 0.0053844451904296875, 0.006587028503417969, 0.00778961181640625, 0.008992195129394531, 0.010194778442382812, 0.011397361755371094, 0.012599945068359375, 0.013802528381347656, 0.015005111694335938, 0.01620769500732422, 0.0174102783203125, 0.01861286163330078, 0.019815444946289062, 0.021018028259277344, 0.022220611572265625, 0.023423194885253906, 0.024625778198242188, 0.02582836151123047, 0.02703094482421875, 0.02823352813720703, 0.029436111450195312, 0.030638694763183594, 0.031841278076171875, 0.033043861389160156, 0.03424644470214844, 0.03544902801513672, 0.036651611328125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 2.0, 3.0, 3.0, 11.0, 8.0, 14.0, 14.0, 27.0, 32.0, 39.0, 69.0, 89.0, 118.0, 198.0, 242.0, 443.0, 796.0, 1635.0, 4440.0, 16215.0, 95027.0, 684233.0, 206016.0, 27455.0, 6563.0, 2296.0, 1015.0, 526.0, 327.0, 215.0, 157.0, 98.0, 68.0, 49.0, 36.0, 27.0, 14.0, 11.0, 9.0, 7.0, 4.0, 1.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1624755859375, -0.1577892303466797, -0.15310287475585938, -0.14841651916503906, -0.14373016357421875, -0.13904380798339844, -0.13435745239257812, -0.1296710968017578, -0.1249847412109375, -0.12029838562011719, -0.11561203002929688, -0.11092567443847656, -0.10623931884765625, -0.10155296325683594, -0.09686660766601562, -0.09218025207519531, -0.087493896484375, -0.08280754089355469, -0.07812118530273438, -0.07343482971191406, -0.06874847412109375, -0.06406211853027344, -0.059375762939453125, -0.05468940734863281, -0.0500030517578125, -0.04531669616699219, -0.040630340576171875, -0.03594398498535156, -0.03125762939453125, -0.026571273803710938, -0.021884918212890625, -0.017198562622070312, -0.01251220703125, -0.007825851440429688, -0.003139495849609375, 0.0015468597412109375, 0.00623321533203125, 0.010919570922851562, 0.015605926513671875, 0.020292282104492188, 0.0249786376953125, 0.029664993286132812, 0.034351348876953125, 0.03903770446777344, 0.04372406005859375, 0.04841041564941406, 0.053096771240234375, 0.05778312683105469, 0.062469482421875, 0.06715583801269531, 0.07184219360351562, 0.07652854919433594, 0.08121490478515625, 0.08590126037597656, 0.09058761596679688, 0.09527397155761719, 0.0999603271484375, 0.10464668273925781, 0.10933303833007812, 0.11401939392089844, 0.11870574951171875, 0.12339210510253906, 0.12807846069335938, 0.1327648162841797, 0.137451171875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 8.0, 5.0, 14.0, 9.0, 8.0, 25.0, 17.0, 39.0, 18.0, 39.0, 33.0, 50.0, 31.0, 43.0, 48.0, 55.0, 55.0, 60.0, 42.0, 46.0, 59.0, 35.0, 43.0, 40.0, 39.0, 21.0, 34.0, 24.0, 9.0, 10.0, 7.0, 11.0, 7.0, 7.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2349853515625, -0.22806930541992188, -0.22115325927734375, -0.21423721313476562, -0.2073211669921875, -0.20040512084960938, -0.19348907470703125, -0.18657302856445312, -0.179656982421875, -0.17274093627929688, -0.16582489013671875, -0.15890884399414062, -0.1519927978515625, -0.14507675170898438, -0.13816070556640625, -0.13124465942382812, -0.12432861328125, -0.11741256713867188, -0.11049652099609375, -0.10358047485351562, -0.0966644287109375, -0.08974838256835938, -0.08283233642578125, -0.07591629028320312, -0.069000244140625, -0.062084197998046875, -0.05516815185546875, -0.048252105712890625, -0.0413360595703125, -0.034420013427734375, -0.02750396728515625, -0.020587921142578125, -0.013671875, -0.006755828857421875, 0.00016021728515625, 0.007076263427734375, 0.0139923095703125, 0.020908355712890625, 0.02782440185546875, 0.034740447998046875, 0.041656494140625, 0.048572540283203125, 0.05548858642578125, 0.062404632568359375, 0.0693206787109375, 0.07623672485351562, 0.08315277099609375, 0.09006881713867188, 0.09698486328125, 0.10390090942382812, 0.11081695556640625, 0.11773300170898438, 0.1246490478515625, 0.13156509399414062, 0.13848114013671875, 0.14539718627929688, 0.152313232421875, 0.15922927856445312, 0.16614532470703125, 0.17306137084960938, 0.1799774169921875, 0.18689346313476562, 0.19380950927734375, 0.20072555541992188, 0.2076416015625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 2.0, 5.0, 8.0, 3.0, 12.0, 22.0, 32.0, 56.0, 91.0, 196.0, 445.0, 1383.0, 11594.0, 842199.0, 186035.0, 4843.0, 908.0, 334.0, 144.0, 64.0, 62.0, 41.0, 24.0, 19.0, 8.0, 7.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.2646484375, -0.25832176208496094, -0.2519950866699219, -0.2456684112548828, -0.23934173583984375, -0.2330150604248047, -0.22668838500976562, -0.22036170959472656, -0.2140350341796875, -0.20770835876464844, -0.20138168334960938, -0.1950550079345703, -0.18872833251953125, -0.1824016571044922, -0.17607498168945312, -0.16974830627441406, -0.163421630859375, -0.15709495544433594, -0.15076828002929688, -0.1444416046142578, -0.13811492919921875, -0.1317882537841797, -0.12546157836914062, -0.11913490295410156, -0.1128082275390625, -0.10648155212402344, -0.10015487670898438, -0.09382820129394531, -0.08750152587890625, -0.08117485046386719, -0.07484817504882812, -0.06852149963378906, -0.06219482421875, -0.05586814880371094, -0.049541473388671875, -0.04321479797363281, -0.03688812255859375, -0.030561447143554688, -0.024234771728515625, -0.017908096313476562, -0.0115814208984375, -0.0052547454833984375, 0.001071929931640625, 0.0073986053466796875, 0.01372528076171875, 0.020051956176757812, 0.026378631591796875, 0.03270530700683594, 0.039031982421875, 0.04535865783691406, 0.051685333251953125, 0.05801200866699219, 0.06433868408203125, 0.07066535949707031, 0.07699203491210938, 0.08331871032714844, 0.0896453857421875, 0.09597206115722656, 0.10229873657226562, 0.10862541198730469, 0.11495208740234375, 0.12127876281738281, 0.12760543823242188, 0.13393211364746094, 0.1402587890625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 5.0, 8.0, 7.0, 10.0, 10.0, 15.0, 11.0, 18.0, 18.0, 37.0, 42.0, 48.0, 46.0, 86.0, 71.0, 78.0, 80.0, 65.0, 71.0, 49.0, 49.0, 45.0, 25.0, 20.0, 23.0, 10.0, 11.0, 10.0, 8.0, 10.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1278858184814453e-05, -2.0585954189300537e-05, -1.989305019378662e-05, -1.9200146198272705e-05, -1.850724220275879e-05, -1.7814338207244873e-05, -1.7121434211730957e-05, -1.642853021621704e-05, -1.5735626220703125e-05, -1.5042722225189209e-05, -1.4349818229675293e-05, -1.3656914234161377e-05, -1.2964010238647461e-05, -1.2271106243133545e-05, -1.1578202247619629e-05, -1.0885298252105713e-05, -1.0192394256591797e-05, -9.499490261077881e-06, -8.806586265563965e-06, -8.113682270050049e-06, -7.420778274536133e-06, -6.727874279022217e-06, -6.034970283508301e-06, -5.342066287994385e-06, -4.649162292480469e-06, -3.956258296966553e-06, -3.2633543014526367e-06, -2.5704503059387207e-06, -1.8775463104248047e-06, -1.1846423149108887e-06, -4.917383193969727e-07, 2.0116567611694336e-07, 8.940696716308594e-07, 1.5869736671447754e-06, 2.2798776626586914e-06, 2.9727816581726074e-06, 3.6656856536865234e-06, 4.3585896492004395e-06, 5.0514936447143555e-06, 5.7443976402282715e-06, 6.4373016357421875e-06, 7.1302056312561035e-06, 7.82310962677002e-06, 8.516013622283936e-06, 9.208917617797852e-06, 9.901821613311768e-06, 1.0594725608825684e-05, 1.12876296043396e-05, 1.1980533599853516e-05, 1.2673437595367432e-05, 1.3366341590881348e-05, 1.4059245586395264e-05, 1.475214958190918e-05, 1.5445053577423096e-05, 1.6137957572937012e-05, 1.6830861568450928e-05, 1.7523765563964844e-05, 1.821666955947876e-05, 1.8909573554992676e-05, 1.9602477550506592e-05, 2.0295381546020508e-05, 2.0988285541534424e-05, 2.168118953704834e-05, 2.2374093532562256e-05, 2.3066997528076172e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 12.0, 15.0, 31.0, 56.0, 82.0, 159.0, 280.0, 585.0, 1422.0, 5051.0, 39584.0, 832005.0, 155469.0, 9882.0, 2254.0, 790.0, 395.0, 202.0, 106.0, 67.0, 28.0, 22.0, 15.0, 9.0, 6.0, 5.0, 8.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.174072265625, -0.16945552825927734, -0.1648387908935547, -0.16022205352783203, -0.15560531616210938, -0.15098857879638672, -0.14637184143066406, -0.1417551040649414, -0.13713836669921875, -0.1325216293334961, -0.12790489196777344, -0.12328815460205078, -0.11867141723632812, -0.11405467987060547, -0.10943794250488281, -0.10482120513916016, -0.1002044677734375, -0.09558773040771484, -0.09097099304199219, -0.08635425567626953, -0.08173751831054688, -0.07712078094482422, -0.07250404357910156, -0.0678873062133789, -0.06327056884765625, -0.058653831481933594, -0.05403709411621094, -0.04942035675048828, -0.044803619384765625, -0.04018688201904297, -0.03557014465332031, -0.030953407287597656, -0.026336669921875, -0.021719932556152344, -0.017103195190429688, -0.012486457824707031, -0.007869720458984375, -0.0032529830932617188, 0.0013637542724609375, 0.005980491638183594, 0.01059722900390625, 0.015213966369628906, 0.019830703735351562, 0.02444744110107422, 0.029064178466796875, 0.03368091583251953, 0.03829765319824219, 0.042914390563964844, 0.0475311279296875, 0.052147865295410156, 0.05676460266113281, 0.06138134002685547, 0.06599807739257812, 0.07061481475830078, 0.07523155212402344, 0.0798482894897461, 0.08446502685546875, 0.0890817642211914, 0.09369850158691406, 0.09831523895263672, 0.10293197631835938, 0.10754871368408203, 0.11216545104980469, 0.11678218841552734, 0.12139892578125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 8.0, 9.0, 12.0, 27.0, 49.0, 83.0, 122.0, 164.0, 161.0, 139.0, 85.0, 55.0, 36.0, 24.0, 7.0, 9.0, 7.0, 7.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1910400390625, -0.1868114471435547, -0.18258285522460938, -0.17835426330566406, -0.17412567138671875, -0.16989707946777344, -0.16566848754882812, -0.1614398956298828, -0.1572113037109375, -0.1529827117919922, -0.14875411987304688, -0.14452552795410156, -0.14029693603515625, -0.13606834411621094, -0.13183975219726562, -0.1276111602783203, -0.123382568359375, -0.11915397644042969, -0.11492538452148438, -0.11069679260253906, -0.10646820068359375, -0.10223960876464844, -0.09801101684570312, -0.09378242492675781, -0.0895538330078125, -0.08532524108886719, -0.08109664916992188, -0.07686805725097656, -0.07263946533203125, -0.06841087341308594, -0.06418228149414062, -0.05995368957519531, -0.05572509765625, -0.05149650573730469, -0.047267913818359375, -0.04303932189941406, -0.03881072998046875, -0.03458213806152344, -0.030353546142578125, -0.026124954223632812, -0.0218963623046875, -0.017667770385742188, -0.013439178466796875, -0.009210586547851562, -0.00498199462890625, -0.0007534027099609375, 0.003475189208984375, 0.0077037811279296875, 0.011932373046875, 0.016160964965820312, 0.020389556884765625, 0.024618148803710938, 0.02884674072265625, 0.03307533264160156, 0.037303924560546875, 0.04153251647949219, 0.0457611083984375, 0.04998970031738281, 0.054218292236328125, 0.05844688415527344, 0.06267547607421875, 0.06690406799316406, 0.07113265991210938, 0.07536125183105469, 0.07958984375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 9.0, 4.0, 33.0, 85.0, 234.0, 276.0, 200.0, 102.0, 32.0, 16.0, 9.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9702353477478027, -2.891038179397583, -2.8118410110473633, -2.7326440811157227, -2.653446912765503, -2.574249744415283, -2.4950528144836426, -2.415855646133423, -2.336658477783203, -2.2574613094329834, -2.1782641410827637, -2.099067211151123, -2.0198700428009033, -1.9406728744506836, -1.8614758253097534, -1.7822787761688232, -1.7030816078186035, -1.6238844394683838, -1.5446873903274536, -1.4654903411865234, -1.3862931728363037, -1.307096004486084, -1.2278989553451538, -1.1487019062042236, -1.069504737854004, -0.990307629108429, -0.911110520362854, -0.831913411617279, -0.7527163028717041, -0.6735191941261292, -0.5943220853805542, -0.5151249766349792, -0.4359278678894043, -0.35673075914382935, -0.2775336503982544, -0.19833654165267944, -0.11913943290710449, -0.03994232416152954, 0.03925478458404541, 0.11845189332962036, 0.1976490020751953, 0.27684611082077026, 0.3560432195663452, 0.43524032831192017, 0.5144374370574951, 0.5936345458030701, 0.672831654548645, 0.75202876329422, 0.8312258720397949, 0.9104229807853699, 0.9896200895309448, 1.068817138671875, 1.1480143070220947, 1.2272114753723145, 1.3064085245132446, 1.3856055736541748, 1.4648027420043945, 1.5439999103546143, 1.6231969594955444, 1.7023940086364746, 1.7815911769866943, 1.860788345336914, 1.9399853944778442, 2.0191824436187744, 2.098379611968994]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 4.0, 10.0, 16.0, 16.0, 23.0, 21.0, 18.0, 34.0, 42.0, 46.0, 53.0, 59.0, 69.0, 87.0, 74.0, 76.0, 66.0, 61.0, 36.0, 50.0, 29.0, 24.0, 23.0, 19.0, 14.0, 8.0, 9.0, 2.0, 6.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0803883075714111, -1.0384495258331299, -0.9965108036994934, -0.9545720815658569, -0.9126332998275757, -0.8706945180892944, -0.828755795955658, -0.7868170738220215, -0.7448782920837402, -0.702939510345459, -0.6610007882118225, -0.619062066078186, -0.5771232843399048, -0.5351845026016235, -0.49324578046798706, -0.4513070285320282, -0.40936827659606934, -0.3674295246601105, -0.3254907727241516, -0.28355202078819275, -0.2416132688522339, -0.19967451691627502, -0.15773576498031616, -0.1157970130443573, -0.07385826110839844, -0.031919509172439575, 0.010019242763519287, 0.05195799469947815, 0.09389674663543701, 0.13583549857139587, 0.17777425050735474, 0.2197130024433136, 0.26165175437927246, 0.3035905063152313, 0.3455292582511902, 0.38746801018714905, 0.4294067621231079, 0.4713455140590668, 0.5132842659950256, 0.5552229881286621, 0.5971617698669434, 0.6391005516052246, 0.6810392737388611, 0.7229779958724976, 0.7649167776107788, 0.8068555593490601, 0.8487942814826965, 0.890733003616333, 0.9326717853546143, 0.9746105670928955, 1.0165493488311768, 1.0584880113601685, 1.1004267930984497, 1.142365574836731, 1.1843042373657227, 1.226243019104004, 1.2681818008422852, 1.3101205825805664, 1.3520593643188477, 1.3939980268478394, 1.4359368085861206, 1.4778755903244019, 1.5198142528533936, 1.5617530345916748, 1.603691816329956]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 5.0, 10.0, 11.0, 13.0, 19.0, 21.0, 25.0, 51.0, 55.0, 86.0, 123.0, 173.0, 233.0, 335.0, 527.0, 991.0, 2199.0, 6888.0, 31969.0, 4041324.0, 90522.0, 11805.0, 3402.0, 1392.0, 698.0, 406.0, 281.0, 189.0, 144.0, 96.0, 66.0, 68.0, 48.0, 30.0, 20.0, 21.0, 10.0, 11.0, 2.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.22705078125, -0.2201080322265625, -0.213165283203125, -0.2062225341796875, -0.19927978515625, -0.1923370361328125, -0.185394287109375, -0.1784515380859375, -0.1715087890625, -0.1645660400390625, -0.157623291015625, -0.1506805419921875, -0.14373779296875, -0.1367950439453125, -0.129852294921875, -0.1229095458984375, -0.115966796875, -0.1090240478515625, -0.102081298828125, -0.0951385498046875, -0.08819580078125, -0.0812530517578125, -0.074310302734375, -0.0673675537109375, -0.0604248046875, -0.0534820556640625, -0.046539306640625, -0.0395965576171875, -0.03265380859375, -0.0257110595703125, -0.018768310546875, -0.0118255615234375, -0.0048828125, 0.0020599365234375, 0.009002685546875, 0.0159454345703125, 0.02288818359375, 0.0298309326171875, 0.036773681640625, 0.0437164306640625, 0.0506591796875, 0.0576019287109375, 0.064544677734375, 0.0714874267578125, 0.07843017578125, 0.0853729248046875, 0.092315673828125, 0.0992584228515625, 0.106201171875, 0.1131439208984375, 0.120086669921875, 0.1270294189453125, 0.13397216796875, 0.1409149169921875, 0.147857666015625, 0.1548004150390625, 0.1617431640625, 0.1686859130859375, 0.175628662109375, 0.1825714111328125, 0.18951416015625, 0.1964569091796875, 0.203399658203125, 0.2103424072265625, 0.21728515625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 7.0, 10.0, 12.0, 19.0, 26.0, 28.0, 50.0, 65.0, 77.0, 98.0, 99.0, 105.0, 118.0, 75.0, 57.0, 47.0, 41.0, 36.0, 17.0, 9.0, 3.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.087890625, -0.08505630493164062, -0.08222198486328125, -0.07938766479492188, -0.0765533447265625, -0.07371902465820312, -0.07088470458984375, -0.06805038452148438, -0.065216064453125, -0.062381744384765625, -0.05954742431640625, -0.056713104248046875, -0.0538787841796875, -0.051044464111328125, -0.04821014404296875, -0.045375823974609375, -0.04254150390625, -0.039707183837890625, -0.03687286376953125, -0.034038543701171875, -0.0312042236328125, -0.028369903564453125, -0.02553558349609375, -0.022701263427734375, -0.019866943359375, -0.017032623291015625, -0.01419830322265625, -0.011363983154296875, -0.0085296630859375, -0.005695343017578125, -0.00286102294921875, -2.6702880859375e-05, 0.0028076171875, 0.005641937255859375, 0.00847625732421875, 0.011310577392578125, 0.0141448974609375, 0.016979217529296875, 0.01981353759765625, 0.022647857666015625, 0.025482177734375, 0.028316497802734375, 0.03115081787109375, 0.033985137939453125, 0.0368194580078125, 0.039653778076171875, 0.04248809814453125, 0.045322418212890625, 0.04815673828125, 0.050991058349609375, 0.05382537841796875, 0.056659698486328125, 0.0594940185546875, 0.062328338623046875, 0.06516265869140625, 0.06799697875976562, 0.070831298828125, 0.07366561889648438, 0.07649993896484375, 0.07933425903320312, 0.0821685791015625, 0.08500289916992188, 0.08783721923828125, 0.09067153930664062, 0.093505859375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 2.0, 2.0, 4.0, 6.0, 11.0, 12.0, 17.0, 23.0, 23.0, 46.0, 47.0, 66.0, 102.0, 140.0, 211.0, 290.0, 456.0, 640.0, 1057.0, 1825.0, 3581.0, 8641.0, 31241.0, 3330202.0, 770759.0, 28403.0, 8147.0, 3509.0, 1794.0, 1019.0, 638.0, 414.0, 269.0, 189.0, 151.0, 99.0, 70.0, 53.0, 29.0, 23.0, 23.0, 15.0, 10.0, 9.0, 4.0, 1.0, 3.0, 5.0, 6.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.2103271484375, -0.20413589477539062, -0.19794464111328125, -0.19175338745117188, -0.1855621337890625, -0.17937088012695312, -0.17317962646484375, -0.16698837280273438, -0.160797119140625, -0.15460586547851562, -0.14841461181640625, -0.14222335815429688, -0.1360321044921875, -0.12984085083007812, -0.12364959716796875, -0.11745834350585938, -0.11126708984375, -0.10507583618164062, -0.09888458251953125, -0.09269332885742188, -0.0865020751953125, -0.08031082153320312, -0.07411956787109375, -0.06792831420898438, -0.061737060546875, -0.055545806884765625, -0.04935455322265625, -0.043163299560546875, -0.0369720458984375, -0.030780792236328125, -0.02458953857421875, -0.018398284912109375, -0.01220703125, -0.006015777587890625, 0.00017547607421875, 0.006366729736328125, 0.0125579833984375, 0.018749237060546875, 0.02494049072265625, 0.031131744384765625, 0.037322998046875, 0.043514251708984375, 0.04970550537109375, 0.055896759033203125, 0.0620880126953125, 0.06827926635742188, 0.07447052001953125, 0.08066177368164062, 0.08685302734375, 0.09304428100585938, 0.09923553466796875, 0.10542678833007812, 0.1116180419921875, 0.11780929565429688, 0.12400054931640625, 0.13019180297851562, 0.136383056640625, 0.14257431030273438, 0.14876556396484375, 0.15495681762695312, 0.1611480712890625, 0.16733932495117188, 0.17353057861328125, 0.17972183227539062, 0.1859130859375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 5.0, 6.0, 8.0, 11.0, 14.0, 28.0, 36.0, 109.0, 728.0, 2829.0, 161.0, 48.0, 37.0, 13.0, 5.0, 8.0, 10.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09521484375, -0.09224796295166016, -0.08928108215332031, -0.08631420135498047, -0.08334732055664062, -0.08038043975830078, -0.07741355895996094, -0.0744466781616211, -0.07147979736328125, -0.0685129165649414, -0.06554603576660156, -0.06257915496826172, -0.059612274169921875, -0.05664539337158203, -0.05367851257324219, -0.050711631774902344, -0.0477447509765625, -0.044777870178222656, -0.04181098937988281, -0.03884410858154297, -0.035877227783203125, -0.03291034698486328, -0.029943466186523438, -0.026976585388183594, -0.02400970458984375, -0.021042823791503906, -0.018075942993164062, -0.015109062194824219, -0.012142181396484375, -0.009175300598144531, -0.0062084197998046875, -0.0032415390014648438, -0.000274658203125, 0.0026922225952148438, 0.0056591033935546875, 0.008625984191894531, 0.011592864990234375, 0.014559745788574219, 0.017526626586914062, 0.020493507385253906, 0.02346038818359375, 0.026427268981933594, 0.029394149780273438, 0.03236103057861328, 0.035327911376953125, 0.03829479217529297, 0.04126167297363281, 0.044228553771972656, 0.0471954345703125, 0.050162315368652344, 0.05312919616699219, 0.05609607696533203, 0.059062957763671875, 0.06202983856201172, 0.06499671936035156, 0.0679636001586914, 0.07093048095703125, 0.0738973617553711, 0.07686424255371094, 0.07983112335205078, 0.08279800415039062, 0.08576488494873047, 0.08873176574707031, 0.09169864654541016, 0.09466552734375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 2.0, 2.0, 8.0, 16.0, 14.0, 10.0, 15.0, 29.0, 35.0, 42.0, 61.0, 92.0, 98.0, 100.0, 102.0, 82.0, 84.0, 62.0, 38.0, 39.0, 25.0, 11.0, 10.0, 6.0, 8.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3083820044994354, -0.29975780844688416, -0.2911336123943329, -0.2825094163417816, -0.27388522028923035, -0.2652610242366791, -0.2566368281841278, -0.24801264703273773, -0.23938845098018646, -0.2307642549276352, -0.22214005887508392, -0.21351586282253265, -0.20489168167114258, -0.1962674856185913, -0.18764328956604004, -0.17901909351348877, -0.1703948974609375, -0.16177070140838623, -0.15314650535583496, -0.1445223093032837, -0.13589811325073242, -0.12727391719818115, -0.11864973604679108, -0.11002553999423981, -0.10140134394168854, -0.09277714788913727, -0.084152951836586, -0.07552876323461533, -0.06690456718206406, -0.05828037112951279, -0.049656178802251816, -0.041031986474990845, -0.03240780532360077, -0.02378361113369465, -0.015159416943788528, -0.006535222753882408, 0.002088971436023712, 0.010713167488574982, 0.019337359815835953, 0.027961552143096924, 0.03658574819564819, 0.04520994424819946, 0.053834136575460434, 0.062458328902721405, 0.07108252495527267, 0.07970672100782394, 0.08833090960979462, 0.09695510566234589, 0.10557930171489716, 0.11420349776744843, 0.1228276938199997, 0.13145188987255096, 0.14007607102394104, 0.1487002670764923, 0.15732446312904358, 0.16594865918159485, 0.17457285523414612, 0.1831970512866974, 0.19182124733924866, 0.20044544339179993, 0.2090696394443512, 0.21769383549690247, 0.22631801664829254, 0.2349422127008438, 0.24356640875339508]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 10.0, 3.0, 6.0, 18.0, 14.0, 14.0, 20.0, 18.0, 28.0, 30.0, 37.0, 28.0, 33.0, 51.0, 43.0, 50.0, 36.0, 49.0, 34.0, 52.0, 41.0, 53.0, 46.0, 31.0, 47.0, 36.0, 22.0, 26.0, 25.0, 21.0, 10.0, 19.0, 12.0, 12.0, 3.0, 6.0, 6.0, 2.0, 4.0, 0.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.18508309125900269, -0.17879697680473328, -0.17251084744930267, -0.16622473299503326, -0.15993860363960266, -0.15365248918533325, -0.14736637473106384, -0.14108026027679443, -0.13479413092136383, -0.12850801646709442, -0.12222188711166382, -0.11593577265739441, -0.1096496507525444, -0.1033635288476944, -0.09707741439342499, -0.09079129248857498, -0.08450517058372498, -0.07821904867887497, -0.07193292677402496, -0.06564681231975555, -0.05936069041490555, -0.05307456851005554, -0.046788450330495834, -0.04050233215093613, -0.03421621024608612, -0.027930090203881264, -0.021643970161676407, -0.01535785011947155, -0.009071730077266693, -0.002785608172416687, 0.0035005100071430206, 0.009786628186702728, 0.016072750091552734, 0.02235887013375759, 0.028644990175962448, 0.034931108355522156, 0.04121723026037216, 0.04750335216522217, 0.053789470344781876, 0.06007558852434158, 0.06636171042919159, 0.0726478323340416, 0.0789339542388916, 0.08522006869316101, 0.09150619059801102, 0.09779231250286102, 0.10407842695713043, 0.11036454886198044, 0.11665067076683044, 0.12293679267168045, 0.12922291457653046, 0.13550902903079987, 0.14179515838623047, 0.14808127284049988, 0.1543673872947693, 0.1606535017490387, 0.1669396311044693, 0.1732257455587387, 0.1795118749141693, 0.18579798936843872, 0.19208410382270813, 0.19837023317813873, 0.20465634763240814, 0.21094247698783875, 0.21722859144210815]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 8.0, 10.0, 29.0, 39.0, 41.0, 89.0, 154.0, 230.0, 458.0, 851.0, 1650.0, 3693.0, 10066.0, 32596.0, 131757.0, 509375.0, 269181.0, 60745.0, 16936.0, 5818.0, 2379.0, 1099.0, 585.0, 309.0, 182.0, 101.0, 64.0, 42.0, 24.0, 10.0, 14.0, 7.0, 3.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1624755859375, -0.1570110321044922, -0.15154647827148438, -0.14608192443847656, -0.14061737060546875, -0.13515281677246094, -0.12968826293945312, -0.12422370910644531, -0.1187591552734375, -0.11329460144042969, -0.10783004760742188, -0.10236549377441406, -0.09690093994140625, -0.09143638610839844, -0.08597183227539062, -0.08050727844238281, -0.075042724609375, -0.06957817077636719, -0.06411361694335938, -0.05864906311035156, -0.05318450927734375, -0.04771995544433594, -0.042255401611328125, -0.03679084777832031, -0.0313262939453125, -0.025861740112304688, -0.020397186279296875, -0.014932632446289062, -0.00946807861328125, -0.0040035247802734375, 0.001461029052734375, 0.0069255828857421875, 0.01239013671875, 0.017854690551757812, 0.023319244384765625, 0.028783798217773438, 0.03424835205078125, 0.03971290588378906, 0.045177459716796875, 0.05064201354980469, 0.0561065673828125, 0.06157112121582031, 0.06703567504882812, 0.07250022888183594, 0.07796478271484375, 0.08342933654785156, 0.08889389038085938, 0.09435844421386719, 0.099822998046875, 0.10528755187988281, 0.11075210571289062, 0.11621665954589844, 0.12168121337890625, 0.12714576721191406, 0.13261032104492188, 0.1380748748779297, 0.1435394287109375, 0.1490039825439453, 0.15446853637695312, 0.15993309020996094, 0.16539764404296875, 0.17086219787597656, 0.17632675170898438, 0.1817913055419922, 0.187255859375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 8.0, 10.0, 21.0, 23.0, 29.0, 49.0, 56.0, 81.0, 85.0, 103.0, 85.0, 107.0, 94.0, 80.0, 50.0, 42.0, 25.0, 18.0, 18.0, 11.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10992431640625, -0.1069021224975586, -0.10387992858886719, -0.10085773468017578, -0.09783554077148438, -0.09481334686279297, -0.09179115295410156, -0.08876895904541016, -0.08574676513671875, -0.08272457122802734, -0.07970237731933594, -0.07668018341064453, -0.07365798950195312, -0.07063579559326172, -0.06761360168457031, -0.0645914077758789, -0.0615692138671875, -0.058547019958496094, -0.05552482604980469, -0.05250263214111328, -0.049480438232421875, -0.04645824432373047, -0.04343605041503906, -0.040413856506347656, -0.03739166259765625, -0.034369468688964844, -0.03134727478027344, -0.02832508087158203, -0.025302886962890625, -0.02228069305419922, -0.019258499145507812, -0.016236305236816406, -0.013214111328125, -0.010191917419433594, -0.0071697235107421875, -0.004147529602050781, -0.001125335693359375, 0.0018968582153320312, 0.0049190521240234375, 0.007941246032714844, 0.01096343994140625, 0.013985633850097656, 0.017007827758789062, 0.02003002166748047, 0.023052215576171875, 0.02607440948486328, 0.029096603393554688, 0.032118797302246094, 0.0351409912109375, 0.038163185119628906, 0.04118537902832031, 0.04420757293701172, 0.047229766845703125, 0.05025196075439453, 0.05327415466308594, 0.056296348571777344, 0.05931854248046875, 0.062340736389160156, 0.06536293029785156, 0.06838512420654297, 0.07140731811523438, 0.07442951202392578, 0.07745170593261719, 0.0804738998413086, 0.08349609375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 7.0, 4.0, 6.0, 10.0, 8.0, 13.0, 12.0, 23.0, 45.0, 49.0, 60.0, 78.0, 99.0, 168.0, 234.0, 323.0, 492.0, 843.0, 1583.0, 3161.0, 7710.0, 24385.0, 120487.0, 620478.0, 211181.0, 37533.0, 10607.0, 4096.0, 1963.0, 1004.0, 614.0, 363.0, 288.0, 164.0, 117.0, 90.0, 73.0, 53.0, 33.0, 27.0, 25.0, 11.0, 11.0, 10.0, 4.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.16943359375, -0.164398193359375, -0.15936279296875, -0.154327392578125, -0.1492919921875, -0.144256591796875, -0.13922119140625, -0.134185791015625, -0.129150390625, -0.124114990234375, -0.11907958984375, -0.114044189453125, -0.1090087890625, -0.103973388671875, -0.09893798828125, -0.093902587890625, -0.0888671875, -0.083831787109375, -0.07879638671875, -0.073760986328125, -0.0687255859375, -0.063690185546875, -0.05865478515625, -0.053619384765625, -0.048583984375, -0.043548583984375, -0.03851318359375, -0.033477783203125, -0.0284423828125, -0.023406982421875, -0.01837158203125, -0.013336181640625, -0.00830078125, -0.003265380859375, 0.00177001953125, 0.006805419921875, 0.0118408203125, 0.016876220703125, 0.02191162109375, 0.026947021484375, 0.031982421875, 0.037017822265625, 0.04205322265625, 0.047088623046875, 0.0521240234375, 0.057159423828125, 0.06219482421875, 0.067230224609375, 0.072265625, 0.077301025390625, 0.08233642578125, 0.087371826171875, 0.0924072265625, 0.097442626953125, 0.10247802734375, 0.107513427734375, 0.112548828125, 0.117584228515625, 0.12261962890625, 0.127655029296875, 0.1326904296875, 0.137725830078125, 0.14276123046875, 0.147796630859375, 0.15283203125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 7.0, 3.0, 7.0, 5.0, 5.0, 16.0, 13.0, 13.0, 16.0, 26.0, 32.0, 21.0, 29.0, 44.0, 36.0, 31.0, 40.0, 34.0, 33.0, 44.0, 39.0, 40.0, 29.0, 38.0, 38.0, 37.0, 31.0, 32.0, 35.0, 34.0, 19.0, 24.0, 22.0, 21.0, 13.0, 15.0, 16.0, 17.0, 7.0, 5.0, 7.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.1904296875, -0.1849346160888672, -0.17943954467773438, -0.17394447326660156, -0.16844940185546875, -0.16295433044433594, -0.15745925903320312, -0.1519641876220703, -0.1464691162109375, -0.1409740447998047, -0.13547897338867188, -0.12998390197753906, -0.12448883056640625, -0.11899375915527344, -0.11349868774414062, -0.10800361633300781, -0.102508544921875, -0.09701347351074219, -0.09151840209960938, -0.08602333068847656, -0.08052825927734375, -0.07503318786621094, -0.06953811645507812, -0.06404304504394531, -0.0585479736328125, -0.05305290222167969, -0.047557830810546875, -0.04206275939941406, -0.03656768798828125, -0.031072616577148438, -0.025577545166015625, -0.020082473754882812, -0.01458740234375, -0.009092330932617188, -0.003597259521484375, 0.0018978118896484375, 0.00739288330078125, 0.012887954711914062, 0.018383026123046875, 0.023878097534179688, 0.0293731689453125, 0.03486824035644531, 0.040363311767578125, 0.04585838317871094, 0.05135345458984375, 0.05684852600097656, 0.062343597412109375, 0.06783866882324219, 0.073333740234375, 0.07882881164550781, 0.08432388305664062, 0.08981895446777344, 0.09531402587890625, 0.10080909729003906, 0.10630416870117188, 0.11179924011230469, 0.1172943115234375, 0.12278938293457031, 0.12828445434570312, 0.13377952575683594, 0.13927459716796875, 0.14476966857910156, 0.15026473999023438, 0.1557598114013672, 0.1612548828125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 4.0, 6.0, 6.0, 5.0, 4.0, 6.0, 5.0, 11.0, 12.0, 27.0, 31.0, 34.0, 64.0, 115.0, 154.0, 230.0, 349.0, 626.0, 1251.0, 2620.0, 6578.0, 22242.0, 148853.0, 698580.0, 134285.0, 20900.0, 6173.0, 2480.0, 1218.0, 634.0, 377.0, 241.0, 130.0, 99.0, 57.0, 48.0, 26.0, 19.0, 18.0, 9.0, 7.0, 5.0, 7.0, 3.0, 2.0, 4.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06658935546875, -0.06440448760986328, -0.06221961975097656, -0.060034751892089844, -0.057849884033203125, -0.055665016174316406, -0.05348014831542969, -0.05129528045654297, -0.04911041259765625, -0.04692554473876953, -0.04474067687988281, -0.042555809020996094, -0.040370941162109375, -0.038186073303222656, -0.03600120544433594, -0.03381633758544922, -0.0316314697265625, -0.02944660186767578, -0.027261734008789062, -0.025076866149902344, -0.022891998291015625, -0.020707130432128906, -0.018522262573242188, -0.01633739471435547, -0.01415252685546875, -0.011967658996582031, -0.009782791137695312, -0.007597923278808594, -0.005413055419921875, -0.0032281875610351562, -0.0010433197021484375, 0.0011415481567382812, 0.003326416015625, 0.005511283874511719, 0.0076961517333984375, 0.009881019592285156, 0.012065887451171875, 0.014250755310058594, 0.016435623168945312, 0.01862049102783203, 0.02080535888671875, 0.02299022674560547, 0.025175094604492188, 0.027359962463378906, 0.029544830322265625, 0.031729698181152344, 0.03391456604003906, 0.03609943389892578, 0.0382843017578125, 0.04046916961669922, 0.04265403747558594, 0.044838905334472656, 0.047023773193359375, 0.049208641052246094, 0.05139350891113281, 0.05357837677001953, 0.05576324462890625, 0.05794811248779297, 0.06013298034667969, 0.062317848205566406, 0.06450271606445312, 0.06668758392333984, 0.06887245178222656, 0.07105731964111328, 0.0732421875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 7.0, 10.0, 10.0, 15.0, 19.0, 45.0, 42.0, 57.0, 66.0, 100.0, 162.0, 122.0, 95.0, 73.0, 61.0, 24.0, 31.0, 15.0, 12.0, 12.0, 10.0, 5.0, 5.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.500150680541992e-05, -4.3623149394989014e-05, -4.2244791984558105e-05, -4.08664345741272e-05, -3.948807716369629e-05, -3.810971975326538e-05, -3.673136234283447e-05, -3.5353004932403564e-05, -3.3974647521972656e-05, -3.259629011154175e-05, -3.121793270111084e-05, -2.983957529067993e-05, -2.8461217880249023e-05, -2.7082860469818115e-05, -2.5704503059387207e-05, -2.43261456489563e-05, -2.294778823852539e-05, -2.1569430828094482e-05, -2.0191073417663574e-05, -1.8812716007232666e-05, -1.7434358596801758e-05, -1.605600118637085e-05, -1.4677643775939941e-05, -1.3299286365509033e-05, -1.1920928955078125e-05, -1.0542571544647217e-05, -9.164214134216309e-06, -7.7858567237854e-06, -6.407499313354492e-06, -5.029141902923584e-06, -3.6507844924926758e-06, -2.2724270820617676e-06, -8.940696716308594e-07, 4.842877388000488e-07, 1.862645149230957e-06, 3.2410025596618652e-06, 4.6193599700927734e-06, 5.997717380523682e-06, 7.37607479095459e-06, 8.754432201385498e-06, 1.0132789611816406e-05, 1.1511147022247314e-05, 1.2889504432678223e-05, 1.4267861843109131e-05, 1.564621925354004e-05, 1.7024576663970947e-05, 1.8402934074401855e-05, 1.9781291484832764e-05, 2.1159648895263672e-05, 2.253800630569458e-05, 2.3916363716125488e-05, 2.5294721126556396e-05, 2.6673078536987305e-05, 2.8051435947418213e-05, 2.942979335784912e-05, 3.080815076828003e-05, 3.218650817871094e-05, 3.3564865589141846e-05, 3.4943222999572754e-05, 3.632158041000366e-05, 3.769993782043457e-05, 3.907829523086548e-05, 4.045665264129639e-05, 4.1835010051727295e-05, 4.32133674621582e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 6.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 4.0, 10.0, 13.0, 19.0, 46.0, 62.0, 128.0, 225.0, 495.0, 1216.0, 4059.0, 21049.0, 417327.0, 571089.0, 25811.0, 4508.0, 1387.0, 516.0, 247.0, 132.0, 69.0, 57.0, 26.0, 13.0, 12.0, 7.0, 10.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08404541015625, -0.0805501937866211, -0.07705497741699219, -0.07355976104736328, -0.07006454467773438, -0.06656932830810547, -0.06307411193847656, -0.059578895568847656, -0.05608367919921875, -0.052588462829589844, -0.04909324645996094, -0.04559803009033203, -0.042102813720703125, -0.03860759735107422, -0.03511238098144531, -0.031617164611816406, -0.0281219482421875, -0.024626731872558594, -0.021131515502929688, -0.01763629913330078, -0.014141082763671875, -0.010645866394042969, -0.0071506500244140625, -0.0036554336547851562, -0.00016021728515625, 0.0033349990844726562, 0.0068302154541015625, 0.010325431823730469, 0.013820648193359375, 0.01731586456298828, 0.020811080932617188, 0.024306297302246094, 0.027801513671875, 0.031296730041503906, 0.03479194641113281, 0.03828716278076172, 0.041782379150390625, 0.04527759552001953, 0.04877281188964844, 0.052268028259277344, 0.05576324462890625, 0.059258460998535156, 0.06275367736816406, 0.06624889373779297, 0.06974411010742188, 0.07323932647705078, 0.07673454284667969, 0.0802297592163086, 0.0837249755859375, 0.0872201919555664, 0.09071540832519531, 0.09421062469482422, 0.09770584106445312, 0.10120105743408203, 0.10469627380371094, 0.10819149017333984, 0.11168670654296875, 0.11518192291259766, 0.11867713928222656, 0.12217235565185547, 0.12566757202148438, 0.12916278839111328, 0.1326580047607422, 0.1361532211303711, 0.1396484375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 3.0, 6.0, 14.0, 15.0, 22.0, 34.0, 50.0, 70.0, 95.0, 123.0, 125.0, 110.0, 78.0, 76.0, 43.0, 38.0, 23.0, 17.0, 16.0, 8.0, 4.0, 5.0, 5.0, 9.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08782958984375, -0.0852804183959961, -0.08273124694824219, -0.08018207550048828, -0.07763290405273438, -0.07508373260498047, -0.07253456115722656, -0.06998538970947266, -0.06743621826171875, -0.06488704681396484, -0.06233787536621094, -0.05978870391845703, -0.057239532470703125, -0.05469036102294922, -0.05214118957519531, -0.049592018127441406, -0.0470428466796875, -0.044493675231933594, -0.04194450378417969, -0.03939533233642578, -0.036846160888671875, -0.03429698944091797, -0.03174781799316406, -0.029198646545410156, -0.02664947509765625, -0.024100303649902344, -0.021551132202148438, -0.01900196075439453, -0.016452789306640625, -0.013903617858886719, -0.011354446411132812, -0.008805274963378906, -0.006256103515625, -0.0037069320678710938, -0.0011577606201171875, 0.0013914108276367188, 0.003940582275390625, 0.006489753723144531, 0.009038925170898438, 0.011588096618652344, 0.01413726806640625, 0.016686439514160156, 0.019235610961914062, 0.02178478240966797, 0.024333953857421875, 0.02688312530517578, 0.029432296752929688, 0.031981468200683594, 0.0345306396484375, 0.037079811096191406, 0.03962898254394531, 0.04217815399169922, 0.044727325439453125, 0.04727649688720703, 0.04982566833496094, 0.052374839782714844, 0.05492401123046875, 0.057473182678222656, 0.06002235412597656, 0.06257152557373047, 0.06512069702148438, 0.06766986846923828, 0.07021903991699219, 0.0727682113647461, 0.0753173828125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 8.0, 6.0, 31.0, 38.0, 109.0, 185.0, 242.0, 197.0, 113.0, 45.0, 20.0, 4.0, 1.0, 6.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.017937660217285, -2.946852922439575, -2.8757681846618652, -2.8046836853027344, -2.7335989475250244, -2.6625142097473145, -2.5914294719696045, -2.5203447341918945, -2.4492602348327637, -2.3781754970550537, -2.3070907592773438, -2.236006259918213, -2.164921522140503, -2.093836784362793, -2.022752046585083, -1.9516674280166626, -1.8805826902389526, -1.8094979524612427, -1.7384133338928223, -1.6673285961151123, -1.596243977546692, -1.525159239768982, -1.4540746212005615, -1.3829898834228516, -1.3119051456451416, -1.2408204078674316, -1.1697357892990112, -1.0986510515213013, -1.0275664329528809, -0.9564816951751709, -0.8853970170021057, -0.8143123388290405, -0.7432276010513306, -0.6721429228782654, -0.6010582447052002, -0.5299735069274902, -0.45888885855674744, -0.38780418038368225, -0.3167194724082947, -0.2456347942352295, -0.1745501160621643, -0.10346543043851852, -0.03238074481487274, 0.03870394825935364, 0.10978862643241882, 0.180873304605484, 0.2519580125808716, 0.32304269075393677, 0.39412736892700195, 0.46521204710006714, 0.5362967252731323, 0.6073814630508423, 0.6784660816192627, 0.7495508193969727, 0.8206354975700378, 0.891720175743103, 0.9628048539161682, 1.0338895320892334, 1.1049742698669434, 1.1760588884353638, 1.2471436262130737, 1.3182282447814941, 1.389312982559204, 1.460397720336914, 1.5314823389053345]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 3.0, 3.0, 1.0, 6.0, 3.0, 9.0, 5.0, 11.0, 6.0, 14.0, 13.0, 15.0, 21.0, 34.0, 34.0, 27.0, 23.0, 39.0, 50.0, 39.0, 53.0, 48.0, 60.0, 67.0, 37.0, 58.0, 48.0, 41.0, 28.0, 34.0, 27.0, 33.0, 17.0, 13.0, 25.0, 11.0, 16.0, 5.0, 5.0, 7.0, 7.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9634849429130554, -0.9339351654052734, -0.9043853282928467, -0.8748355507850647, -0.8452857732772827, -0.815735936164856, -0.786186158657074, -0.756636381149292, -0.72708660364151, -0.697536826133728, -0.6679869890213013, -0.6384372115135193, -0.6088874340057373, -0.5793375968933105, -0.5497878193855286, -0.5202380418777466, -0.4906882345676422, -0.46113842725753784, -0.43158864974975586, -0.4020388424396515, -0.3724890649318695, -0.34293925762176514, -0.31338948011398315, -0.2838396728038788, -0.2542898654937744, -0.22474007308483124, -0.19519028067588806, -0.1656404733657837, -0.1360906958580017, -0.10654088854789734, -0.07699109613895416, -0.047441303730010986, -0.017891526222229004, 0.011658268049359322, 0.04120806232094765, 0.07075785845518112, 0.1003076508641243, 0.12985745072364807, 0.15940724313259125, 0.18895703554153442, 0.2185068279504776, 0.24805662035942078, 0.27760642766952515, 0.30715620517730713, 0.3367060124874115, 0.36625581979751587, 0.39580559730529785, 0.42535537481307983, 0.4549051821231842, 0.4844549894332886, 0.5140047669410706, 0.5435545444488525, 0.5731043815612793, 0.6026541590690613, 0.6322039365768433, 0.66175377368927, 0.691303551197052, 0.720853328704834, 0.7504031658172607, 0.7799529433250427, 0.8095027208328247, 0.8390525579452515, 0.8686023354530334, 0.8981521129608154, 0.9277018904685974]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 6.0, 2.0, 5.0, 9.0, 11.0, 13.0, 26.0, 25.0, 36.0, 49.0, 67.0, 92.0, 113.0, 150.0, 273.0, 346.0, 499.0, 781.0, 1244.0, 2184.0, 3952.0, 7744.0, 16949.0, 46525.0, 209098.0, 2639896.0, 1088449.0, 116696.0, 31916.0, 12832.0, 6083.0, 3243.0, 1764.0, 1113.0, 665.0, 446.0, 275.0, 187.0, 149.0, 84.0, 86.0, 46.0, 42.0, 22.0, 27.0, 18.0, 15.0, 12.0, 4.0, 7.0, 4.0, 2.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08306884765625, -0.08018779754638672, -0.07730674743652344, -0.07442569732666016, -0.07154464721679688, -0.0686635971069336, -0.06578254699707031, -0.06290149688720703, -0.06002044677734375, -0.05713939666748047, -0.05425834655761719, -0.051377296447753906, -0.048496246337890625, -0.045615196228027344, -0.04273414611816406, -0.03985309600830078, -0.0369720458984375, -0.03409099578857422, -0.031209945678710938, -0.028328895568847656, -0.025447845458984375, -0.022566795349121094, -0.019685745239257812, -0.01680469512939453, -0.01392364501953125, -0.011042594909667969, -0.008161544799804688, -0.005280494689941406, -0.002399444580078125, 0.00048160552978515625, 0.0033626556396484375, 0.006243705749511719, 0.009124755859375, 0.012005805969238281, 0.014886856079101562, 0.017767906188964844, 0.020648956298828125, 0.023530006408691406, 0.026411056518554688, 0.02929210662841797, 0.03217315673828125, 0.03505420684814453, 0.03793525695800781, 0.040816307067871094, 0.043697357177734375, 0.046578407287597656, 0.04945945739746094, 0.05234050750732422, 0.0552215576171875, 0.05810260772705078, 0.06098365783691406, 0.06386470794677734, 0.06674575805664062, 0.0696268081665039, 0.07250785827636719, 0.07538890838623047, 0.07826995849609375, 0.08115100860595703, 0.08403205871582031, 0.0869131088256836, 0.08979415893554688, 0.09267520904541016, 0.09555625915527344, 0.09843730926513672, 0.101318359375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 1.0, 4.0, 3.0, 3.0, 6.0, 8.0, 7.0, 12.0, 8.0, 12.0, 9.0, 14.0, 19.0, 25.0, 17.0, 26.0, 22.0, 22.0, 25.0, 32.0, 31.0, 28.0, 38.0, 39.0, 36.0, 35.0, 51.0, 20.0, 44.0, 43.0, 33.0, 42.0, 40.0, 22.0, 28.0, 20.0, 30.0, 23.0, 18.0, 15.0, 17.0, 15.0, 11.0, 12.0, 9.0, 10.0, 4.0, 3.0, 4.0, 4.0, 5.0, 2.0, 1.0, 3.0], "bins": [-0.03936767578125, -0.03827214241027832, -0.03717660903930664, -0.03608107566833496, -0.03498554229736328, -0.0338900089263916, -0.03279447555541992, -0.03169894218444824, -0.030603408813476562, -0.029507875442504883, -0.028412342071533203, -0.027316808700561523, -0.026221275329589844, -0.025125741958618164, -0.024030208587646484, -0.022934675216674805, -0.021839141845703125, -0.020743608474731445, -0.019648075103759766, -0.018552541732788086, -0.017457008361816406, -0.016361474990844727, -0.015265941619873047, -0.014170408248901367, -0.013074874877929688, -0.011979341506958008, -0.010883808135986328, -0.009788274765014648, -0.008692741394042969, -0.007597208023071289, -0.006501674652099609, -0.00540614128112793, -0.00431060791015625, -0.0032150745391845703, -0.0021195411682128906, -0.001024007797241211, 7.152557373046875e-05, 0.0011670589447021484, 0.002262592315673828, 0.003358125686645508, 0.0044536590576171875, 0.005549192428588867, 0.006644725799560547, 0.0077402591705322266, 0.008835792541503906, 0.009931325912475586, 0.011026859283447266, 0.012122392654418945, 0.013217926025390625, 0.014313459396362305, 0.015408992767333984, 0.016504526138305664, 0.017600059509277344, 0.018695592880249023, 0.019791126251220703, 0.020886659622192383, 0.021982192993164062, 0.023077726364135742, 0.024173259735107422, 0.0252687931060791, 0.02636432647705078, 0.02745985984802246, 0.02855539321899414, 0.02965092658996582, 0.0307464599609375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 16.0, 19.0, 20.0, 35.0, 59.0, 94.0, 128.0, 223.0, 410.0, 770.0, 1651.0, 3865.0, 11646.0, 47609.0, 518028.0, 3424480.0, 147959.0, 24850.0, 7170.0, 2714.0, 1160.0, 556.0, 330.0, 169.0, 117.0, 73.0, 36.0, 20.0, 18.0, 14.0, 15.0, 2.0, 10.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.156494140625, -0.15132713317871094, -0.14616012573242188, -0.1409931182861328, -0.13582611083984375, -0.1306591033935547, -0.12549209594726562, -0.12032508850097656, -0.1151580810546875, -0.10999107360839844, -0.10482406616210938, -0.09965705871582031, -0.09449005126953125, -0.08932304382324219, -0.08415603637695312, -0.07898902893066406, -0.073822021484375, -0.06865501403808594, -0.06348800659179688, -0.05832099914550781, -0.05315399169921875, -0.04798698425292969, -0.042819976806640625, -0.03765296936035156, -0.0324859619140625, -0.027318954467773438, -0.022151947021484375, -0.016984939575195312, -0.01181793212890625, -0.0066509246826171875, -0.001483917236328125, 0.0036830902099609375, 0.00885009765625, 0.014017105102539062, 0.019184112548828125, 0.024351119995117188, 0.02951812744140625, 0.03468513488769531, 0.039852142333984375, 0.04501914978027344, 0.0501861572265625, 0.05535316467285156, 0.060520172119140625, 0.06568717956542969, 0.07085418701171875, 0.07602119445800781, 0.08118820190429688, 0.08635520935058594, 0.091522216796875, 0.09668922424316406, 0.10185623168945312, 0.10702323913574219, 0.11219024658203125, 0.11735725402832031, 0.12252426147460938, 0.12769126892089844, 0.1328582763671875, 0.13802528381347656, 0.14319229125976562, 0.1483592987060547, 0.15352630615234375, 0.1586933135986328, 0.16386032104492188, 0.16902732849121094, 0.1741943359375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 13.0, 12.0, 17.0, 10.0, 18.0, 40.0, 65.0, 113.0, 186.0, 323.0, 756.0, 1196.0, 599.0, 287.0, 144.0, 82.0, 54.0, 41.0, 25.0, 20.0, 13.0, 14.0, 11.0, 3.0, 6.0, 2.0, 2.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1390380859375, -0.1339569091796875, -0.128875732421875, -0.1237945556640625, -0.11871337890625, -0.1136322021484375, -0.108551025390625, -0.1034698486328125, -0.098388671875, -0.0933074951171875, -0.088226318359375, -0.0831451416015625, -0.07806396484375, -0.0729827880859375, -0.067901611328125, -0.0628204345703125, -0.0577392578125, -0.0526580810546875, -0.047576904296875, -0.0424957275390625, -0.03741455078125, -0.0323333740234375, -0.027252197265625, -0.0221710205078125, -0.01708984375, -0.0120086669921875, -0.006927490234375, -0.0018463134765625, 0.00323486328125, 0.0083160400390625, 0.013397216796875, 0.0184783935546875, 0.0235595703125, 0.0286407470703125, 0.033721923828125, 0.0388031005859375, 0.04388427734375, 0.0489654541015625, 0.054046630859375, 0.0591278076171875, 0.064208984375, 0.0692901611328125, 0.074371337890625, 0.0794525146484375, 0.08453369140625, 0.0896148681640625, 0.094696044921875, 0.0997772216796875, 0.1048583984375, 0.1099395751953125, 0.115020751953125, 0.1201019287109375, 0.12518310546875, 0.1302642822265625, 0.135345458984375, 0.1404266357421875, 0.1455078125, 0.1505889892578125, 0.155670166015625, 0.1607513427734375, 0.16583251953125, 0.1709136962890625, 0.175994873046875, 0.1810760498046875, 0.1861572265625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 12.0, 24.0, 84.0, 291.0, 355.0, 151.0, 49.0, 17.0, 12.0, 7.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9909154772758484, -0.9020388126373291, -0.8131622076034546, -0.7242856025695801, -0.6354089379310608, -0.5465322732925415, -0.457655668258667, -0.3687790036201477, -0.2799023985862732, -0.1910257637500763, -0.1021491289138794, -0.013272494077682495, 0.0756041407585144, 0.1644807755947113, 0.2533574104309082, 0.3422340750694275, 0.431110680103302, 0.5199873447418213, 0.6088639497756958, 0.6977405548095703, 0.7866172194480896, 0.8754938840866089, 0.9643704891204834, 1.0532472133636475, 1.1421236991882324, 1.231000304222107, 1.3198769092559814, 1.4087536334991455, 1.49763023853302, 1.5865068435668945, 1.6753835678100586, 1.764260172843933, 1.8531370162963867, 1.9420136213302612, 2.0308902263641357, 2.1197669506073, 2.2086434364318848, 2.297520160675049, 2.386396884918213, 2.475273609161377, 2.564150094985962, 2.653026819229126, 2.741903305053711, 2.830780029296875, 2.919656753540039, 3.008533239364624, 3.097409963607788, 3.186286449432373, 3.275163173675537, 3.364039897918701, 3.452916383743286, 3.54179310798645, 3.630669593811035, 3.719546318054199, 3.8084230422973633, 3.8972997665405273, 3.9861762523651123, 4.075052738189697, 4.163929462432861, 4.252806186676025, 4.3416829109191895, 4.4305596351623535, 4.519435882568359, 4.608312606811523, 4.6971893310546875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 7.0, 4.0, 6.0, 5.0, 11.0, 14.0, 22.0, 26.0, 25.0, 36.0, 33.0, 45.0, 47.0, 58.0, 49.0, 50.0, 77.0, 64.0, 50.0, 51.0, 52.0, 55.0, 41.0, 39.0, 32.0, 20.0, 22.0, 20.0, 12.0, 14.0, 8.0, 4.0, 1.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6463693380355835, -0.6231992840766907, -0.6000292897224426, -0.5768592357635498, -0.553689181804657, -0.5305191278457642, -0.5073491334915161, -0.4841790795326233, -0.46100902557373047, -0.43783900141716003, -0.4146689474582672, -0.3914989233016968, -0.36832886934280396, -0.3451588451862335, -0.3219888210296631, -0.29881876707077026, -0.27564874291419983, -0.2524787187576294, -0.22930866479873657, -0.20613864064216614, -0.18296858668327332, -0.15979856252670288, -0.13662852346897125, -0.11345848441123962, -0.090288445353508, -0.06711840629577637, -0.04394837096333504, -0.020778335630893707, 0.002391703426837921, 0.02556174248456955, 0.04873177409172058, 0.07190181314945221, 0.09507185220718384, 0.11824189126491547, 0.1414119303226471, 0.16458195447921753, 0.18775200843811035, 0.2109220325946808, 0.23409207165241241, 0.25726211071014404, 0.28043216466903687, 0.3036021888256073, 0.3267722427845001, 0.34994226694107056, 0.3731123208999634, 0.3962823450565338, 0.41945236921310425, 0.44262242317199707, 0.4657924473285675, 0.48896247148513794, 0.5121325254440308, 0.5353025794029236, 0.5584725737571716, 0.5816426277160645, 0.6048126816749573, 0.6279827356338501, 0.6511527299880981, 0.674322783946991, 0.697492778301239, 0.7206628322601318, 0.7438328862190247, 0.7670029401779175, 0.7901729345321655, 0.8133429884910583, 0.8365130424499512]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 10.0, 10.0, 19.0, 24.0, 34.0, 39.0, 70.0, 90.0, 165.0, 234.0, 440.0, 783.0, 1521.0, 2917.0, 5558.0, 12210.0, 29696.0, 84013.0, 305158.0, 413463.0, 121500.0, 40010.0, 15791.0, 7275.0, 3478.0, 1731.0, 952.0, 523.0, 314.0, 180.0, 112.0, 78.0, 40.0, 31.0, 23.0, 18.0, 14.0, 10.0, 7.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.1337890625, -0.13018798828125, -0.1265869140625, -0.12298583984375, -0.119384765625, -0.11578369140625, -0.1121826171875, -0.10858154296875, -0.10498046875, -0.10137939453125, -0.0977783203125, -0.09417724609375, -0.090576171875, -0.08697509765625, -0.0833740234375, -0.07977294921875, -0.076171875, -0.07257080078125, -0.0689697265625, -0.06536865234375, -0.061767578125, -0.05816650390625, -0.0545654296875, -0.05096435546875, -0.04736328125, -0.04376220703125, -0.0401611328125, -0.03656005859375, -0.032958984375, -0.02935791015625, -0.0257568359375, -0.02215576171875, -0.0185546875, -0.01495361328125, -0.0113525390625, -0.00775146484375, -0.004150390625, -0.00054931640625, 0.0030517578125, 0.00665283203125, 0.01025390625, 0.01385498046875, 0.0174560546875, 0.02105712890625, 0.024658203125, 0.02825927734375, 0.0318603515625, 0.03546142578125, 0.0390625, 0.04266357421875, 0.0462646484375, 0.04986572265625, 0.053466796875, 0.05706787109375, 0.0606689453125, 0.06427001953125, 0.06787109375, 0.07147216796875, 0.0750732421875, 0.07867431640625, 0.082275390625, 0.08587646484375, 0.0894775390625, 0.09307861328125, 0.0966796875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 3.0, 2.0, 7.0, 14.0, 9.0, 19.0, 15.0, 25.0, 23.0, 21.0, 30.0, 27.0, 41.0, 33.0, 50.0, 52.0, 60.0, 40.0, 44.0, 59.0, 58.0, 37.0, 51.0, 39.0, 43.0, 30.0, 26.0, 21.0, 29.0, 14.0, 16.0, 15.0, 10.0, 11.0, 9.0, 6.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039093017578125, -0.03761863708496094, -0.036144256591796875, -0.03466987609863281, -0.03319549560546875, -0.03172111511230469, -0.030246734619140625, -0.028772354125976562, -0.0272979736328125, -0.025823593139648438, -0.024349212646484375, -0.022874832153320312, -0.02140045166015625, -0.019926071166992188, -0.018451690673828125, -0.016977310180664062, -0.0155029296875, -0.014028549194335938, -0.012554168701171875, -0.011079788208007812, -0.00960540771484375, -0.008131027221679688, -0.006656646728515625, -0.0051822662353515625, -0.0037078857421875, -0.0022335052490234375, -0.000759124755859375, 0.0007152557373046875, 0.00218963623046875, 0.0036640167236328125, 0.005138397216796875, 0.0066127777099609375, 0.008087158203125, 0.009561538696289062, 0.011035919189453125, 0.012510299682617188, 0.01398468017578125, 0.015459060668945312, 0.016933441162109375, 0.018407821655273438, 0.0198822021484375, 0.021356582641601562, 0.022830963134765625, 0.024305343627929688, 0.02577972412109375, 0.027254104614257812, 0.028728485107421875, 0.030202865600585938, 0.03167724609375, 0.03315162658691406, 0.034626007080078125, 0.03610038757324219, 0.03757476806640625, 0.03904914855957031, 0.040523529052734375, 0.04199790954589844, 0.0434722900390625, 0.04494667053222656, 0.046421051025390625, 0.04789543151855469, 0.04936981201171875, 0.05084419250488281, 0.052318572998046875, 0.05379295349121094, 0.055267333984375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 8.0, 8.0, 7.0, 12.0, 15.0, 31.0, 54.0, 86.0, 110.0, 192.0, 311.0, 522.0, 1045.0, 2342.0, 7103.0, 37704.0, 661829.0, 303899.0, 23954.0, 5345.0, 1886.0, 925.0, 465.0, 256.0, 162.0, 92.0, 51.0, 54.0, 28.0, 23.0, 15.0, 9.0, 9.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2493896484375, -0.24224090576171875, -0.2350921630859375, -0.22794342041015625, -0.220794677734375, -0.21364593505859375, -0.2064971923828125, -0.19934844970703125, -0.19219970703125, -0.18505096435546875, -0.1779022216796875, -0.17075347900390625, -0.163604736328125, -0.15645599365234375, -0.1493072509765625, -0.14215850830078125, -0.135009765625, -0.12786102294921875, -0.1207122802734375, -0.11356353759765625, -0.106414794921875, -0.09926605224609375, -0.0921173095703125, -0.08496856689453125, -0.07781982421875, -0.07067108154296875, -0.0635223388671875, -0.05637359619140625, -0.049224853515625, -0.04207611083984375, -0.0349273681640625, -0.02777862548828125, -0.0206298828125, -0.01348114013671875, -0.0063323974609375, 0.00081634521484375, 0.007965087890625, 0.01511383056640625, 0.0222625732421875, 0.02941131591796875, 0.03656005859375, 0.04370880126953125, 0.0508575439453125, 0.05800628662109375, 0.065155029296875, 0.07230377197265625, 0.0794525146484375, 0.08660125732421875, 0.09375, 0.10089874267578125, 0.1080474853515625, 0.11519622802734375, 0.122344970703125, 0.12949371337890625, 0.1366424560546875, 0.14379119873046875, 0.15093994140625, 0.15808868408203125, 0.1652374267578125, 0.17238616943359375, 0.179534912109375, 0.18668365478515625, 0.1938323974609375, 0.20098114013671875, 0.2081298828125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 2.0, 3.0, 6.0, 8.0, 7.0, 17.0, 16.0, 7.0, 22.0, 25.0, 20.0, 29.0, 44.0, 45.0, 62.0, 58.0, 78.0, 62.0, 67.0, 54.0, 50.0, 57.0, 37.0, 51.0, 36.0, 22.0, 38.0, 23.0, 16.0, 13.0, 10.0, 10.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2310791015625, -0.2233448028564453, -0.21561050415039062, -0.20787620544433594, -0.20014190673828125, -0.19240760803222656, -0.18467330932617188, -0.1769390106201172, -0.1692047119140625, -0.1614704132080078, -0.15373611450195312, -0.14600181579589844, -0.13826751708984375, -0.13053321838378906, -0.12279891967773438, -0.11506462097167969, -0.107330322265625, -0.09959602355957031, -0.09186172485351562, -0.08412742614746094, -0.07639312744140625, -0.06865882873535156, -0.060924530029296875, -0.05319023132324219, -0.0454559326171875, -0.03772163391113281, -0.029987335205078125, -0.022253036499023438, -0.01451873779296875, -0.0067844390869140625, 0.000949859619140625, 0.008684158325195312, 0.01641845703125, 0.024152755737304688, 0.031887054443359375, 0.03962135314941406, 0.04735565185546875, 0.05508995056152344, 0.06282424926757812, 0.07055854797363281, 0.0782928466796875, 0.08602714538574219, 0.09376144409179688, 0.10149574279785156, 0.10923004150390625, 0.11696434020996094, 0.12469863891601562, 0.1324329376220703, 0.140167236328125, 0.1479015350341797, 0.15563583374023438, 0.16337013244628906, 0.17110443115234375, 0.17883872985839844, 0.18657302856445312, 0.1943073272705078, 0.2020416259765625, 0.2097759246826172, 0.21751022338867188, 0.22524452209472656, 0.23297882080078125, 0.24071311950683594, 0.24844741821289062, 0.2561817169189453, 0.263916015625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 3.0, 5.0, 9.0, 17.0, 22.0, 47.0, 64.0, 96.0, 174.0, 340.0, 650.0, 1448.0, 3890.0, 13165.0, 81819.0, 820644.0, 103727.0, 15203.0, 4216.0, 1558.0, 648.0, 312.0, 176.0, 135.0, 60.0, 40.0, 28.0, 14.0, 12.0, 9.0, 3.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.11456298828125, -0.11114788055419922, -0.10773277282714844, -0.10431766510009766, -0.10090255737304688, -0.0974874496459961, -0.09407234191894531, -0.09065723419189453, -0.08724212646484375, -0.08382701873779297, -0.08041191101074219, -0.0769968032836914, -0.07358169555664062, -0.07016658782958984, -0.06675148010253906, -0.06333637237548828, -0.0599212646484375, -0.05650615692138672, -0.05309104919433594, -0.049675941467285156, -0.046260833740234375, -0.042845726013183594, -0.03943061828613281, -0.03601551055908203, -0.03260040283203125, -0.02918529510498047, -0.025770187377929688, -0.022355079650878906, -0.018939971923828125, -0.015524864196777344, -0.012109756469726562, -0.008694648742675781, -0.005279541015625, -0.0018644332885742188, 0.0015506744384765625, 0.004965782165527344, 0.008380889892578125, 0.011795997619628906, 0.015211105346679688, 0.01862621307373047, 0.02204132080078125, 0.02545642852783203, 0.028871536254882812, 0.032286643981933594, 0.035701751708984375, 0.039116859436035156, 0.04253196716308594, 0.04594707489013672, 0.0493621826171875, 0.05277729034423828, 0.05619239807128906, 0.059607505798339844, 0.06302261352539062, 0.0664377212524414, 0.06985282897949219, 0.07326793670654297, 0.07668304443359375, 0.08009815216064453, 0.08351325988769531, 0.0869283676147461, 0.09034347534179688, 0.09375858306884766, 0.09717369079589844, 0.10058879852294922, 0.10400390625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 5.0, 2.0, 5.0, 2.0, 7.0, 7.0, 14.0, 9.0, 18.0, 33.0, 34.0, 45.0, 80.0, 134.0, 145.0, 140.0, 100.0, 61.0, 35.0, 37.0, 20.0, 19.0, 10.0, 8.0, 10.0, 6.0, 7.0, 3.0, 9.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.334615707397461e-05, -5.212612450122833e-05, -5.0906091928482056e-05, -4.968605935573578e-05, -4.84660267829895e-05, -4.7245994210243225e-05, -4.602596163749695e-05, -4.480592906475067e-05, -4.3585896492004395e-05, -4.236586391925812e-05, -4.114583134651184e-05, -3.9925798773765564e-05, -3.870576620101929e-05, -3.748573362827301e-05, -3.6265701055526733e-05, -3.5045668482780457e-05, -3.382563591003418e-05, -3.26056033372879e-05, -3.1385570764541626e-05, -3.016553819179535e-05, -2.8945505619049072e-05, -2.7725473046302795e-05, -2.650544047355652e-05, -2.5285407900810242e-05, -2.4065375328063965e-05, -2.2845342755317688e-05, -2.162531018257141e-05, -2.0405277609825134e-05, -1.9185245037078857e-05, -1.796521246433258e-05, -1.6745179891586304e-05, -1.5525147318840027e-05, -1.430511474609375e-05, -1.3085082173347473e-05, -1.1865049600601196e-05, -1.064501702785492e-05, -9.424984455108643e-06, -8.204951882362366e-06, -6.984919309616089e-06, -5.764886736869812e-06, -4.544854164123535e-06, -3.3248215913772583e-06, -2.1047890186309814e-06, -8.847564458847046e-07, 3.3527612686157227e-07, 1.5553086996078491e-06, 2.775341272354126e-06, 3.995373845100403e-06, 5.21540641784668e-06, 6.4354389905929565e-06, 7.655471563339233e-06, 8.87550413608551e-06, 1.0095536708831787e-05, 1.1315569281578064e-05, 1.253560185432434e-05, 1.3755634427070618e-05, 1.4975666999816895e-05, 1.619569957256317e-05, 1.7415732145309448e-05, 1.8635764718055725e-05, 1.9855797290802002e-05, 2.107582986354828e-05, 2.2295862436294556e-05, 2.3515895009040833e-05, 2.473592758178711e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 4.0, 5.0, 2.0, 5.0, 4.0, 2.0, 11.0, 12.0, 14.0, 24.0, 36.0, 43.0, 45.0, 79.0, 174.0, 244.0, 467.0, 946.0, 2280.0, 7245.0, 39671.0, 702855.0, 265547.0, 20588.0, 4805.0, 1698.0, 789.0, 373.0, 189.0, 123.0, 88.0, 53.0, 34.0, 30.0, 19.0, 13.0, 11.0, 6.0, 9.0, 4.0, 6.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.12548828125, -0.12208175659179688, -0.11867523193359375, -0.11526870727539062, -0.1118621826171875, -0.10845565795898438, -0.10504913330078125, -0.10164260864257812, -0.098236083984375, -0.09482955932617188, -0.09142303466796875, -0.08801651000976562, -0.0846099853515625, -0.08120346069335938, -0.07779693603515625, -0.07439041137695312, -0.07098388671875, -0.06757736206054688, -0.06417083740234375, -0.060764312744140625, -0.0573577880859375, -0.053951263427734375, -0.05054473876953125, -0.047138214111328125, -0.043731689453125, -0.040325164794921875, -0.03691864013671875, -0.033512115478515625, -0.0301055908203125, -0.026699066162109375, -0.02329254150390625, -0.019886016845703125, -0.0164794921875, -0.013072967529296875, -0.00966644287109375, -0.006259918212890625, -0.0028533935546875, 0.000553131103515625, 0.00395965576171875, 0.007366180419921875, 0.010772705078125, 0.014179229736328125, 0.01758575439453125, 0.020992279052734375, 0.0243988037109375, 0.027805328369140625, 0.03121185302734375, 0.034618377685546875, 0.03802490234375, 0.041431427001953125, 0.04483795166015625, 0.048244476318359375, 0.0516510009765625, 0.055057525634765625, 0.05846405029296875, 0.061870574951171875, 0.065277099609375, 0.06868362426757812, 0.07209014892578125, 0.07549667358398438, 0.0789031982421875, 0.08230972290039062, 0.08571624755859375, 0.08912277221679688, 0.092529296875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 2.0, 6.0, 7.0, 6.0, 11.0, 8.0, 10.0, 13.0, 26.0, 34.0, 36.0, 56.0, 73.0, 77.0, 91.0, 96.0, 89.0, 86.0, 71.0, 53.0, 20.0, 28.0, 22.0, 12.0, 15.0, 9.0, 5.0, 11.0, 2.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.07025146484375, -0.06768798828125, -0.06512451171875, -0.06256103515625, -0.05999755859375, -0.05743408203125, -0.05487060546875, -0.05230712890625, -0.04974365234375, -0.04718017578125, -0.04461669921875, -0.04205322265625, -0.03948974609375, -0.03692626953125, -0.03436279296875, -0.03179931640625, -0.02923583984375, -0.02667236328125, -0.02410888671875, -0.02154541015625, -0.01898193359375, -0.01641845703125, -0.01385498046875, -0.01129150390625, -0.00872802734375, -0.00616455078125, -0.00360107421875, -0.00103759765625, 0.00152587890625, 0.00408935546875, 0.00665283203125, 0.00921630859375, 0.01177978515625, 0.01434326171875, 0.01690673828125, 0.01947021484375, 0.02203369140625, 0.02459716796875, 0.02716064453125, 0.02972412109375, 0.03228759765625, 0.03485107421875, 0.03741455078125, 0.03997802734375, 0.04254150390625, 0.04510498046875, 0.04766845703125, 0.05023193359375, 0.05279541015625, 0.05535888671875, 0.05792236328125, 0.06048583984375, 0.06304931640625, 0.06561279296875, 0.06817626953125, 0.07073974609375, 0.07330322265625, 0.07586669921875, 0.07843017578125, 0.08099365234375, 0.08355712890625, 0.08612060546875, 0.08868408203125, 0.09124755859375, 0.09381103515625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 19.0, 76.0, 279.0, 420.0, 147.0, 37.0, 7.0, 6.0, 3.0, 2.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.326026201248169, -3.212735891342163, -3.0994455814361572, -2.9861555099487305, -2.8728652000427246, -2.7595748901367188, -2.646284580230713, -2.532994270324707, -2.419703960418701, -2.3064136505126953, -2.1931233406066895, -2.0798330307006836, -1.9665428400039673, -1.853252649307251, -1.7399623394012451, -1.6266720294952393, -1.513381838798523, -1.400091528892517, -1.2868013381958008, -1.173511028289795, -1.060220718383789, -0.946930468082428, -0.8336402177810669, -0.720349907875061, -0.6070596575737, -0.4937693774700165, -0.380479097366333, -0.2671888470649719, -0.15389856696128845, -0.04060828685760498, 0.0726819634437561, 0.18597227334976196, 0.29926252365112305, 0.4125528037548065, 0.52584308385849, 0.6391333341598511, 0.7524236440658569, 0.865713894367218, 0.9790041446685791, 1.092294454574585, 1.2055847644805908, 1.3188750743865967, 1.432165265083313, 1.5454555749893188, 1.6587458848953247, 1.772036075592041, 1.8853263854980469, 1.9986166954040527, 2.1119070053100586, 2.2251973152160645, 2.3384876251220703, 2.451777935028076, 2.565068006515503, 2.678358316421509, 2.7916486263275146, 2.9049389362335205, 3.0182290077209473, 3.131519317626953, 3.244809627532959, 3.358099937438965, 3.4713900089263916, 3.5846803188323975, 3.6979706287384033, 3.811260938644409, 3.924551248550415]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 6.0, 6.0, 8.0, 22.0, 20.0, 25.0, 41.0, 45.0, 45.0, 58.0, 62.0, 72.0, 86.0, 92.0, 82.0, 60.0, 74.0, 51.0, 37.0, 23.0, 29.0, 19.0, 8.0, 12.0, 9.0, 4.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.7596783638000488, -1.7197473049163818, -1.6798162460327148, -1.6398853063583374, -1.5999542474746704, -1.5600231885910034, -1.520092248916626, -1.480161190032959, -1.440230131149292, -1.400299072265625, -1.360368013381958, -1.3204370737075806, -1.2805060148239136, -1.2405749559402466, -1.2006440162658691, -1.1607129573822021, -1.1207818984985352, -1.0808508396148682, -1.0409197807312012, -1.0009888410568237, -0.9610577821731567, -0.9211267232894897, -0.8811957240104675, -0.8412647247314453, -0.8013336658477783, -0.7614026069641113, -0.7214716076850891, -0.6815406084060669, -0.6416095495223999, -0.6016784906387329, -0.5617474913597107, -0.5218164920806885, -0.4818854331970215, -0.4419544041156769, -0.4020233750343323, -0.36209234595298767, -0.32216131687164307, -0.28223028779029846, -0.24229925870895386, -0.20236822962760925, -0.16243720054626465, -0.12250617146492004, -0.08257514238357544, -0.042644113302230835, -0.0027130842208862305, 0.037217944860458374, 0.07714897394180298, 0.11708000302314758, 0.1570110321044922, 0.1969420611858368, 0.2368730902671814, 0.276804119348526, 0.3167351484298706, 0.3566661775112152, 0.3965972065925598, 0.4365282356739044, 0.476459264755249, 0.516390323638916, 0.5563213229179382, 0.5962523221969604, 0.6361833810806274, 0.6761144399642944, 0.7160454392433167, 0.7559764385223389, 0.7959074974060059]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 6.0, 9.0, 5.0, 3.0, 15.0, 14.0, 21.0, 18.0, 23.0, 45.0, 70.0, 112.0, 191.0, 375.0, 747.0, 1634.0, 4933.0, 21573.0, 368006.0, 3702071.0, 78213.0, 10886.0, 3121.0, 1087.0, 480.0, 251.0, 133.0, 71.0, 50.0, 31.0, 13.0, 13.0, 15.0, 6.0, 13.0, 9.0, 6.0, 4.0, 2.0, 0.0, 4.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1695556640625, -0.1635608673095703, -0.15756607055664062, -0.15157127380371094, -0.14557647705078125, -0.13958168029785156, -0.13358688354492188, -0.1275920867919922, -0.1215972900390625, -0.11560249328613281, -0.10960769653320312, -0.10361289978027344, -0.09761810302734375, -0.09162330627441406, -0.08562850952148438, -0.07963371276855469, -0.073638916015625, -0.06764411926269531, -0.061649322509765625, -0.05565452575683594, -0.04965972900390625, -0.04366493225097656, -0.037670135498046875, -0.03167533874511719, -0.0256805419921875, -0.019685745239257812, -0.013690948486328125, -0.0076961517333984375, -0.00170135498046875, 0.0042934417724609375, 0.010288238525390625, 0.016283035278320312, 0.02227783203125, 0.028272628784179688, 0.034267425537109375, 0.04026222229003906, 0.04625701904296875, 0.05225181579589844, 0.058246612548828125, 0.06424140930175781, 0.0702362060546875, 0.07623100280761719, 0.08222579956054688, 0.08822059631347656, 0.09421539306640625, 0.10021018981933594, 0.10620498657226562, 0.11219978332519531, 0.118194580078125, 0.12418937683105469, 0.13018417358398438, 0.13617897033691406, 0.14217376708984375, 0.14816856384277344, 0.15416336059570312, 0.1601581573486328, 0.1661529541015625, 0.1721477508544922, 0.17814254760742188, 0.18413734436035156, 0.19013214111328125, 0.19612693786621094, 0.20212173461914062, 0.2081165313720703, 0.214111328125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 8.0, 14.0, 24.0, 27.0, 28.0, 49.0, 53.0, 59.0, 73.0, 67.0, 75.0, 68.0, 84.0, 80.0, 74.0, 56.0, 31.0, 31.0, 40.0, 26.0, 11.0, 10.0, 4.0, 10.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09393310546875, -0.09165096282958984, -0.08936882019042969, -0.08708667755126953, -0.08480453491210938, -0.08252239227294922, -0.08024024963378906, -0.0779581069946289, -0.07567596435546875, -0.0733938217163086, -0.07111167907714844, -0.06882953643798828, -0.06654739379882812, -0.06426525115966797, -0.06198310852050781, -0.059700965881347656, -0.0574188232421875, -0.055136680603027344, -0.05285453796386719, -0.05057239532470703, -0.048290252685546875, -0.04600811004638672, -0.04372596740722656, -0.041443824768066406, -0.03916168212890625, -0.036879539489746094, -0.03459739685058594, -0.03231525421142578, -0.030033111572265625, -0.02775096893310547, -0.025468826293945312, -0.023186683654785156, -0.020904541015625, -0.018622398376464844, -0.016340255737304688, -0.014058113098144531, -0.011775970458984375, -0.009493827819824219, -0.0072116851806640625, -0.004929542541503906, -0.00264739990234375, -0.00036525726318359375, 0.0019168853759765625, 0.004199028015136719, 0.006481170654296875, 0.008763313293457031, 0.011045455932617188, 0.013327598571777344, 0.0156097412109375, 0.017891883850097656, 0.020174026489257812, 0.02245616912841797, 0.024738311767578125, 0.02702045440673828, 0.029302597045898438, 0.031584739685058594, 0.03386688232421875, 0.036149024963378906, 0.03843116760253906, 0.04071331024169922, 0.042995452880859375, 0.04527759552001953, 0.04755973815917969, 0.049841880798339844, 0.0521240234375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 7.0, 10.0, 21.0, 23.0, 33.0, 56.0, 96.0, 159.0, 293.0, 604.0, 1361.0, 3579.0, 11957.0, 50433.0, 444832.0, 3413794.0, 216734.0, 35075.0, 9344.0, 3152.0, 1268.0, 615.0, 318.0, 185.0, 124.0, 64.0, 48.0, 30.0, 29.0, 15.0, 7.0, 7.0, 2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.173095703125, -0.1683368682861328, -0.16357803344726562, -0.15881919860839844, -0.15406036376953125, -0.14930152893066406, -0.14454269409179688, -0.1397838592529297, -0.1350250244140625, -0.1302661895751953, -0.12550735473632812, -0.12074851989746094, -0.11598968505859375, -0.11123085021972656, -0.10647201538085938, -0.10171318054199219, -0.096954345703125, -0.09219551086425781, -0.08743667602539062, -0.08267784118652344, -0.07791900634765625, -0.07316017150878906, -0.06840133666992188, -0.06364250183105469, -0.0588836669921875, -0.05412483215332031, -0.049365997314453125, -0.04460716247558594, -0.03984832763671875, -0.03508949279785156, -0.030330657958984375, -0.025571823120117188, -0.02081298828125, -0.016054153442382812, -0.011295318603515625, -0.0065364837646484375, -0.00177764892578125, 0.0029811859130859375, 0.007740020751953125, 0.012498855590820312, 0.0172576904296875, 0.022016525268554688, 0.026775360107421875, 0.03153419494628906, 0.03629302978515625, 0.04105186462402344, 0.045810699462890625, 0.05056953430175781, 0.055328369140625, 0.06008720397949219, 0.06484603881835938, 0.06960487365722656, 0.07436370849609375, 0.07912254333496094, 0.08388137817382812, 0.08864021301269531, 0.0933990478515625, 0.09815788269042969, 0.10291671752929688, 0.10767555236816406, 0.11243438720703125, 0.11719322204589844, 0.12195205688476562, 0.1267108917236328, 0.1314697265625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 6.0, 2.0, 1.0, 4.0, 6.0, 4.0, 8.0, 10.0, 13.0, 12.0, 22.0, 32.0, 43.0, 68.0, 93.0, 163.0, 319.0, 581.0, 996.0, 726.0, 375.0, 204.0, 111.0, 76.0, 51.0, 28.0, 30.0, 22.0, 21.0, 11.0, 7.0, 15.0, 6.0, 5.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08795166015625, -0.08370304107666016, -0.07945442199707031, -0.07520580291748047, -0.07095718383789062, -0.06670856475830078, -0.06245994567871094, -0.058211326599121094, -0.05396270751953125, -0.049714088439941406, -0.04546546936035156, -0.04121685028076172, -0.036968231201171875, -0.03271961212158203, -0.028470993041992188, -0.024222373962402344, -0.0199737548828125, -0.015725135803222656, -0.011476516723632812, -0.007227897644042969, -0.002979278564453125, 0.0012693405151367188, 0.0055179595947265625, 0.009766578674316406, 0.01401519775390625, 0.018263816833496094, 0.022512435913085938, 0.02676105499267578, 0.031009674072265625, 0.03525829315185547, 0.03950691223144531, 0.043755531311035156, 0.048004150390625, 0.052252769470214844, 0.05650138854980469, 0.06075000762939453, 0.06499862670898438, 0.06924724578857422, 0.07349586486816406, 0.0777444839477539, 0.08199310302734375, 0.0862417221069336, 0.09049034118652344, 0.09473896026611328, 0.09898757934570312, 0.10323619842529297, 0.10748481750488281, 0.11173343658447266, 0.1159820556640625, 0.12023067474365234, 0.12447929382324219, 0.12872791290283203, 0.13297653198242188, 0.13722515106201172, 0.14147377014160156, 0.1457223892211914, 0.14997100830078125, 0.1542196273803711, 0.15846824645996094, 0.16271686553955078, 0.16696548461914062, 0.17121410369873047, 0.1754627227783203, 0.17971134185791016, 0.1839599609375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 5.0, 19.0, 32.0, 67.0, 177.0, 249.0, 218.0, 111.0, 48.0, 32.0, 17.0, 5.0, 9.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.702487051486969, -0.6507090926170349, -0.598931074142456, -0.547153115272522, -0.4953750967979431, -0.44359713792800903, -0.39181914925575256, -0.3400411605834961, -0.2882631719112396, -0.23648518323898315, -0.18470719456672668, -0.1329292207956314, -0.08115123212337494, -0.029373258352279663, 0.022404730319976807, 0.07418271899223328, 0.12596070766448975, 0.17773869633674622, 0.22951668500900269, 0.28129464387893677, 0.3330726623535156, 0.3848506212234497, 0.4366286098957062, 0.48840659856796265, 0.5401846170425415, 0.5919625759124756, 0.6437405943870544, 0.6955185532569885, 0.7472965717315674, 0.7990745306015015, 0.8508524894714355, 0.9026305079460144, 0.9544085264205933, 1.0061864852905273, 1.0579644441604614, 1.109742522239685, 1.1615204811096191, 1.2132984399795532, 1.2650763988494873, 1.316854476928711, 1.368632435798645, 1.420410394668579, 1.4721883535385132, 1.5239664316177368, 1.575744390487671, 1.627522349357605, 1.679300308227539, 1.7310783863067627, 1.7828562259674072, 1.8346341848373413, 1.8864121437072754, 1.938190221786499, 1.989968180656433, 2.041746139526367, 2.093524217605591, 2.1453020572662354, 2.197080135345459, 2.2488582134246826, 2.300636053085327, 2.352414131164551, 2.4041919708251953, 2.455970048904419, 2.5077481269836426, 2.559525966644287, 2.6113040447235107]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 2.0, 3.0, 5.0, 9.0, 9.0, 8.0, 9.0, 12.0, 17.0, 21.0, 23.0, 26.0, 29.0, 40.0, 33.0, 27.0, 47.0, 47.0, 42.0, 40.0, 50.0, 52.0, 42.0, 34.0, 38.0, 43.0, 37.0, 34.0, 31.0, 28.0, 26.0, 24.0, 16.0, 11.0, 17.0, 10.0, 10.0, 15.0, 13.0, 11.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5210294723510742, -0.5037463307380676, -0.48646318912506104, -0.46918004751205444, -0.45189690589904785, -0.43461376428604126, -0.41733065247535706, -0.40004751086235046, -0.38276436924934387, -0.3654812276363373, -0.3481980860233307, -0.3309149444103241, -0.3136318325996399, -0.2963486909866333, -0.2790655493736267, -0.2617824077606201, -0.24449926614761353, -0.22721612453460693, -0.20993298292160034, -0.19264985620975494, -0.17536671459674835, -0.15808357298374176, -0.14080044627189636, -0.12351730465888977, -0.10623416304588318, -0.08895102143287659, -0.07166788727045059, -0.0543847493827343, -0.037101611495018005, -0.019818469882011414, -0.0025353357195854187, 0.014747798442840576, 0.03203094005584717, 0.04931407794356346, 0.06659721583127975, 0.08388034999370575, 0.10116349160671234, 0.11844663321971893, 0.13572975993156433, 0.15301290154457092, 0.17029604315757751, 0.1875791847705841, 0.2048623263835907, 0.2221454530954361, 0.2394285947084427, 0.2567117214202881, 0.2739948630332947, 0.29127800464630127, 0.30856114625930786, 0.32584428787231445, 0.34312742948532104, 0.36041057109832764, 0.37769371271133423, 0.3949768543243408, 0.412259966135025, 0.4295431077480316, 0.4468262493610382, 0.4641093909740448, 0.4813925325870514, 0.498675674200058, 0.5159587860107422, 0.5332419276237488, 0.5505250692367554, 0.567808210849762, 0.5850913524627686]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 8.0, 6.0, 9.0, 13.0, 19.0, 34.0, 39.0, 57.0, 83.0, 130.0, 194.0, 288.0, 474.0, 758.0, 1418.0, 2457.0, 4791.0, 9855.0, 22748.0, 62084.0, 225608.0, 474771.0, 159532.0, 47371.0, 18277.0, 8219.0, 4033.0, 2201.0, 1233.0, 679.0, 391.0, 268.0, 142.0, 104.0, 75.0, 47.0, 50.0, 28.0, 19.0, 13.0, 9.0, 5.0, 4.0, 3.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.11395263671875, -0.11053848266601562, -0.10712432861328125, -0.10371017456054688, -0.1002960205078125, -0.09688186645507812, -0.09346771240234375, -0.09005355834960938, -0.086639404296875, -0.08322525024414062, -0.07981109619140625, -0.07639694213867188, -0.0729827880859375, -0.06956863403320312, -0.06615447998046875, -0.06274032592773438, -0.059326171875, -0.055912017822265625, -0.05249786376953125, -0.049083709716796875, -0.0456695556640625, -0.042255401611328125, -0.03884124755859375, -0.035427093505859375, -0.032012939453125, -0.028598785400390625, -0.02518463134765625, -0.021770477294921875, -0.0183563232421875, -0.014942169189453125, -0.01152801513671875, -0.008113861083984375, -0.00469970703125, -0.001285552978515625, 0.00212860107421875, 0.005542755126953125, 0.0089569091796875, 0.012371063232421875, 0.01578521728515625, 0.019199371337890625, 0.022613525390625, 0.026027679443359375, 0.02944183349609375, 0.032855987548828125, 0.0362701416015625, 0.039684295654296875, 0.04309844970703125, 0.046512603759765625, 0.0499267578125, 0.053340911865234375, 0.05675506591796875, 0.060169219970703125, 0.0635833740234375, 0.06699752807617188, 0.07041168212890625, 0.07382583618164062, 0.077239990234375, 0.08065414428710938, 0.08406829833984375, 0.08748245239257812, 0.0908966064453125, 0.09431076049804688, 0.09772491455078125, 0.10113906860351562, 0.10455322265625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 4.0, 6.0, 9.0, 8.0, 9.0, 15.0, 19.0, 15.0, 28.0, 35.0, 29.0, 39.0, 37.0, 38.0, 36.0, 45.0, 59.0, 52.0, 58.0, 48.0, 55.0, 45.0, 32.0, 42.0, 44.0, 35.0, 39.0, 37.0, 23.0, 15.0, 12.0, 4.0, 4.0, 7.0, 9.0, 3.0, 2.0, 5.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.058685302734375, -0.057065486907958984, -0.05544567108154297, -0.05382585525512695, -0.05220603942871094, -0.05058622360229492, -0.048966407775878906, -0.04734659194946289, -0.045726776123046875, -0.04410696029663086, -0.042487144470214844, -0.04086732864379883, -0.03924751281738281, -0.0376276969909668, -0.03600788116455078, -0.034388065338134766, -0.03276824951171875, -0.031148433685302734, -0.02952861785888672, -0.027908802032470703, -0.026288986206054688, -0.024669170379638672, -0.023049354553222656, -0.02142953872680664, -0.019809722900390625, -0.01818990707397461, -0.016570091247558594, -0.014950275421142578, -0.013330459594726562, -0.011710643768310547, -0.010090827941894531, -0.008471012115478516, -0.0068511962890625, -0.005231380462646484, -0.0036115646362304688, -0.001991748809814453, -0.0003719329833984375, 0.0012478828430175781, 0.0028676986694335938, 0.004487514495849609, 0.006107330322265625, 0.007727146148681641, 0.009346961975097656, 0.010966777801513672, 0.012586593627929688, 0.014206409454345703, 0.01582622528076172, 0.017446041107177734, 0.01906585693359375, 0.020685672760009766, 0.02230548858642578, 0.023925304412841797, 0.025545120239257812, 0.027164936065673828, 0.028784751892089844, 0.03040456771850586, 0.032024383544921875, 0.03364419937133789, 0.035264015197753906, 0.03688383102416992, 0.03850364685058594, 0.04012346267700195, 0.04174327850341797, 0.043363094329833984, 0.04498291015625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 1.0, 1.0, 9.0, 8.0, 13.0, 9.0, 11.0, 28.0, 36.0, 69.0, 102.0, 170.0, 310.0, 620.0, 1480.0, 4276.0, 19362.0, 174885.0, 773766.0, 59410.0, 9295.0, 2609.0, 1025.0, 451.0, 252.0, 128.0, 70.0, 48.0, 36.0, 23.0, 16.0, 15.0, 6.0, 6.0, 7.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2423095703125, -0.2348041534423828, -0.22729873657226562, -0.21979331970214844, -0.21228790283203125, -0.20478248596191406, -0.19727706909179688, -0.1897716522216797, -0.1822662353515625, -0.1747608184814453, -0.16725540161132812, -0.15974998474121094, -0.15224456787109375, -0.14473915100097656, -0.13723373413085938, -0.1297283172607422, -0.122222900390625, -0.11471748352050781, -0.10721206665039062, -0.09970664978027344, -0.09220123291015625, -0.08469581604003906, -0.07719039916992188, -0.06968498229980469, -0.0621795654296875, -0.05467414855957031, -0.047168731689453125, -0.03966331481933594, -0.03215789794921875, -0.024652481079101562, -0.017147064208984375, -0.009641647338867188, -0.00213623046875, 0.0053691864013671875, 0.012874603271484375, 0.020380020141601562, 0.02788543701171875, 0.03539085388183594, 0.042896270751953125, 0.05040168762207031, 0.0579071044921875, 0.06541252136230469, 0.07291793823242188, 0.08042335510253906, 0.08792877197265625, 0.09543418884277344, 0.10293960571289062, 0.11044502258300781, 0.117950439453125, 0.1254558563232422, 0.13296127319335938, 0.14046669006347656, 0.14797210693359375, 0.15547752380371094, 0.16298294067382812, 0.1704883575439453, 0.1779937744140625, 0.1854991912841797, 0.19300460815429688, 0.20051002502441406, 0.20801544189453125, 0.21552085876464844, 0.22302627563476562, 0.2305316925048828, 0.238037109375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 3.0, 6.0, 5.0, 4.0, 9.0, 10.0, 14.0, 14.0, 23.0, 22.0, 29.0, 34.0, 36.0, 48.0, 42.0, 40.0, 44.0, 44.0, 59.0, 54.0, 55.0, 56.0, 52.0, 48.0, 36.0, 36.0, 35.0, 18.0, 21.0, 18.0, 18.0, 13.0, 10.0, 7.0, 8.0, 7.0, 5.0, 8.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.2470703125, -0.2401905059814453, -0.23331069946289062, -0.22643089294433594, -0.21955108642578125, -0.21267127990722656, -0.20579147338867188, -0.1989116668701172, -0.1920318603515625, -0.1851520538330078, -0.17827224731445312, -0.17139244079589844, -0.16451263427734375, -0.15763282775878906, -0.15075302124023438, -0.1438732147216797, -0.136993408203125, -0.1301136016845703, -0.12323379516601562, -0.11635398864746094, -0.10947418212890625, -0.10259437561035156, -0.09571456909179688, -0.08883476257324219, -0.0819549560546875, -0.07507514953613281, -0.06819534301757812, -0.06131553649902344, -0.05443572998046875, -0.04755592346191406, -0.040676116943359375, -0.03379631042480469, -0.02691650390625, -0.020036697387695312, -0.013156890869140625, -0.0062770843505859375, 0.00060272216796875, 0.0074825286865234375, 0.014362335205078125, 0.021242141723632812, 0.0281219482421875, 0.03500175476074219, 0.041881561279296875, 0.04876136779785156, 0.05564117431640625, 0.06252098083496094, 0.06940078735351562, 0.07628059387207031, 0.083160400390625, 0.09004020690917969, 0.09692001342773438, 0.10379981994628906, 0.11067962646484375, 0.11755943298339844, 0.12443923950195312, 0.1313190460205078, 0.1381988525390625, 0.1450786590576172, 0.15195846557617188, 0.15883827209472656, 0.16571807861328125, 0.17259788513183594, 0.17947769165039062, 0.1863574981689453, 0.1932373046875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 12.0, 13.0, 18.0, 23.0, 38.0, 65.0, 88.0, 174.0, 401.0, 919.0, 2859.0, 12238.0, 95501.0, 780448.0, 135027.0, 15459.0, 3290.0, 1023.0, 470.0, 203.0, 109.0, 66.0, 35.0, 19.0, 14.0, 10.0, 8.0, 1.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1107177734375, -0.10709571838378906, -0.10347366333007812, -0.09985160827636719, -0.09622955322265625, -0.09260749816894531, -0.08898544311523438, -0.08536338806152344, -0.0817413330078125, -0.07811927795410156, -0.07449722290039062, -0.07087516784667969, -0.06725311279296875, -0.06363105773925781, -0.060009002685546875, -0.05638694763183594, -0.052764892578125, -0.04914283752441406, -0.045520782470703125, -0.04189872741699219, -0.03827667236328125, -0.03465461730957031, -0.031032562255859375, -0.027410507202148438, -0.0237884521484375, -0.020166397094726562, -0.016544342041015625, -0.012922286987304688, -0.00930023193359375, -0.0056781768798828125, -0.002056121826171875, 0.0015659332275390625, 0.00518798828125, 0.008810043334960938, 0.012432098388671875, 0.016054153442382812, 0.01967620849609375, 0.023298263549804688, 0.026920318603515625, 0.030542373657226562, 0.0341644287109375, 0.03778648376464844, 0.041408538818359375, 0.04503059387207031, 0.04865264892578125, 0.05227470397949219, 0.055896759033203125, 0.05951881408691406, 0.063140869140625, 0.06676292419433594, 0.07038497924804688, 0.07400703430175781, 0.07762908935546875, 0.08125114440917969, 0.08487319946289062, 0.08849525451660156, 0.0921173095703125, 0.09573936462402344, 0.09936141967773438, 0.10298347473144531, 0.10660552978515625, 0.11022758483886719, 0.11384963989257812, 0.11747169494628906, 0.12109375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 1.0, 0.0, 4.0, 4.0, 4.0, 4.0, 3.0, 7.0, 14.0, 13.0, 24.0, 24.0, 36.0, 48.0, 62.0, 72.0, 83.0, 98.0, 100.0, 85.0, 77.0, 66.0, 44.0, 34.0, 18.0, 18.0, 12.0, 7.0, 13.0, 3.0, 6.0, 5.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.331899642944336e-05, -3.248453140258789e-05, -3.165006637573242e-05, -3.081560134887695e-05, -2.9981136322021484e-05, -2.9146671295166016e-05, -2.8312206268310547e-05, -2.7477741241455078e-05, -2.664327621459961e-05, -2.580881118774414e-05, -2.4974346160888672e-05, -2.4139881134033203e-05, -2.3305416107177734e-05, -2.2470951080322266e-05, -2.1636486053466797e-05, -2.0802021026611328e-05, -1.996755599975586e-05, -1.913309097290039e-05, -1.8298625946044922e-05, -1.7464160919189453e-05, -1.6629695892333984e-05, -1.5795230865478516e-05, -1.4960765838623047e-05, -1.4126300811767578e-05, -1.329183578491211e-05, -1.245737075805664e-05, -1.1622905731201172e-05, -1.0788440704345703e-05, -9.953975677490234e-06, -9.119510650634766e-06, -8.285045623779297e-06, -7.450580596923828e-06, -6.616115570068359e-06, -5.781650543212891e-06, -4.947185516357422e-06, -4.112720489501953e-06, -3.2782554626464844e-06, -2.4437904357910156e-06, -1.6093254089355469e-06, -7.748603820800781e-07, 5.960464477539063e-08, 8.940696716308594e-07, 1.7285346984863281e-06, 2.562999725341797e-06, 3.3974647521972656e-06, 4.231929779052734e-06, 5.066394805908203e-06, 5.900859832763672e-06, 6.735324859619141e-06, 7.569789886474609e-06, 8.404254913330078e-06, 9.238719940185547e-06, 1.0073184967041016e-05, 1.0907649993896484e-05, 1.1742115020751953e-05, 1.2576580047607422e-05, 1.341104507446289e-05, 1.424551010131836e-05, 1.5079975128173828e-05, 1.5914440155029297e-05, 1.6748905181884766e-05, 1.7583370208740234e-05, 1.8417835235595703e-05, 1.9252300262451172e-05, 2.008676528930664e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 6.0, 10.0, 20.0, 33.0, 43.0, 84.0, 175.0, 437.0, 1224.0, 4923.0, 41140.0, 817080.0, 168954.0, 11153.0, 2070.0, 627.0, 277.0, 117.0, 54.0, 67.0, 23.0, 14.0, 11.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09228515625, -0.08783149719238281, -0.08337783813476562, -0.07892417907714844, -0.07447052001953125, -0.07001686096191406, -0.06556320190429688, -0.06110954284667969, -0.0566558837890625, -0.05220222473144531, -0.047748565673828125, -0.04329490661621094, -0.03884124755859375, -0.03438758850097656, -0.029933929443359375, -0.025480270385742188, -0.021026611328125, -0.016572952270507812, -0.012119293212890625, -0.0076656341552734375, -0.00321197509765625, 0.0012416839599609375, 0.005695343017578125, 0.010149002075195312, 0.0146026611328125, 0.019056320190429688, 0.023509979248046875, 0.027963638305664062, 0.03241729736328125, 0.03687095642089844, 0.041324615478515625, 0.04577827453613281, 0.05023193359375, 0.05468559265136719, 0.059139251708984375, 0.06359291076660156, 0.06804656982421875, 0.07250022888183594, 0.07695388793945312, 0.08140754699707031, 0.0858612060546875, 0.09031486511230469, 0.09476852416992188, 0.09922218322753906, 0.10367584228515625, 0.10812950134277344, 0.11258316040039062, 0.11703681945800781, 0.121490478515625, 0.1259441375732422, 0.13039779663085938, 0.13485145568847656, 0.13930511474609375, 0.14375877380371094, 0.14821243286132812, 0.1526660919189453, 0.1571197509765625, 0.1615734100341797, 0.16602706909179688, 0.17048072814941406, 0.17493438720703125, 0.17938804626464844, 0.18384170532226562, 0.1882953643798828, 0.1927490234375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 1.0, 3.0, 8.0, 0.0, 3.0, 4.0, 7.0, 13.0, 9.0, 14.0, 11.0, 24.0, 16.0, 22.0, 32.0, 46.0, 34.0, 63.0, 62.0, 81.0, 71.0, 70.0, 59.0, 60.0, 38.0, 44.0, 37.0, 34.0, 24.0, 22.0, 15.0, 10.0, 12.0, 7.0, 14.0, 4.0, 9.0, 1.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.07110595703125, -0.06917905807495117, -0.06725215911865234, -0.06532526016235352, -0.06339836120605469, -0.06147146224975586, -0.05954456329345703, -0.0576176643371582, -0.055690765380859375, -0.05376386642456055, -0.05183696746826172, -0.04991006851196289, -0.04798316955566406, -0.046056270599365234, -0.044129371643066406, -0.04220247268676758, -0.04027557373046875, -0.03834867477416992, -0.036421775817871094, -0.034494876861572266, -0.03256797790527344, -0.03064107894897461, -0.02871417999267578, -0.026787281036376953, -0.024860382080078125, -0.022933483123779297, -0.02100658416748047, -0.01907968521118164, -0.017152786254882812, -0.015225887298583984, -0.013298988342285156, -0.011372089385986328, -0.0094451904296875, -0.007518291473388672, -0.005591392517089844, -0.0036644935607910156, -0.0017375946044921875, 0.00018930435180664062, 0.0021162033081054688, 0.004043102264404297, 0.005970001220703125, 0.007896900177001953, 0.009823799133300781, 0.01175069808959961, 0.013677597045898438, 0.015604496002197266, 0.017531394958496094, 0.019458293914794922, 0.02138519287109375, 0.023312091827392578, 0.025238990783691406, 0.027165889739990234, 0.029092788696289062, 0.03101968765258789, 0.03294658660888672, 0.03487348556518555, 0.036800384521484375, 0.0387272834777832, 0.04065418243408203, 0.04258108139038086, 0.04450798034667969, 0.046434879302978516, 0.048361778259277344, 0.05028867721557617, 0.052215576171875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 13.0, 30.0, 76.0, 144.0, 259.0, 234.0, 119.0, 57.0, 30.0, 13.0, 7.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.2298762798309326, -2.172567367553711, -2.1152584552764893, -2.0579495429992676, -2.000640630722046, -1.9433315992355347, -1.886022686958313, -1.8287137746810913, -1.7714048624038696, -1.714095950126648, -1.6567870378494263, -1.599478006362915, -1.5421690940856934, -1.4848601818084717, -1.42755126953125, -1.3702423572540283, -1.3129334449768066, -1.255624532699585, -1.1983156204223633, -1.1410067081451416, -1.0836976766586304, -1.0263887643814087, -0.969079852104187, -0.9117709398269653, -0.8544619083404541, -0.7971529960632324, -0.739844024181366, -0.6825351119041443, -0.6252261996269226, -0.5679172277450562, -0.5106083154678345, -0.4532994031906128, -0.3959904909133911, -0.33868154883384705, -0.28137263655662537, -0.2240636944770813, -0.16675476729869843, -0.10944584012031555, -0.052136898040771484, 0.005172014236450195, 0.06248095631599426, 0.11978988349437714, 0.17709881067276, 0.23440775275230408, 0.29171669483184814, 0.3490256071090698, 0.4063345491886139, 0.46364346146583557, 0.5209524035453796, 0.5782613158226013, 0.6355702877044678, 0.6928791999816895, 0.7501881122589111, 0.8074970245361328, 0.8648059964179993, 0.922114908695221, 0.9794238805770874, 1.036732792854309, 1.0940417051315308, 1.151350736618042, 1.2086596488952637, 1.2659685611724854, 1.323277473449707, 1.3805863857269287, 1.4378952980041504]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 0.0, 7.0, 9.0, 8.0, 5.0, 12.0, 12.0, 12.0, 12.0, 17.0, 20.0, 21.0, 17.0, 35.0, 25.0, 41.0, 36.0, 44.0, 46.0, 49.0, 62.0, 51.0, 45.0, 48.0, 44.0, 46.0, 35.0, 32.0, 29.0, 34.0, 27.0, 24.0, 20.0, 15.0, 11.0, 4.0, 11.0, 11.0, 4.0, 9.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7336015105247498, -0.7075657248497009, -0.6815299391746521, -0.6554941534996033, -0.6294583082199097, -0.6034225225448608, -0.577386736869812, -0.5513509511947632, -0.5253151655197144, -0.4992793798446655, -0.4732435941696167, -0.4472077786922455, -0.42117199301719666, -0.3951362073421478, -0.3691003918647766, -0.3430646061897278, -0.31702882051467896, -0.2909930348396301, -0.2649572491645813, -0.23892143368721008, -0.21288564801216125, -0.18684986233711243, -0.1608140617609024, -0.13477826118469238, -0.10874247550964355, -0.08270668238401413, -0.056670889258384705, -0.03063509613275528, -0.0045993030071258545, 0.021436482667922974, 0.047472283244132996, 0.07350808382034302, 0.09954386949539185, 0.12557965517044067, 0.1516154557466507, 0.17765125632286072, 0.20368704199790955, 0.22972282767295837, 0.2557586431503296, 0.2817944288253784, 0.30783021450042725, 0.3338660001754761, 0.3599017858505249, 0.3859376013278961, 0.41197338700294495, 0.4380091726779938, 0.464044988155365, 0.4900807738304138, 0.5161165595054626, 0.5421523451805115, 0.5681881308555603, 0.5942239165306091, 0.6202597618103027, 0.6462955474853516, 0.6723313331604004, 0.6983671188354492, 0.724402904510498, 0.7504386901855469, 0.7764744758605957, 0.8025102615356445, 0.8285460472106934, 0.8545818328857422, 0.8806176781654358, 0.9066534638404846, 0.9326892495155334]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 10.0, 6.0, 17.0, 11.0, 19.0, 41.0, 57.0, 89.0, 154.0, 249.0, 379.0, 633.0, 1154.0, 2127.0, 4255.0, 9212.0, 23001.0, 69972.0, 314080.0, 1936222.0, 1502900.0, 236949.0, 56726.0, 19656.0, 8150.0, 3741.0, 1896.0, 1055.0, 570.0, 373.0, 219.0, 135.0, 70.0, 66.0, 30.0, 25.0, 15.0, 10.0, 2.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.073974609375, -0.07158184051513672, -0.06918907165527344, -0.06679630279541016, -0.06440353393554688, -0.062010765075683594, -0.05961799621582031, -0.05722522735595703, -0.05483245849609375, -0.05243968963623047, -0.05004692077636719, -0.047654151916503906, -0.045261383056640625, -0.042868614196777344, -0.04047584533691406, -0.03808307647705078, -0.0356903076171875, -0.03329753875732422, -0.030904769897460938, -0.028512001037597656, -0.026119232177734375, -0.023726463317871094, -0.021333694458007812, -0.01894092559814453, -0.01654815673828125, -0.014155387878417969, -0.011762619018554688, -0.009369850158691406, -0.006977081298828125, -0.004584312438964844, -0.0021915435791015625, 0.00020122528076171875, 0.002593994140625, 0.004986763000488281, 0.0073795318603515625, 0.009772300720214844, 0.012165069580078125, 0.014557838439941406, 0.016950607299804688, 0.01934337615966797, 0.02173614501953125, 0.02412891387939453, 0.026521682739257812, 0.028914451599121094, 0.031307220458984375, 0.033699989318847656, 0.03609275817871094, 0.03848552703857422, 0.0408782958984375, 0.04327106475830078, 0.04566383361816406, 0.048056602478027344, 0.050449371337890625, 0.052842140197753906, 0.05523490905761719, 0.05762767791748047, 0.06002044677734375, 0.06241321563720703, 0.06480598449707031, 0.0671987533569336, 0.06959152221679688, 0.07198429107666016, 0.07437705993652344, 0.07676982879638672, 0.07916259765625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 9.0, 8.0, 6.0, 13.0, 20.0, 24.0, 25.0, 45.0, 40.0, 65.0, 66.0, 64.0, 56.0, 66.0, 73.0, 54.0, 63.0, 49.0, 49.0, 41.0, 39.0, 35.0, 21.0, 20.0, 13.0, 14.0, 12.0, 4.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.058013916015625, -0.056078433990478516, -0.05414295196533203, -0.05220746994018555, -0.05027198791503906, -0.04833650588989258, -0.046401023864746094, -0.04446554183959961, -0.042530059814453125, -0.04059457778930664, -0.038659095764160156, -0.03672361373901367, -0.03478813171386719, -0.0328526496887207, -0.03091716766357422, -0.028981685638427734, -0.02704620361328125, -0.025110721588134766, -0.02317523956298828, -0.021239757537841797, -0.019304275512695312, -0.017368793487548828, -0.015433311462402344, -0.01349782943725586, -0.011562347412109375, -0.00962686538696289, -0.007691383361816406, -0.005755901336669922, -0.0038204193115234375, -0.0018849372863769531, 5.054473876953125e-05, 0.0019860267639160156, 0.0039215087890625, 0.005856990814208984, 0.007792472839355469, 0.009727954864501953, 0.011663436889648438, 0.013598918914794922, 0.015534400939941406, 0.01746988296508789, 0.019405364990234375, 0.02134084701538086, 0.023276329040527344, 0.025211811065673828, 0.027147293090820312, 0.029082775115966797, 0.03101825714111328, 0.032953739166259766, 0.03488922119140625, 0.036824703216552734, 0.03876018524169922, 0.0406956672668457, 0.04263114929199219, 0.04456663131713867, 0.046502113342285156, 0.04843759536743164, 0.050373077392578125, 0.05230855941772461, 0.054244041442871094, 0.05617952346801758, 0.05811500549316406, 0.06005048751831055, 0.06198596954345703, 0.06392145156860352, 0.06585693359375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 12.0, 7.0, 15.0, 33.0, 59.0, 92.0, 174.0, 357.0, 837.0, 2199.0, 7944.0, 45736.0, 735840.0, 3252189.0, 125738.0, 16393.0, 3954.0, 1387.0, 601.0, 313.0, 165.0, 82.0, 56.0, 26.0, 27.0, 23.0, 8.0, 6.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.259033203125, -0.2524280548095703, -0.24582290649414062, -0.23921775817871094, -0.23261260986328125, -0.22600746154785156, -0.21940231323242188, -0.2127971649169922, -0.2061920166015625, -0.1995868682861328, -0.19298171997070312, -0.18637657165527344, -0.17977142333984375, -0.17316627502441406, -0.16656112670898438, -0.1599559783935547, -0.153350830078125, -0.1467456817626953, -0.14014053344726562, -0.13353538513183594, -0.12693023681640625, -0.12032508850097656, -0.11371994018554688, -0.10711479187011719, -0.1005096435546875, -0.09390449523925781, -0.08729934692382812, -0.08069419860839844, -0.07408905029296875, -0.06748390197753906, -0.060878753662109375, -0.05427360534667969, -0.04766845703125, -0.04106330871582031, -0.034458160400390625, -0.027853012084960938, -0.02124786376953125, -0.014642715454101562, -0.008037567138671875, -0.0014324188232421875, 0.0051727294921875, 0.011777877807617188, 0.018383026123046875, 0.024988174438476562, 0.03159332275390625, 0.03819847106933594, 0.044803619384765625, 0.05140876770019531, 0.058013916015625, 0.06461906433105469, 0.07122421264648438, 0.07782936096191406, 0.08443450927734375, 0.09103965759277344, 0.09764480590820312, 0.10424995422363281, 0.1108551025390625, 0.11746025085449219, 0.12406539916992188, 0.13067054748535156, 0.13727569580078125, 0.14388084411621094, 0.15048599243164062, 0.1570911407470703, 0.1636962890625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 5.0, 4.0, 4.0, 9.0, 17.0, 25.0, 29.0, 49.0, 57.0, 78.0, 138.0, 257.0, 451.0, 757.0, 777.0, 536.0, 329.0, 185.0, 120.0, 68.0, 53.0, 35.0, 27.0, 21.0, 10.0, 4.0, 6.0, 5.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1484375, -0.14253616333007812, -0.13663482666015625, -0.13073348999023438, -0.1248321533203125, -0.11893081665039062, -0.11302947998046875, -0.10712814331054688, -0.101226806640625, -0.09532546997070312, -0.08942413330078125, -0.08352279663085938, -0.0776214599609375, -0.07172012329101562, -0.06581878662109375, -0.059917449951171875, -0.05401611328125, -0.048114776611328125, -0.04221343994140625, -0.036312103271484375, -0.0304107666015625, -0.024509429931640625, -0.01860809326171875, -0.012706756591796875, -0.006805419921875, -0.000904083251953125, 0.00499725341796875, 0.010898590087890625, 0.0167999267578125, 0.022701263427734375, 0.02860260009765625, 0.034503936767578125, 0.0404052734375, 0.046306610107421875, 0.05220794677734375, 0.058109283447265625, 0.0640106201171875, 0.06991195678710938, 0.07581329345703125, 0.08171463012695312, 0.087615966796875, 0.09351730346679688, 0.09941864013671875, 0.10531997680664062, 0.1112213134765625, 0.11712265014648438, 0.12302398681640625, 0.12892532348632812, 0.13482666015625, 0.14072799682617188, 0.14662933349609375, 0.15253067016601562, 0.1584320068359375, 0.16433334350585938, 0.17023468017578125, 0.17613601684570312, 0.182037353515625, 0.18793869018554688, 0.19384002685546875, 0.19974136352539062, 0.2056427001953125, 0.21154403686523438, 0.21744537353515625, 0.22334671020507812, 0.229248046875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 18.0, 73.0, 233.0, 371.0, 221.0, 46.0, 12.0, 5.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5941085815429688, -2.4825284481048584, -2.370948314666748, -2.2593679428100586, -2.1477878093719482, -2.036207675933838, -1.924627423286438, -1.813047170639038, -1.7014670372009277, -1.5898869037628174, -1.4783066511154175, -1.3667263984680176, -1.2551462650299072, -1.1435661315917969, -1.031985878944397, -0.9204056859016418, -0.8088254928588867, -0.6972452998161316, -0.5856651067733765, -0.47408491373062134, -0.3625047206878662, -0.2509245276451111, -0.13934433460235596, -0.02776414155960083, 0.0838160514831543, 0.19539624452590942, 0.30697643756866455, 0.4185566306114197, 0.5301368236541748, 0.6417170166969299, 0.7532972097396851, 0.8648774027824402, 0.9764575958251953, 1.0880377292633057, 1.1996179819107056, 1.3111982345581055, 1.4227783679962158, 1.5343585014343262, 1.645938754081726, 1.757519006729126, 1.8690991401672363, 1.9806792736053467, 2.092259407043457, 2.2038397789001465, 2.315419912338257, 2.427000045776367, 2.5385804176330566, 2.650160551071167, 2.7617406845092773, 2.8733208179473877, 2.984900951385498, 3.0964813232421875, 3.208061456680298, 3.319641590118408, 3.4312219619750977, 3.542802095413208, 3.6543822288513184, 3.7659623622894287, 3.877542495727539, 3.9891228675842285, 4.100703239440918, 4.212283134460449, 4.323863506317139, 4.43544340133667, 4.547023773193359]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 5.0, 7.0, 5.0, 6.0, 10.0, 12.0, 17.0, 14.0, 27.0, 21.0, 36.0, 24.0, 38.0, 35.0, 41.0, 39.0, 36.0, 42.0, 42.0, 38.0, 39.0, 41.0, 40.0, 61.0, 35.0, 38.0, 31.0, 35.0, 27.0, 27.0, 19.0, 20.0, 16.0, 8.0, 13.0, 10.0, 10.0, 3.0, 11.0, 6.0, 2.0, 1.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8110286593437195, -0.786143958568573, -0.7612591981887817, -0.7363744974136353, -0.711489737033844, -0.6866050362586975, -0.6617202758789062, -0.6368355751037598, -0.6119508743286133, -0.5870661735534668, -0.5621814131736755, -0.537296712398529, -0.5124119520187378, -0.4875272512435913, -0.46264252066612244, -0.43775779008865356, -0.4128730297088623, -0.38798829913139343, -0.36310356855392456, -0.3382188677787781, -0.3133341073989868, -0.28844940662384033, -0.26356467604637146, -0.2386799454689026, -0.21379521489143372, -0.18891048431396484, -0.16402575373649597, -0.1391410380601883, -0.11425630748271942, -0.08937157690525055, -0.06448686122894287, -0.039602130651474, -0.014717400074005127, 0.010167326778173447, 0.03505205363035202, 0.059936776757240295, 0.08482150733470917, 0.10970623791217804, 0.13459095358848572, 0.1594756841659546, 0.18436041474342346, 0.20924514532089233, 0.2341298758983612, 0.2590146064758301, 0.28389930725097656, 0.3087840676307678, 0.3336687684059143, 0.3585534989833832, 0.38343822956085205, 0.4083229601383209, 0.4332076907157898, 0.4580923914909363, 0.48297715187072754, 0.507861852645874, 0.5327465534210205, 0.5576313138008118, 0.582516074180603, 0.6074007749557495, 0.6322855353355408, 0.6571702361106873, 0.6820549964904785, 0.706939697265625, 0.7318243980407715, 0.7567091584205627, 0.7815938591957092]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 5.0, 4.0, 5.0, 4.0, 7.0, 6.0, 10.0, 30.0, 55.0, 49.0, 111.0, 170.0, 270.0, 450.0, 918.0, 1820.0, 4002.0, 9630.0, 25722.0, 74489.0, 237077.0, 432107.0, 172495.0, 55605.0, 19577.0, 7449.0, 3137.0, 1512.0, 789.0, 453.0, 216.0, 144.0, 99.0, 41.0, 34.0, 23.0, 18.0, 12.0, 6.0, 2.0, 1.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.092529296875, -0.08873176574707031, -0.08493423461914062, -0.08113670349121094, -0.07733917236328125, -0.07354164123535156, -0.06974411010742188, -0.06594657897949219, -0.0621490478515625, -0.05835151672363281, -0.054553985595703125, -0.05075645446777344, -0.04695892333984375, -0.04316139221191406, -0.039363861083984375, -0.03556632995605469, -0.031768798828125, -0.027971267700195312, -0.024173736572265625, -0.020376205444335938, -0.01657867431640625, -0.012781143188476562, -0.008983612060546875, -0.0051860809326171875, -0.0013885498046875, 0.0024089813232421875, 0.006206512451171875, 0.010004043579101562, 0.01380157470703125, 0.017599105834960938, 0.021396636962890625, 0.025194168090820312, 0.02899169921875, 0.03278923034667969, 0.036586761474609375, 0.04038429260253906, 0.04418182373046875, 0.04797935485839844, 0.051776885986328125, 0.05557441711425781, 0.0593719482421875, 0.06316947937011719, 0.06696701049804688, 0.07076454162597656, 0.07456207275390625, 0.07835960388183594, 0.08215713500976562, 0.08595466613769531, 0.089752197265625, 0.09354972839355469, 0.09734725952148438, 0.10114479064941406, 0.10494232177734375, 0.10873985290527344, 0.11253738403320312, 0.11633491516113281, 0.1201324462890625, 0.12392997741699219, 0.12772750854492188, 0.13152503967285156, 0.13532257080078125, 0.13912010192871094, 0.14291763305664062, 0.1467151641845703, 0.1505126953125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 6.0, 5.0, 6.0, 8.0, 14.0, 5.0, 20.0, 17.0, 21.0, 26.0, 24.0, 23.0, 32.0, 36.0, 38.0, 36.0, 47.0, 37.0, 49.0, 47.0, 48.0, 47.0, 45.0, 37.0, 43.0, 45.0, 35.0, 33.0, 28.0, 19.0, 28.0, 9.0, 19.0, 13.0, 12.0, 9.0, 8.0, 5.0, 6.0, 7.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041168212890625, -0.03974723815917969, -0.038326263427734375, -0.03690528869628906, -0.03548431396484375, -0.03406333923339844, -0.032642364501953125, -0.031221389770507812, -0.0298004150390625, -0.028379440307617188, -0.026958465576171875, -0.025537490844726562, -0.02411651611328125, -0.022695541381835938, -0.021274566650390625, -0.019853591918945312, -0.0184326171875, -0.017011642456054688, -0.015590667724609375, -0.014169692993164062, -0.01274871826171875, -0.011327743530273438, -0.009906768798828125, -0.008485794067382812, -0.0070648193359375, -0.0056438446044921875, -0.004222869873046875, -0.0028018951416015625, -0.00138092041015625, 4.00543212890625e-05, 0.001461029052734375, 0.0028820037841796875, 0.004302978515625, 0.0057239532470703125, 0.007144927978515625, 0.008565902709960938, 0.00998687744140625, 0.011407852172851562, 0.012828826904296875, 0.014249801635742188, 0.0156707763671875, 0.017091751098632812, 0.018512725830078125, 0.019933700561523438, 0.02135467529296875, 0.022775650024414062, 0.024196624755859375, 0.025617599487304688, 0.02703857421875, 0.028459548950195312, 0.029880523681640625, 0.03130149841308594, 0.03272247314453125, 0.03414344787597656, 0.035564422607421875, 0.03698539733886719, 0.0384063720703125, 0.03982734680175781, 0.041248321533203125, 0.04266929626464844, 0.04409027099609375, 0.04551124572753906, 0.046932220458984375, 0.04835319519042969, 0.049774169921875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 5.0, 3.0, 11.0, 10.0, 11.0, 16.0, 20.0, 18.0, 36.0, 46.0, 99.0, 143.0, 228.0, 398.0, 696.0, 1409.0, 2944.0, 8268.0, 38915.0, 585055.0, 364620.0, 32447.0, 7445.0, 2719.0, 1333.0, 673.0, 353.0, 213.0, 147.0, 90.0, 54.0, 36.0, 29.0, 30.0, 11.0, 8.0, 6.0, 3.0, 2.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.26611328125, -0.2580375671386719, -0.24996185302734375, -0.24188613891601562, -0.2338104248046875, -0.22573471069335938, -0.21765899658203125, -0.20958328247070312, -0.201507568359375, -0.19343185424804688, -0.18535614013671875, -0.17728042602539062, -0.1692047119140625, -0.16112899780273438, -0.15305328369140625, -0.14497756958007812, -0.13690185546875, -0.12882614135742188, -0.12075042724609375, -0.11267471313476562, -0.1045989990234375, -0.09652328491210938, -0.08844757080078125, -0.08037185668945312, -0.072296142578125, -0.06422042846679688, -0.05614471435546875, -0.048069000244140625, -0.0399932861328125, -0.031917572021484375, -0.02384185791015625, -0.015766143798828125, -0.0076904296875, 0.000385284423828125, 0.00846099853515625, 0.016536712646484375, 0.0246124267578125, 0.032688140869140625, 0.04076385498046875, 0.048839569091796875, 0.056915283203125, 0.06499099731445312, 0.07306671142578125, 0.08114242553710938, 0.0892181396484375, 0.09729385375976562, 0.10536956787109375, 0.11344528198242188, 0.12152099609375, 0.12959671020507812, 0.13767242431640625, 0.14574813842773438, 0.1538238525390625, 0.16189956665039062, 0.16997528076171875, 0.17805099487304688, 0.186126708984375, 0.19420242309570312, 0.20227813720703125, 0.21035385131835938, 0.2184295654296875, 0.22650527954101562, 0.23458099365234375, 0.24265670776367188, 0.250732421875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 0.0, 5.0, 3.0, 4.0, 6.0, 3.0, 6.0, 14.0, 7.0, 9.0, 13.0, 26.0, 29.0, 18.0, 25.0, 25.0, 38.0, 44.0, 41.0, 50.0, 49.0, 49.0, 46.0, 41.0, 33.0, 39.0, 53.0, 35.0, 45.0, 39.0, 21.0, 25.0, 31.0, 24.0, 17.0, 16.0, 16.0, 12.0, 11.0, 8.0, 6.0, 3.0, 4.0, 4.0, 1.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.2408447265625, -0.23380661010742188, -0.22676849365234375, -0.21973037719726562, -0.2126922607421875, -0.20565414428710938, -0.19861602783203125, -0.19157791137695312, -0.184539794921875, -0.17750167846679688, -0.17046356201171875, -0.16342544555664062, -0.1563873291015625, -0.14934921264648438, -0.14231109619140625, -0.13527297973632812, -0.12823486328125, -0.12119674682617188, -0.11415863037109375, -0.10712051391601562, -0.1000823974609375, -0.09304428100585938, -0.08600616455078125, -0.07896804809570312, -0.071929931640625, -0.06489181518554688, -0.05785369873046875, -0.050815582275390625, -0.0437774658203125, -0.036739349365234375, -0.02970123291015625, -0.022663116455078125, -0.015625, -0.008586883544921875, -0.00154876708984375, 0.005489349365234375, 0.0125274658203125, 0.019565582275390625, 0.02660369873046875, 0.033641815185546875, 0.040679931640625, 0.047718048095703125, 0.05475616455078125, 0.061794281005859375, 0.0688323974609375, 0.07587051391601562, 0.08290863037109375, 0.08994674682617188, 0.09698486328125, 0.10402297973632812, 0.11106109619140625, 0.11809921264648438, 0.1251373291015625, 0.13217544555664062, 0.13921356201171875, 0.14625167846679688, 0.153289794921875, 0.16032791137695312, 0.16736602783203125, 0.17440414428710938, 0.1814422607421875, 0.18848037719726562, 0.19551849365234375, 0.20255661010742188, 0.2095947265625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 7.0, 8.0, 11.0, 17.0, 14.0, 24.0, 32.0, 43.0, 75.0, 113.0, 177.0, 279.0, 509.0, 901.0, 1921.0, 4802.0, 14279.0, 54922.0, 266332.0, 577379.0, 92350.0, 22243.0, 6843.0, 2650.0, 1161.0, 556.0, 332.0, 209.0, 94.0, 78.0, 58.0, 37.0, 28.0, 23.0, 12.0, 9.0, 8.0, 11.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.06561279296875, -0.0635080337524414, -0.06140327453613281, -0.05929851531982422, -0.057193756103515625, -0.05508899688720703, -0.05298423767089844, -0.050879478454589844, -0.04877471923828125, -0.046669960021972656, -0.04456520080566406, -0.04246044158935547, -0.040355682373046875, -0.03825092315673828, -0.03614616394042969, -0.034041404724121094, -0.0319366455078125, -0.029831886291503906, -0.027727127075195312, -0.02562236785888672, -0.023517608642578125, -0.02141284942626953, -0.019308090209960938, -0.017203330993652344, -0.01509857177734375, -0.012993812561035156, -0.010889053344726562, -0.008784294128417969, -0.006679534912109375, -0.004574775695800781, -0.0024700164794921875, -0.00036525726318359375, 0.001739501953125, 0.0038442611694335938, 0.0059490203857421875, 0.008053779602050781, 0.010158538818359375, 0.012263298034667969, 0.014368057250976562, 0.016472816467285156, 0.01857757568359375, 0.020682334899902344, 0.022787094116210938, 0.02489185333251953, 0.026996612548828125, 0.02910137176513672, 0.031206130981445312, 0.033310890197753906, 0.0354156494140625, 0.037520408630371094, 0.03962516784667969, 0.04172992706298828, 0.043834686279296875, 0.04593944549560547, 0.04804420471191406, 0.050148963928222656, 0.05225372314453125, 0.054358482360839844, 0.05646324157714844, 0.05856800079345703, 0.060672760009765625, 0.06277751922607422, 0.06488227844238281, 0.0669870376586914, 0.069091796875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 3.0, 5.0, 4.0, 8.0, 2.0, 12.0, 11.0, 16.0, 16.0, 20.0, 14.0, 19.0, 18.0, 25.0, 37.0, 32.0, 41.0, 69.0, 65.0, 63.0, 60.0, 68.0, 64.0, 52.0, 37.0, 32.0, 30.0, 27.0, 16.0, 14.0, 16.0, 20.0, 11.0, 11.0, 13.0, 9.0, 8.0, 8.0, 6.0, 6.0, 1.0, 4.0, 5.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-2.2530555725097656e-05, -2.1889805793762207e-05, -2.1249055862426758e-05, -2.060830593109131e-05, -1.996755599975586e-05, -1.932680606842041e-05, -1.868605613708496e-05, -1.8045306205749512e-05, -1.7404556274414062e-05, -1.6763806343078613e-05, -1.6123056411743164e-05, -1.5482306480407715e-05, -1.4841556549072266e-05, -1.4200806617736816e-05, -1.3560056686401367e-05, -1.2919306755065918e-05, -1.2278556823730469e-05, -1.163780689239502e-05, -1.099705696105957e-05, -1.0356307029724121e-05, -9.715557098388672e-06, -9.074807167053223e-06, -8.434057235717773e-06, -7.793307304382324e-06, -7.152557373046875e-06, -6.511807441711426e-06, -5.8710575103759766e-06, -5.230307579040527e-06, -4.589557647705078e-06, -3.948807716369629e-06, -3.3080577850341797e-06, -2.6673078536987305e-06, -2.0265579223632812e-06, -1.385807991027832e-06, -7.450580596923828e-07, -1.043081283569336e-07, 5.364418029785156e-07, 1.1771917343139648e-06, 1.817941665649414e-06, 2.4586915969848633e-06, 3.0994415283203125e-06, 3.7401914596557617e-06, 4.380941390991211e-06, 5.02169132232666e-06, 5.662441253662109e-06, 6.303191184997559e-06, 6.943941116333008e-06, 7.584691047668457e-06, 8.225440979003906e-06, 8.866190910339355e-06, 9.506940841674805e-06, 1.0147690773010254e-05, 1.0788440704345703e-05, 1.1429190635681152e-05, 1.2069940567016602e-05, 1.271069049835205e-05, 1.33514404296875e-05, 1.399219036102295e-05, 1.4632940292358398e-05, 1.5273690223693848e-05, 1.5914440155029297e-05, 1.6555190086364746e-05, 1.7195940017700195e-05, 1.7836689949035645e-05, 1.8477439880371094e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 6.0, 5.0, 11.0, 15.0, 29.0, 38.0, 34.0, 67.0, 109.0, 207.0, 380.0, 705.0, 1419.0, 3426.0, 10798.0, 55975.0, 595272.0, 327032.0, 39186.0, 8195.0, 2898.0, 1265.0, 646.0, 332.0, 184.0, 100.0, 82.0, 48.0, 21.0, 16.0, 12.0, 9.0, 8.0, 3.0, 5.0, 7.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.09576416015625, -0.09323787689208984, -0.09071159362792969, -0.08818531036376953, -0.08565902709960938, -0.08313274383544922, -0.08060646057128906, -0.0780801773071289, -0.07555389404296875, -0.0730276107788086, -0.07050132751464844, -0.06797504425048828, -0.06544876098632812, -0.06292247772216797, -0.06039619445800781, -0.057869911193847656, -0.0553436279296875, -0.052817344665527344, -0.05029106140136719, -0.04776477813720703, -0.045238494873046875, -0.04271221160888672, -0.04018592834472656, -0.037659645080566406, -0.03513336181640625, -0.032607078552246094, -0.030080795288085938, -0.02755451202392578, -0.025028228759765625, -0.02250194549560547, -0.019975662231445312, -0.017449378967285156, -0.014923095703125, -0.012396812438964844, -0.009870529174804688, -0.007344245910644531, -0.004817962646484375, -0.0022916793823242188, 0.0002346038818359375, 0.0027608871459960938, 0.00528717041015625, 0.007813453674316406, 0.010339736938476562, 0.012866020202636719, 0.015392303466796875, 0.01791858673095703, 0.020444869995117188, 0.022971153259277344, 0.0254974365234375, 0.028023719787597656, 0.030550003051757812, 0.03307628631591797, 0.035602569580078125, 0.03812885284423828, 0.04065513610839844, 0.043181419372558594, 0.04570770263671875, 0.048233985900878906, 0.05076026916503906, 0.05328655242919922, 0.055812835693359375, 0.05833911895751953, 0.06086540222167969, 0.06339168548583984, 0.06591796875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 8.0, 7.0, 11.0, 9.0, 15.0, 9.0, 18.0, 12.0, 16.0, 19.0, 29.0, 17.0, 40.0, 36.0, 39.0, 43.0, 54.0, 55.0, 58.0, 52.0, 45.0, 54.0, 46.0, 43.0, 32.0, 38.0, 22.0, 31.0, 17.0, 21.0, 17.0, 20.0, 14.0, 7.0, 12.0, 3.0, 5.0, 5.0, 7.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.0560302734375, -0.05443000793457031, -0.052829742431640625, -0.05122947692871094, -0.04962921142578125, -0.04802894592285156, -0.046428680419921875, -0.04482841491699219, -0.0432281494140625, -0.04162788391113281, -0.040027618408203125, -0.03842735290527344, -0.03682708740234375, -0.03522682189941406, -0.033626556396484375, -0.03202629089355469, -0.030426025390625, -0.028825759887695312, -0.027225494384765625, -0.025625228881835938, -0.02402496337890625, -0.022424697875976562, -0.020824432373046875, -0.019224166870117188, -0.0176239013671875, -0.016023635864257812, -0.014423370361328125, -0.012823104858398438, -0.01122283935546875, -0.009622573852539062, -0.008022308349609375, -0.0064220428466796875, -0.00482177734375, -0.0032215118408203125, -0.001621246337890625, -2.09808349609375e-05, 0.00157928466796875, 0.0031795501708984375, 0.004779815673828125, 0.0063800811767578125, 0.0079803466796875, 0.009580612182617188, 0.011180877685546875, 0.012781143188476562, 0.01438140869140625, 0.015981674194335938, 0.017581939697265625, 0.019182205200195312, 0.020782470703125, 0.022382736206054688, 0.023983001708984375, 0.025583267211914062, 0.02718353271484375, 0.028783798217773438, 0.030384063720703125, 0.03198432922363281, 0.0335845947265625, 0.03518486022949219, 0.036785125732421875, 0.03838539123535156, 0.03998565673828125, 0.04158592224121094, 0.043186187744140625, 0.04478645324707031, 0.04638671875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 13.0, 21.0, 23.0, 34.0, 68.0, 100.0, 162.0, 202.0, 139.0, 92.0, 57.0, 32.0, 12.0, 16.0, 10.0, 6.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.1225615739822388, -1.0796549320220947, -1.0367484092712402, -0.9938417673110962, -0.9509351253509521, -0.9080285429954529, -0.8651219606399536, -0.8222153186798096, -0.7793087363243103, -0.736402153968811, -0.693495512008667, -0.6505889296531677, -0.6076823472976685, -0.5647757053375244, -0.5218691229820251, -0.4789625108242035, -0.43605589866638184, -0.3931492865085602, -0.3502426743507385, -0.30733609199523926, -0.2644294798374176, -0.22152286767959595, -0.17861628532409668, -0.13570967316627502, -0.09280306100845337, -0.04989645630121231, -0.0069898515939712524, 0.03591674566268921, 0.07882335782051086, 0.12172996997833252, 0.1646365523338318, 0.20754316449165344, 0.25044965744018555, 0.2933562695980072, 0.33626288175582886, 0.3791694641113281, 0.4220760762691498, 0.46498268842697144, 0.5078892707824707, 0.5507959127426147, 0.593702495098114, 0.6366090774536133, 0.6795157194137573, 0.7224223017692566, 0.7653288841247559, 0.8082355260848999, 0.8511421084403992, 0.8940486907958984, 0.9369553327560425, 0.9798619151115417, 1.022768497467041, 1.065675139427185, 1.108581781387329, 1.1514883041381836, 1.1943949460983276, 1.2373015880584717, 1.2802081108093262, 1.3231147527694702, 1.3660212755203247, 1.4089279174804688, 1.4518345594406128, 1.4947412014007568, 1.5376477241516113, 1.5805543661117554, 1.6234610080718994]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 4.0, 0.0, 5.0, 1.0, 5.0, 5.0, 6.0, 8.0, 9.0, 6.0, 17.0, 13.0, 23.0, 18.0, 28.0, 27.0, 34.0, 42.0, 33.0, 42.0, 34.0, 65.0, 81.0, 57.0, 53.0, 55.0, 68.0, 36.0, 31.0, 32.0, 26.0, 15.0, 24.0, 12.0, 9.0, 14.0, 18.0, 14.0, 10.0, 3.0, 8.0, 7.0, 2.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-1.043489694595337, -1.0154638290405273, -0.9874380230903625, -0.9594122171401978, -0.931386411190033, -0.9033605456352234, -0.8753347396850586, -0.847308874130249, -0.8192830681800842, -0.7912572622299194, -0.7632313966751099, -0.7352055907249451, -0.7071797847747803, -0.6791539192199707, -0.6511281132698059, -0.6231023073196411, -0.5950764417648315, -0.5670506358146667, -0.5390247702598572, -0.5109989643096924, -0.4829731285572052, -0.454947292804718, -0.4269214868545532, -0.39889565110206604, -0.37086987495422363, -0.34284403920173645, -0.31481823325157166, -0.2867923974990845, -0.2587665617465973, -0.2307407408952713, -0.2027149200439453, -0.17468908429145813, -0.14666324853897095, -0.11863742023706436, -0.09061159193515778, -0.06258577108383179, -0.0345599427819252, -0.006534114480018616, 0.021491706371307373, 0.049517542123794556, 0.07754336297512054, 0.10556919127702713, 0.13359501957893372, 0.1616208404302597, 0.1896466612815857, 0.21767249703407288, 0.24569831788539886, 0.27372413873672485, 0.30174997448921204, 0.3297758102416992, 0.357801616191864, 0.3858274519443512, 0.4138532876968384, 0.4418790936470032, 0.46990492939949036, 0.49793076515197754, 0.5259565711021423, 0.5539823770523071, 0.5820082426071167, 0.6100340485572815, 0.6380598545074463, 0.6660857200622559, 0.6941115260124207, 0.7221373319625854, 0.750163197517395]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 8.0, 9.0, 21.0, 21.0, 44.0, 66.0, 116.0, 201.0, 413.0, 682.0, 1434.0, 2974.0, 6862.0, 16718.0, 49970.0, 197669.0, 1165404.0, 2159560.0, 452591.0, 93452.0, 27585.0, 9997.0, 4314.0, 1965.0, 1010.0, 513.0, 260.0, 163.0, 104.0, 66.0, 33.0, 13.0, 13.0, 9.0, 7.0, 9.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06207275390625, -0.05994987487792969, -0.057826995849609375, -0.05570411682128906, -0.05358123779296875, -0.05145835876464844, -0.049335479736328125, -0.04721260070800781, -0.0450897216796875, -0.04296684265136719, -0.040843963623046875, -0.03872108459472656, -0.03659820556640625, -0.03447532653808594, -0.032352447509765625, -0.030229568481445312, -0.028106689453125, -0.025983810424804688, -0.023860931396484375, -0.021738052368164062, -0.01961517333984375, -0.017492294311523438, -0.015369415283203125, -0.013246536254882812, -0.0111236572265625, -0.009000778198242188, -0.006877899169921875, -0.0047550201416015625, -0.00263214111328125, -0.0005092620849609375, 0.001613616943359375, 0.0037364959716796875, 0.005859375, 0.007982254028320312, 0.010105133056640625, 0.012228012084960938, 0.01435089111328125, 0.016473770141601562, 0.018596649169921875, 0.020719528198242188, 0.0228424072265625, 0.024965286254882812, 0.027088165283203125, 0.029211044311523438, 0.03133392333984375, 0.03345680236816406, 0.035579681396484375, 0.03770256042480469, 0.039825439453125, 0.04194831848144531, 0.044071197509765625, 0.04619407653808594, 0.04831695556640625, 0.05043983459472656, 0.052562713623046875, 0.05468559265136719, 0.0568084716796875, 0.05893135070800781, 0.061054229736328125, 0.06317710876464844, 0.06529998779296875, 0.06742286682128906, 0.06954574584960938, 0.07166862487792969, 0.07379150390625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 4.0, 9.0, 8.0, 14.0, 13.0, 16.0, 15.0, 17.0, 30.0, 27.0, 27.0, 30.0, 40.0, 52.0, 49.0, 37.0, 38.0, 62.0, 51.0, 49.0, 49.0, 40.0, 49.0, 43.0, 37.0, 45.0, 24.0, 26.0, 27.0, 18.0, 10.0, 13.0, 3.0, 8.0, 4.0, 4.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.047515869140625, -0.04597282409667969, -0.044429779052734375, -0.04288673400878906, -0.04134368896484375, -0.03980064392089844, -0.038257598876953125, -0.03671455383300781, -0.0351715087890625, -0.03362846374511719, -0.032085418701171875, -0.030542373657226562, -0.02899932861328125, -0.027456283569335938, -0.025913238525390625, -0.024370193481445312, -0.0228271484375, -0.021284103393554688, -0.019741058349609375, -0.018198013305664062, -0.01665496826171875, -0.015111923217773438, -0.013568878173828125, -0.012025833129882812, -0.0104827880859375, -0.008939743041992188, -0.007396697998046875, -0.0058536529541015625, -0.00431060791015625, -0.0027675628662109375, -0.001224517822265625, 0.0003185272216796875, 0.001861572265625, 0.0034046173095703125, 0.004947662353515625, 0.0064907073974609375, 0.00803375244140625, 0.009576797485351562, 0.011119842529296875, 0.012662887573242188, 0.0142059326171875, 0.015748977661132812, 0.017292022705078125, 0.018835067749023438, 0.02037811279296875, 0.021921157836914062, 0.023464202880859375, 0.025007247924804688, 0.02655029296875, 0.028093338012695312, 0.029636383056640625, 0.031179428100585938, 0.03272247314453125, 0.03426551818847656, 0.035808563232421875, 0.03735160827636719, 0.0388946533203125, 0.04043769836425781, 0.041980743408203125, 0.04352378845214844, 0.04506683349609375, 0.04660987854003906, 0.048152923583984375, 0.04969596862792969, 0.051239013671875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 6.0, 4.0, 4.0, 7.0, 7.0, 16.0, 18.0, 12.0, 56.0, 65.0, 79.0, 167.0, 266.0, 446.0, 929.0, 2264.0, 6368.0, 19486.0, 84292.0, 737673.0, 2976954.0, 295493.0, 48915.0, 13119.0, 4420.0, 1628.0, 662.0, 357.0, 204.0, 113.0, 87.0, 55.0, 30.0, 22.0, 16.0, 8.0, 9.0, 8.0, 5.0, 1.0, 7.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1156005859375, -0.11165809631347656, -0.10771560668945312, -0.10377311706542969, -0.09983062744140625, -0.09588813781738281, -0.09194564819335938, -0.08800315856933594, -0.0840606689453125, -0.08011817932128906, -0.07617568969726562, -0.07223320007324219, -0.06829071044921875, -0.06434822082519531, -0.060405731201171875, -0.05646324157714844, -0.052520751953125, -0.04857826232910156, -0.044635772705078125, -0.04069328308105469, -0.03675079345703125, -0.03280830383300781, -0.028865814208984375, -0.024923324584960938, -0.0209808349609375, -0.017038345336914062, -0.013095855712890625, -0.009153366088867188, -0.00521087646484375, -0.0012683868408203125, 0.002674102783203125, 0.0066165924072265625, 0.01055908203125, 0.014501571655273438, 0.018444061279296875, 0.022386550903320312, 0.02632904052734375, 0.030271530151367188, 0.034214019775390625, 0.03815650939941406, 0.0420989990234375, 0.04604148864746094, 0.049983978271484375, 0.05392646789550781, 0.05786895751953125, 0.06181144714355469, 0.06575393676757812, 0.06969642639160156, 0.073638916015625, 0.07758140563964844, 0.08152389526367188, 0.08546638488769531, 0.08940887451171875, 0.09335136413574219, 0.09729385375976562, 0.10123634338378906, 0.1051788330078125, 0.10912132263183594, 0.11306381225585938, 0.11700630187988281, 0.12094879150390625, 0.12489128112792969, 0.12883377075195312, 0.13277626037597656, 0.13671875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 3.0, 1.0, 3.0, 5.0, 8.0, 5.0, 10.0, 9.0, 8.0, 15.0, 17.0, 18.0, 38.0, 46.0, 45.0, 55.0, 69.0, 118.0, 158.0, 203.0, 276.0, 430.0, 522.0, 493.0, 372.0, 287.0, 229.0, 143.0, 123.0, 76.0, 69.0, 47.0, 28.0, 30.0, 25.0, 16.0, 11.0, 9.0, 5.0, 1.0, 14.0, 6.0, 8.0, 8.0, 4.0, 0.0, 3.0, 2.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.092529296875, -0.08933639526367188, -0.08614349365234375, -0.08295059204101562, -0.0797576904296875, -0.07656478881835938, -0.07337188720703125, -0.07017898559570312, -0.066986083984375, -0.06379318237304688, -0.06060028076171875, -0.057407379150390625, -0.0542144775390625, -0.051021575927734375, -0.04782867431640625, -0.044635772705078125, -0.04144287109375, -0.038249969482421875, -0.03505706787109375, -0.031864166259765625, -0.0286712646484375, -0.025478363037109375, -0.02228546142578125, -0.019092559814453125, -0.015899658203125, -0.012706756591796875, -0.00951385498046875, -0.006320953369140625, -0.0031280517578125, 6.4849853515625e-05, 0.00325775146484375, 0.006450653076171875, 0.0096435546875, 0.012836456298828125, 0.01602935791015625, 0.019222259521484375, 0.0224151611328125, 0.025608062744140625, 0.02880096435546875, 0.031993865966796875, 0.035186767578125, 0.038379669189453125, 0.04157257080078125, 0.044765472412109375, 0.0479583740234375, 0.051151275634765625, 0.05434417724609375, 0.057537078857421875, 0.06072998046875, 0.06392288208007812, 0.06711578369140625, 0.07030868530273438, 0.0735015869140625, 0.07669448852539062, 0.07988739013671875, 0.08308029174804688, 0.086273193359375, 0.08946609497070312, 0.09265899658203125, 0.09585189819335938, 0.0990447998046875, 0.10223770141601562, 0.10543060302734375, 0.10862350463867188, 0.11181640625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 6.0, 12.0, 25.0, 80.0, 164.0, 280.0, 219.0, 116.0, 51.0, 20.0, 9.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4146473407745361, -1.3522950410842896, -1.289942741394043, -1.2275904417037964, -1.1652381420135498, -1.1028858423233032, -1.0405335426330566, -0.9781813025474548, -0.9158290028572083, -0.8534767031669617, -0.7911244034767151, -0.7287721633911133, -0.6664198637008667, -0.6040675640106201, -0.5417152643203735, -0.47936296463012695, -0.41701066493988037, -0.3546583652496338, -0.2923060655593872, -0.229953795671463, -0.16760149598121643, -0.10524919629096985, -0.042896926403045654, 0.019455373287200928, 0.08180767297744751, 0.1441599726676941, 0.20651225745677948, 0.26886454224586487, 0.33121684193611145, 0.39356914162635803, 0.4559214115142822, 0.5182737112045288, 0.5806260108947754, 0.642978310585022, 0.7053306102752686, 0.7676829099655151, 0.8300352096557617, 0.8923875093460083, 0.9547397494316101, 1.017091989517212, 1.079444408416748, 1.1417967081069946, 1.2041490077972412, 1.2665013074874878, 1.3288536071777344, 1.391205906867981, 1.4535582065582275, 1.5159103870391846, 1.5782626867294312, 1.6406149864196777, 1.7029672861099243, 1.765319585800171, 1.8276718854904175, 1.890024185180664, 1.952376365661621, 2.0147287845611572, 2.0770809650421143, 2.1394331455230713, 2.2017855644226074, 2.2641377449035645, 2.3264901638031006, 2.3888423442840576, 2.4511947631835938, 2.513546943664551, 2.575899362564087]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 2.0, 8.0, 9.0, 12.0, 9.0, 10.0, 15.0, 19.0, 26.0, 20.0, 29.0, 25.0, 39.0, 35.0, 46.0, 47.0, 50.0, 50.0, 39.0, 57.0, 63.0, 48.0, 50.0, 37.0, 28.0, 30.0, 31.0, 33.0, 26.0, 22.0, 16.0, 14.0, 12.0, 9.0, 5.0, 9.0, 9.0, 6.0, 3.0, 1.0, 1.0, 2.0, 5.0, 1.0], "bins": [-0.7618774771690369, -0.7423037886619568, -0.7227301597595215, -0.7031564712524414, -0.6835827827453613, -0.6640090942382812, -0.6444354057312012, -0.6248617768287659, -0.6052880883216858, -0.5857143998146057, -0.5661407709121704, -0.5465670824050903, -0.5269933938980103, -0.5074197053909302, -0.4878460466861725, -0.4682723879814148, -0.4486986994743347, -0.42912501096725464, -0.40955135226249695, -0.38997769355773926, -0.3704040050506592, -0.3508303165435791, -0.3312566578388214, -0.3116829991340637, -0.29210931062698364, -0.27253562211990356, -0.2529619634151459, -0.233388289809227, -0.2138146162033081, -0.19424094259738922, -0.17466726899147034, -0.15509359538555145, -0.13551992177963257, -0.11594624817371368, -0.0963725745677948, -0.07679890096187592, -0.05722522735595703, -0.03765155375003815, -0.018077880144119263, 0.0014957934617996216, 0.021069467067718506, 0.04064314067363739, 0.060216814279556274, 0.07979048788547516, 0.09936416149139404, 0.11893783509731293, 0.1385115087032318, 0.1580851823091507, 0.17765885591506958, 0.19723252952098846, 0.21680620312690735, 0.23637987673282623, 0.2559535503387451, 0.2755272388458252, 0.2951008975505829, 0.3146745562553406, 0.33424824476242065, 0.35382193326950073, 0.3733955919742584, 0.3929692506790161, 0.4125429391860962, 0.43211662769317627, 0.45169028639793396, 0.47126394510269165, 0.49083763360977173]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 6.0, 7.0, 22.0, 15.0, 46.0, 50.0, 104.0, 193.0, 331.0, 685.0, 1342.0, 2837.0, 6480.0, 18029.0, 60192.0, 262146.0, 509846.0, 131878.0, 34696.0, 11213.0, 4406.0, 1966.0, 952.0, 502.0, 255.0, 135.0, 87.0, 52.0, 32.0, 27.0, 10.0, 5.0, 6.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1378173828125, -0.13341140747070312, -0.12900543212890625, -0.12459945678710938, -0.1201934814453125, -0.11578750610351562, -0.11138153076171875, -0.10697555541992188, -0.102569580078125, -0.09816360473632812, -0.09375762939453125, -0.08935165405273438, -0.0849456787109375, -0.08053970336914062, -0.07613372802734375, -0.07172775268554688, -0.06732177734375, -0.06291580200195312, -0.05850982666015625, -0.054103851318359375, -0.0496978759765625, -0.045291900634765625, -0.04088592529296875, -0.036479949951171875, -0.032073974609375, -0.027667999267578125, -0.02326202392578125, -0.018856048583984375, -0.0144500732421875, -0.010044097900390625, -0.00563812255859375, -0.001232147216796875, 0.003173828125, 0.007579803466796875, 0.01198577880859375, 0.016391754150390625, 0.0207977294921875, 0.025203704833984375, 0.02960968017578125, 0.034015655517578125, 0.038421630859375, 0.042827606201171875, 0.04723358154296875, 0.051639556884765625, 0.0560455322265625, 0.060451507568359375, 0.06485748291015625, 0.06926345825195312, 0.07366943359375, 0.07807540893554688, 0.08248138427734375, 0.08688735961914062, 0.0912933349609375, 0.09569931030273438, 0.10010528564453125, 0.10451126098632812, 0.108917236328125, 0.11332321166992188, 0.11772918701171875, 0.12213516235351562, 0.1265411376953125, 0.13094711303710938, 0.13535308837890625, 0.13975906372070312, 0.1441650390625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 7.0, 4.0, 7.0, 11.0, 5.0, 5.0, 11.0, 14.0, 22.0, 14.0, 22.0, 21.0, 46.0, 53.0, 38.0, 32.0, 46.0, 45.0, 55.0, 52.0, 55.0, 55.0, 38.0, 44.0, 47.0, 27.0, 43.0, 38.0, 36.0, 27.0, 17.0, 16.0, 13.0, 8.0, 10.0, 9.0, 1.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.05877685546875, -0.05713605880737305, -0.055495262145996094, -0.05385446548461914, -0.05221366882324219, -0.050572872161865234, -0.04893207550048828, -0.04729127883911133, -0.045650482177734375, -0.04400968551635742, -0.04236888885498047, -0.040728092193603516, -0.03908729553222656, -0.03744649887084961, -0.035805702209472656, -0.0341649055480957, -0.03252410888671875, -0.030883312225341797, -0.029242515563964844, -0.02760171890258789, -0.025960922241210938, -0.024320125579833984, -0.02267932891845703, -0.021038532257080078, -0.019397735595703125, -0.017756938934326172, -0.01611614227294922, -0.014475345611572266, -0.012834548950195312, -0.01119375228881836, -0.009552955627441406, -0.007912158966064453, -0.0062713623046875, -0.004630565643310547, -0.0029897689819335938, -0.0013489723205566406, 0.0002918243408203125, 0.0019326210021972656, 0.0035734176635742188, 0.005214214324951172, 0.006855010986328125, 0.008495807647705078, 0.010136604309082031, 0.011777400970458984, 0.013418197631835938, 0.01505899429321289, 0.016699790954589844, 0.018340587615966797, 0.01998138427734375, 0.021622180938720703, 0.023262977600097656, 0.02490377426147461, 0.026544570922851562, 0.028185367584228516, 0.02982616424560547, 0.03146696090698242, 0.033107757568359375, 0.03474855422973633, 0.03638935089111328, 0.038030147552490234, 0.03967094421386719, 0.04131174087524414, 0.042952537536621094, 0.04459333419799805, 0.046234130859375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 4.0, 9.0, 8.0, 12.0, 32.0, 43.0, 69.0, 118.0, 199.0, 414.0, 899.0, 2139.0, 7842.0, 60659.0, 844909.0, 114862.0, 11475.0, 2777.0, 1020.0, 455.0, 272.0, 124.0, 69.0, 45.0, 43.0, 16.0, 16.0, 11.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.249755859375, -0.24071121215820312, -0.23166656494140625, -0.22262191772460938, -0.2135772705078125, -0.20453262329101562, -0.19548797607421875, -0.18644332885742188, -0.177398681640625, -0.16835403442382812, -0.15930938720703125, -0.15026473999023438, -0.1412200927734375, -0.13217544555664062, -0.12313079833984375, -0.11408615112304688, -0.10504150390625, -0.09599685668945312, -0.08695220947265625, -0.07790756225585938, -0.0688629150390625, -0.059818267822265625, -0.05077362060546875, -0.041728973388671875, -0.032684326171875, -0.023639678955078125, -0.01459503173828125, -0.005550384521484375, 0.0034942626953125, 0.012538909912109375, 0.02158355712890625, 0.030628204345703125, 0.0396728515625, 0.048717498779296875, 0.05776214599609375, 0.06680679321289062, 0.0758514404296875, 0.08489608764648438, 0.09394073486328125, 0.10298538208007812, 0.112030029296875, 0.12107467651367188, 0.13011932373046875, 0.13916397094726562, 0.1482086181640625, 0.15725326538085938, 0.16629791259765625, 0.17534255981445312, 0.18438720703125, 0.19343185424804688, 0.20247650146484375, 0.21152114868164062, 0.2205657958984375, 0.22961044311523438, 0.23865509033203125, 0.24769973754882812, 0.256744384765625, 0.2657890319824219, 0.27483367919921875, 0.2838783264160156, 0.2929229736328125, 0.3019676208496094, 0.31101226806640625, 0.3200569152832031, 0.3291015625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 6.0, 5.0, 6.0, 7.0, 4.0, 9.0, 6.0, 10.0, 12.0, 14.0, 14.0, 18.0, 15.0, 20.0, 28.0, 27.0, 30.0, 35.0, 53.0, 28.0, 33.0, 38.0, 41.0, 35.0, 47.0, 47.0, 42.0, 42.0, 45.0, 39.0, 36.0, 26.0, 29.0, 18.0, 18.0, 14.0, 19.0, 12.0, 19.0, 9.0, 6.0, 9.0, 7.0, 3.0, 4.0, 4.0, 4.0, 3.0, 2.0, 5.0, 6.0, 2.0, 1.0, 1.0], "bins": [-0.1964111328125, -0.1906261444091797, -0.18484115600585938, -0.17905616760253906, -0.17327117919921875, -0.16748619079589844, -0.16170120239257812, -0.1559162139892578, -0.1501312255859375, -0.1443462371826172, -0.13856124877929688, -0.13277626037597656, -0.12699127197265625, -0.12120628356933594, -0.11542129516601562, -0.10963630676269531, -0.103851318359375, -0.09806632995605469, -0.09228134155273438, -0.08649635314941406, -0.08071136474609375, -0.07492637634277344, -0.06914138793945312, -0.06335639953613281, -0.0575714111328125, -0.05178642272949219, -0.046001434326171875, -0.04021644592285156, -0.03443145751953125, -0.028646469116210938, -0.022861480712890625, -0.017076492309570312, -0.01129150390625, -0.0055065155029296875, 0.000278472900390625, 0.0060634613037109375, 0.01184844970703125, 0.017633438110351562, 0.023418426513671875, 0.029203414916992188, 0.0349884033203125, 0.04077339172363281, 0.046558380126953125, 0.05234336853027344, 0.05812835693359375, 0.06391334533691406, 0.06969833374023438, 0.07548332214355469, 0.081268310546875, 0.08705329895019531, 0.09283828735351562, 0.09862327575683594, 0.10440826416015625, 0.11019325256347656, 0.11597824096679688, 0.12176322937011719, 0.1275482177734375, 0.1333332061767578, 0.13911819458007812, 0.14490318298339844, 0.15068817138671875, 0.15647315979003906, 0.16225814819335938, 0.1680431365966797, 0.173828125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 2.0, 2.0, 11.0, 8.0, 7.0, 7.0, 17.0, 29.0, 28.0, 53.0, 74.0, 89.0, 124.0, 216.0, 343.0, 560.0, 995.0, 1900.0, 4238.0, 10173.0, 30744.0, 111268.0, 556172.0, 240850.0, 59850.0, 17958.0, 6593.0, 2858.0, 1387.0, 776.0, 409.0, 267.0, 168.0, 105.0, 70.0, 63.0, 37.0, 22.0, 22.0, 12.0, 12.0, 14.0, 6.0, 5.0, 6.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.052337646484375, -0.05057954788208008, -0.048821449279785156, -0.047063350677490234, -0.04530525207519531, -0.04354715347290039, -0.04178905487060547, -0.04003095626831055, -0.038272857666015625, -0.0365147590637207, -0.03475666046142578, -0.03299856185913086, -0.031240463256835938, -0.029482364654541016, -0.027724266052246094, -0.025966167449951172, -0.02420806884765625, -0.022449970245361328, -0.020691871643066406, -0.018933773040771484, -0.017175674438476562, -0.01541757583618164, -0.013659477233886719, -0.011901378631591797, -0.010143280029296875, -0.008385181427001953, -0.006627082824707031, -0.004868984222412109, -0.0031108856201171875, -0.0013527870178222656, 0.00040531158447265625, 0.002163410186767578, 0.0039215087890625, 0.005679607391357422, 0.007437705993652344, 0.009195804595947266, 0.010953903198242188, 0.01271200180053711, 0.014470100402832031, 0.016228199005126953, 0.017986297607421875, 0.019744396209716797, 0.02150249481201172, 0.02326059341430664, 0.025018692016601562, 0.026776790618896484, 0.028534889221191406, 0.030292987823486328, 0.03205108642578125, 0.03380918502807617, 0.035567283630371094, 0.037325382232666016, 0.03908348083496094, 0.04084157943725586, 0.04259967803955078, 0.0443577766418457, 0.046115875244140625, 0.04787397384643555, 0.04963207244873047, 0.05139017105102539, 0.05314826965332031, 0.054906368255615234, 0.056664466857910156, 0.05842256546020508, 0.0601806640625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 5.0, 2.0, 2.0, 4.0, 5.0, 2.0, 8.0, 8.0, 12.0, 14.0, 21.0, 18.0, 30.0, 34.0, 32.0, 42.0, 65.0, 63.0, 52.0, 69.0, 76.0, 64.0, 71.0, 54.0, 31.0, 24.0, 31.0, 31.0, 26.0, 19.0, 15.0, 13.0, 16.0, 15.0, 5.0, 6.0, 3.0, 3.0, 3.0, 2.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.390146255493164e-05, -2.3271888494491577e-05, -2.2642314434051514e-05, -2.201274037361145e-05, -2.1383166313171387e-05, -2.0753592252731323e-05, -2.012401819229126e-05, -1.9494444131851196e-05, -1.8864870071411133e-05, -1.823529601097107e-05, -1.7605721950531006e-05, -1.6976147890090942e-05, -1.634657382965088e-05, -1.5716999769210815e-05, -1.5087425708770752e-05, -1.4457851648330688e-05, -1.3828277587890625e-05, -1.3198703527450562e-05, -1.2569129467010498e-05, -1.1939555406570435e-05, -1.1309981346130371e-05, -1.0680407285690308e-05, -1.0050833225250244e-05, -9.42125916481018e-06, -8.791685104370117e-06, -8.162111043930054e-06, -7.53253698348999e-06, -6.902962923049927e-06, -6.273388862609863e-06, -5.6438148021698e-06, -5.014240741729736e-06, -4.384666681289673e-06, -3.7550926208496094e-06, -3.125518560409546e-06, -2.4959444999694824e-06, -1.866370439529419e-06, -1.2367963790893555e-06, -6.07222318649292e-07, 2.2351741790771484e-08, 6.51925802230835e-07, 1.2814998626708984e-06, 1.911073923110962e-06, 2.5406479835510254e-06, 3.170222043991089e-06, 3.7997961044311523e-06, 4.429370164871216e-06, 5.058944225311279e-06, 5.688518285751343e-06, 6.318092346191406e-06, 6.94766640663147e-06, 7.577240467071533e-06, 8.206814527511597e-06, 8.83638858795166e-06, 9.465962648391724e-06, 1.0095536708831787e-05, 1.072511076927185e-05, 1.1354684829711914e-05, 1.1984258890151978e-05, 1.2613832950592041e-05, 1.3243407011032104e-05, 1.3872981071472168e-05, 1.4502555131912231e-05, 1.5132129192352295e-05, 1.576170325279236e-05, 1.6391277313232422e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 1.0, 2.0, 5.0, 10.0, 13.0, 11.0, 21.0, 25.0, 46.0, 56.0, 95.0, 147.0, 239.0, 435.0, 847.0, 1772.0, 4271.0, 13221.0, 59628.0, 501646.0, 388269.0, 57321.0, 12682.0, 4180.0, 1713.0, 769.0, 427.0, 279.0, 144.0, 99.0, 60.0, 34.0, 27.0, 16.0, 16.0, 10.0, 5.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0740966796875, -0.07191658020019531, -0.06973648071289062, -0.06755638122558594, -0.06537628173828125, -0.06319618225097656, -0.061016082763671875, -0.05883598327636719, -0.0566558837890625, -0.05447578430175781, -0.052295684814453125, -0.05011558532714844, -0.04793548583984375, -0.04575538635253906, -0.043575286865234375, -0.04139518737792969, -0.039215087890625, -0.03703498840332031, -0.034854888916015625, -0.03267478942871094, -0.03049468994140625, -0.028314590454101562, -0.026134490966796875, -0.023954391479492188, -0.0217742919921875, -0.019594192504882812, -0.017414093017578125, -0.015233993530273438, -0.01305389404296875, -0.010873794555664062, -0.008693695068359375, -0.0065135955810546875, -0.00433349609375, -0.0021533966064453125, 2.6702880859375e-05, 0.0022068023681640625, 0.00438690185546875, 0.0065670013427734375, 0.008747100830078125, 0.010927200317382812, 0.0131072998046875, 0.015287399291992188, 0.017467498779296875, 0.019647598266601562, 0.02182769775390625, 0.024007797241210938, 0.026187896728515625, 0.028367996215820312, 0.030548095703125, 0.03272819519042969, 0.034908294677734375, 0.03708839416503906, 0.03926849365234375, 0.04144859313964844, 0.043628692626953125, 0.04580879211425781, 0.0479888916015625, 0.05016899108886719, 0.052349090576171875, 0.05452919006347656, 0.05670928955078125, 0.05888938903808594, 0.061069488525390625, 0.06324958801269531, 0.0654296875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 5.0, 3.0, 7.0, 13.0, 7.0, 13.0, 15.0, 13.0, 15.0, 14.0, 28.0, 35.0, 37.0, 41.0, 57.0, 57.0, 82.0, 56.0, 57.0, 65.0, 57.0, 64.0, 42.0, 31.0, 33.0, 33.0, 20.0, 13.0, 22.0, 15.0, 8.0, 6.0, 10.0, 10.0, 3.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048736572265625, -0.04724407196044922, -0.04575157165527344, -0.044259071350097656, -0.042766571044921875, -0.041274070739746094, -0.03978157043457031, -0.03828907012939453, -0.03679656982421875, -0.03530406951904297, -0.03381156921386719, -0.032319068908691406, -0.030826568603515625, -0.029334068298339844, -0.027841567993164062, -0.02634906768798828, -0.0248565673828125, -0.02336406707763672, -0.021871566772460938, -0.020379066467285156, -0.018886566162109375, -0.017394065856933594, -0.015901565551757812, -0.014409065246582031, -0.01291656494140625, -0.011424064636230469, -0.009931564331054688, -0.008439064025878906, -0.006946563720703125, -0.005454063415527344, -0.0039615631103515625, -0.0024690628051757812, -0.0009765625, 0.0005159378051757812, 0.0020084381103515625, 0.0035009384155273438, 0.004993438720703125, 0.006485939025878906, 0.007978439331054688, 0.009470939636230469, 0.01096343994140625, 0.012455940246582031, 0.013948440551757812, 0.015440940856933594, 0.016933441162109375, 0.018425941467285156, 0.019918441772460938, 0.02141094207763672, 0.0229034423828125, 0.02439594268798828, 0.025888442993164062, 0.027380943298339844, 0.028873443603515625, 0.030365943908691406, 0.03185844421386719, 0.03335094451904297, 0.03484344482421875, 0.03633594512939453, 0.03782844543457031, 0.039320945739746094, 0.040813446044921875, 0.042305946350097656, 0.04379844665527344, 0.04529094696044922, 0.046783447265625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 8.0, 8.0, 20.0, 64.0, 127.0, 322.0, 252.0, 112.0, 50.0, 17.0, 9.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4606847763061523, -1.3905689716339111, -1.3204530477523804, -1.2503372430801392, -1.1802213191986084, -1.1101055145263672, -1.039989709854126, -0.96987384557724, -0.899757981300354, -0.829642117023468, -0.759526252746582, -0.6894104480743408, -0.6192945837974548, -0.5491787195205688, -0.47906288504600525, -0.40894705057144165, -0.33883118629455566, -0.2687153220176697, -0.19859948754310608, -0.1284836381673813, -0.058367788791656494, 0.011748075485229492, 0.08186390995979309, 0.1519797444343567, 0.22209560871124268, 0.29221147298812866, 0.36232730746269226, 0.43244314193725586, 0.5025590062141418, 0.5726748704910278, 0.642790675163269, 0.712906539440155, 0.7830226421356201, 0.8531385064125061, 0.9232543706893921, 0.9933701753616333, 1.063486099243164, 1.1336019039154053, 1.2037177085876465, 1.2738335132598877, 1.3439494371414185, 1.4140652418136597, 1.4841811656951904, 1.5542969703674316, 1.6244127750396729, 1.6945286989212036, 1.7646445035934448, 1.8347604274749756, 1.9048762321472168, 1.974992036819458, 2.045107841491699, 2.1152238845825195, 2.1853396892547607, 2.255455493927002, 2.325571298599243, 2.3956871032714844, 2.4658031463623047, 2.535918951034546, 2.606034755706787, 2.6761507987976074, 2.7462666034698486, 2.81638240814209, 2.886498212814331, 2.9566140174865723, 3.0267298221588135]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 6.0, 4.0, 5.0, 11.0, 5.0, 11.0, 6.0, 13.0, 16.0, 15.0, 21.0, 25.0, 29.0, 30.0, 31.0, 30.0, 43.0, 36.0, 48.0, 68.0, 61.0, 65.0, 60.0, 43.0, 53.0, 35.0, 31.0, 22.0, 23.0, 20.0, 19.0, 17.0, 16.0, 13.0, 11.0, 14.0, 7.0, 7.0, 7.0, 6.0, 1.0, 4.0, 6.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.8308830857276917, -0.8063111305236816, -0.7817391753196716, -0.7571672201156616, -0.7325952649116516, -0.7080233097076416, -0.6834513545036316, -0.6588793992996216, -0.6343074440956116, -0.6097354888916016, -0.5851635336875916, -0.5605915784835815, -0.5360196232795715, -0.5114476680755615, -0.4868757128715515, -0.4623037576675415, -0.4377318322658539, -0.41315987706184387, -0.38858792185783386, -0.36401596665382385, -0.33944401144981384, -0.31487205624580383, -0.2903001308441162, -0.2657281756401062, -0.241156205534935, -0.216584250330925, -0.19201229512691498, -0.16744035482406616, -0.14286839962005615, -0.11829643696546555, -0.09372448921203613, -0.06915253400802612, -0.04458057880401611, -0.020008625462651253, 0.004563327878713608, 0.02913527935743332, 0.05370723456144333, 0.07827918976545334, 0.10285113751888275, 0.12742309272289276, 0.15199504792690277, 0.17656700313091278, 0.2011389583349228, 0.2257108986377716, 0.2502828538417816, 0.2748548090457916, 0.29942676424980164, 0.32399871945381165, 0.34857067465782166, 0.37314262986183167, 0.3977145850658417, 0.4222865402698517, 0.4468584954738617, 0.4714304506778717, 0.4960023760795593, 0.5205743312835693, 0.5451462864875793, 0.5697182416915894, 0.5942901968955994, 0.6188621520996094, 0.6434341073036194, 0.6680060625076294, 0.6925780177116394, 0.7171499729156494, 0.7417219281196594]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 3.0, 4.0, 12.0, 12.0, 17.0, 21.0, 52.0, 78.0, 114.0, 215.0, 319.0, 633.0, 1216.0, 2441.0, 5559.0, 15243.0, 52736.0, 312309.0, 2355352.0, 1250542.0, 147460.0, 31583.0, 10148.0, 4193.0, 1863.0, 924.0, 486.0, 297.0, 148.0, 126.0, 65.0, 38.0, 28.0, 16.0, 11.0, 9.0, 8.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.09442138671875, -0.09204959869384766, -0.08967781066894531, -0.08730602264404297, -0.08493423461914062, -0.08256244659423828, -0.08019065856933594, -0.0778188705444336, -0.07544708251953125, -0.0730752944946289, -0.07070350646972656, -0.06833171844482422, -0.06595993041992188, -0.06358814239501953, -0.06121635437011719, -0.058844566345214844, -0.0564727783203125, -0.054100990295410156, -0.05172920227050781, -0.04935741424560547, -0.046985626220703125, -0.04461383819580078, -0.04224205017089844, -0.039870262145996094, -0.03749847412109375, -0.035126686096191406, -0.03275489807128906, -0.03038311004638672, -0.028011322021484375, -0.02563953399658203, -0.023267745971679688, -0.020895957946777344, -0.018524169921875, -0.016152381896972656, -0.013780593872070312, -0.011408805847167969, -0.009037017822265625, -0.006665229797363281, -0.0042934417724609375, -0.0019216537475585938, 0.00045013427734375, 0.0028219223022460938, 0.0051937103271484375, 0.007565498352050781, 0.009937286376953125, 0.012309074401855469, 0.014680862426757812, 0.017052650451660156, 0.0194244384765625, 0.021796226501464844, 0.024168014526367188, 0.02653980255126953, 0.028911590576171875, 0.03128337860107422, 0.03365516662597656, 0.036026954650878906, 0.03839874267578125, 0.040770530700683594, 0.04314231872558594, 0.04551410675048828, 0.047885894775390625, 0.05025768280029297, 0.05262947082519531, 0.055001258850097656, 0.057373046875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 2.0, 5.0, 4.0, 3.0, 8.0, 6.0, 7.0, 12.0, 12.0, 14.0, 27.0, 32.0, 26.0, 24.0, 33.0, 35.0, 34.0, 32.0, 34.0, 33.0, 51.0, 47.0, 49.0, 37.0, 44.0, 32.0, 39.0, 43.0, 34.0, 42.0, 24.0, 24.0, 27.0, 24.0, 22.0, 20.0, 14.0, 10.0, 8.0, 6.0, 7.0, 7.0, 4.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.042877197265625, -0.04151439666748047, -0.04015159606933594, -0.038788795471191406, -0.037425994873046875, -0.036063194274902344, -0.03470039367675781, -0.03333759307861328, -0.03197479248046875, -0.03061199188232422, -0.029249191284179688, -0.027886390686035156, -0.026523590087890625, -0.025160789489746094, -0.023797988891601562, -0.02243518829345703, -0.0210723876953125, -0.01970958709716797, -0.018346786499023438, -0.016983985900878906, -0.015621185302734375, -0.014258384704589844, -0.012895584106445312, -0.011532783508300781, -0.01016998291015625, -0.008807182312011719, -0.0074443817138671875, -0.006081581115722656, -0.004718780517578125, -0.0033559799194335938, -0.0019931793212890625, -0.0006303787231445312, 0.000732421875, 0.0020952224731445312, 0.0034580230712890625, 0.004820823669433594, 0.006183624267578125, 0.007546424865722656, 0.008909225463867188, 0.010272026062011719, 0.01163482666015625, 0.012997627258300781, 0.014360427856445312, 0.015723228454589844, 0.017086029052734375, 0.018448829650878906, 0.019811630249023438, 0.02117443084716797, 0.0225372314453125, 0.02390003204345703, 0.025262832641601562, 0.026625633239746094, 0.027988433837890625, 0.029351234436035156, 0.030714035034179688, 0.03207683563232422, 0.03343963623046875, 0.03480243682861328, 0.03616523742675781, 0.037528038024902344, 0.038890838623046875, 0.040253639221191406, 0.04161643981933594, 0.04297924041748047, 0.044342041015625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 7.0, 9.0, 33.0, 56.0, 58.0, 119.0, 221.0, 459.0, 1071.0, 3519.0, 15478.0, 148591.0, 3665702.0, 327376.0, 24454.0, 4782.0, 1329.0, 467.0, 239.0, 114.0, 63.0, 38.0, 33.0, 17.0, 12.0, 7.0, 10.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1949462890625, -0.18896865844726562, -0.18299102783203125, -0.17701339721679688, -0.1710357666015625, -0.16505813598632812, -0.15908050537109375, -0.15310287475585938, -0.147125244140625, -0.14114761352539062, -0.13516998291015625, -0.12919235229492188, -0.1232147216796875, -0.11723709106445312, -0.11125946044921875, -0.10528182983398438, -0.09930419921875, -0.09332656860351562, -0.08734893798828125, -0.08137130737304688, -0.0753936767578125, -0.06941604614257812, -0.06343841552734375, -0.057460784912109375, -0.051483154296875, -0.045505523681640625, -0.03952789306640625, -0.033550262451171875, -0.0275726318359375, -0.021595001220703125, -0.01561737060546875, -0.009639739990234375, -0.003662109375, 0.002315521240234375, 0.00829315185546875, 0.014270782470703125, 0.0202484130859375, 0.026226043701171875, 0.03220367431640625, 0.038181304931640625, 0.044158935546875, 0.050136566162109375, 0.05611419677734375, 0.062091827392578125, 0.0680694580078125, 0.07404708862304688, 0.08002471923828125, 0.08600234985351562, 0.09197998046875, 0.09795761108398438, 0.10393524169921875, 0.10991287231445312, 0.1158905029296875, 0.12186813354492188, 0.12784576416015625, 0.13382339477539062, 0.139801025390625, 0.14577865600585938, 0.15175628662109375, 0.15773391723632812, 0.1637115478515625, 0.16968917846679688, 0.17566680908203125, 0.18164443969726562, 0.1876220703125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 1.0, 2.0, 3.0, 4.0, 4.0, 10.0, 9.0, 15.0, 12.0, 19.0, 23.0, 35.0, 57.0, 96.0, 113.0, 194.0, 294.0, 423.0, 613.0, 699.0, 465.0, 322.0, 185.0, 137.0, 104.0, 51.0, 41.0, 30.0, 32.0, 15.0, 13.0, 9.0, 11.0, 10.0, 4.0, 2.0, 4.0, 4.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.119140625, -0.11554431915283203, -0.11194801330566406, -0.1083517074584961, -0.10475540161132812, -0.10115909576416016, -0.09756278991699219, -0.09396648406982422, -0.09037017822265625, -0.08677387237548828, -0.08317756652832031, -0.07958126068115234, -0.07598495483398438, -0.0723886489868164, -0.06879234313964844, -0.06519603729248047, -0.0615997314453125, -0.05800342559814453, -0.05440711975097656, -0.050810813903808594, -0.047214508056640625, -0.043618202209472656, -0.04002189636230469, -0.03642559051513672, -0.03282928466796875, -0.02923297882080078, -0.025636672973632812, -0.022040367126464844, -0.018444061279296875, -0.014847755432128906, -0.011251449584960938, -0.007655143737792969, -0.004058837890625, -0.00046253204345703125, 0.0031337738037109375, 0.006730079650878906, 0.010326385498046875, 0.013922691345214844, 0.017518997192382812, 0.02111530303955078, 0.02471160888671875, 0.02830791473388672, 0.03190422058105469, 0.035500526428222656, 0.039096832275390625, 0.042693138122558594, 0.04628944396972656, 0.04988574981689453, 0.0534820556640625, 0.05707836151123047, 0.06067466735839844, 0.0642709732055664, 0.06786727905273438, 0.07146358489990234, 0.07505989074707031, 0.07865619659423828, 0.08225250244140625, 0.08584880828857422, 0.08944511413574219, 0.09304141998291016, 0.09663772583007812, 0.1002340316772461, 0.10383033752441406, 0.10742664337158203, 0.11102294921875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 6.0, 7.0, 9.0, 31.0, 58.0, 177.0, 243.0, 213.0, 143.0, 63.0, 25.0, 13.0, 6.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.8412970304489136, -1.7834926843643188, -1.7256882190704346, -1.6678838729858398, -1.6100794076919556, -1.5522750616073608, -1.4944705963134766, -1.4366662502288818, -1.378861904144287, -1.3210575580596924, -1.263253092765808, -1.2054487466812134, -1.147644281387329, -1.0898399353027344, -1.0320355892181396, -0.9742311239242554, -0.9164266586303711, -0.8586222529411316, -0.8008178472518921, -0.7430135011672974, -0.6852090358734131, -0.6274046897888184, -0.5696002840995789, -0.5117958784103394, -0.45399147272109985, -0.39618706703186035, -0.33838266134262085, -0.28057828545570374, -0.22277387976646423, -0.16496947407722473, -0.10716509819030762, -0.049360692501068115, 0.008443832397460938, 0.06624823063611984, 0.12405262887477875, 0.18185701966285706, 0.23966142535209656, 0.29746583104133606, 0.3552702069282532, 0.4130746126174927, 0.4708790183067322, 0.5286834239959717, 0.5864878296852112, 0.6442922353744507, 0.7020965814590454, 0.7599010467529297, 0.8177053928375244, 0.8755097985267639, 0.9333142042160034, 0.9911186099052429, 1.0489230155944824, 1.1067273616790771, 1.1645318269729614, 1.2223361730575562, 1.2801406383514404, 1.3379449844360352, 1.3957493305206299, 1.4535536766052246, 1.5113581418991089, 1.5691624879837036, 1.626966953277588, 1.6847712993621826, 1.7425756454467773, 1.8003801107406616, 1.858184576034546]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 5.0, 9.0, 14.0, 15.0, 20.0, 25.0, 30.0, 29.0, 52.0, 54.0, 58.0, 79.0, 65.0, 68.0, 65.0, 72.0, 64.0, 45.0, 50.0, 41.0, 29.0, 21.0, 14.0, 21.0, 15.0, 10.0, 4.0, 9.0, 7.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7511221766471863, -0.7279333472251892, -0.7047445178031921, -0.6815556883811951, -0.6583667993545532, -0.6351779699325562, -0.6119891405105591, -0.588800311088562, -0.5656114816665649, -0.5424226522445679, -0.5192338228225708, -0.49604496359825134, -0.4728561341762543, -0.4496673047542572, -0.42647844552993774, -0.4032896161079407, -0.3801007866859436, -0.35691195726394653, -0.33372312784194946, -0.31053426861763, -0.28734543919563293, -0.26415660977363586, -0.2409677654504776, -0.21777892112731934, -0.19459009170532227, -0.1714012622833252, -0.14821241796016693, -0.12502357363700867, -0.1018347442150116, -0.07864590734243393, -0.05545707046985626, -0.032268226146698, -0.009079396724700928, 0.01410944014787674, 0.03729827702045441, 0.060487113893032074, 0.08367595076560974, 0.10686478763818741, 0.13005362451076508, 0.15324246883392334, 0.1764312982559204, 0.19962012767791748, 0.22280897200107574, 0.245997816324234, 0.2691866457462311, 0.29237547516822815, 0.3155643343925476, 0.3387531638145447, 0.36194199323654175, 0.3851308226585388, 0.4083196520805359, 0.43150851130485535, 0.4546973407268524, 0.4778861701488495, 0.501075029373169, 0.524263858795166, 0.5474526882171631, 0.5706415176391602, 0.5938303470611572, 0.6170191764831543, 0.6402080059051514, 0.6633968949317932, 0.6865857243537903, 0.7097745537757874, 0.7329633831977844]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 8.0, 24.0, 29.0, 33.0, 56.0, 86.0, 138.0, 230.0, 387.0, 616.0, 1052.0, 1854.0, 3494.0, 7425.0, 16826.0, 43524.0, 125211.0, 319162.0, 322948.0, 128447.0, 44311.0, 17085.0, 7415.0, 3525.0, 1920.0, 1101.0, 654.0, 374.0, 218.0, 136.0, 99.0, 56.0, 33.0, 29.0, 19.0, 6.0, 13.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06781005859375, -0.06547260284423828, -0.06313514709472656, -0.060797691345214844, -0.058460235595703125, -0.056122779846191406, -0.05378532409667969, -0.05144786834716797, -0.04911041259765625, -0.04677295684814453, -0.04443550109863281, -0.042098045349121094, -0.039760589599609375, -0.037423133850097656, -0.03508567810058594, -0.03274822235107422, -0.0304107666015625, -0.02807331085205078, -0.025735855102539062, -0.023398399353027344, -0.021060943603515625, -0.018723487854003906, -0.016386032104492188, -0.014048576354980469, -0.01171112060546875, -0.009373664855957031, -0.0070362091064453125, -0.004698753356933594, -0.002361297607421875, -2.384185791015625e-05, 0.0023136138916015625, 0.004651069641113281, 0.006988525390625, 0.009325981140136719, 0.011663436889648438, 0.014000892639160156, 0.016338348388671875, 0.018675804138183594, 0.021013259887695312, 0.02335071563720703, 0.02568817138671875, 0.02802562713623047, 0.030363082885742188, 0.032700538635253906, 0.035037994384765625, 0.037375450134277344, 0.03971290588378906, 0.04205036163330078, 0.0443878173828125, 0.04672527313232422, 0.04906272888183594, 0.051400184631347656, 0.053737640380859375, 0.056075096130371094, 0.05841255187988281, 0.06075000762939453, 0.06308746337890625, 0.06542491912841797, 0.06776237487792969, 0.0700998306274414, 0.07243728637695312, 0.07477474212646484, 0.07711219787597656, 0.07944965362548828, 0.081787109375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 8.0, 5.0, 5.0, 10.0, 7.0, 13.0, 17.0, 18.0, 18.0, 18.0, 24.0, 29.0, 39.0, 35.0, 28.0, 40.0, 47.0, 34.0, 42.0, 46.0, 44.0, 37.0, 42.0, 39.0, 35.0, 25.0, 33.0, 22.0, 37.0, 27.0, 32.0, 16.0, 22.0, 18.0, 14.0, 20.0, 7.0, 10.0, 10.0, 2.0, 3.0, 4.0, 5.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04022216796875, -0.03884601593017578, -0.03746986389160156, -0.036093711853027344, -0.034717559814453125, -0.033341407775878906, -0.03196525573730469, -0.03058910369873047, -0.02921295166015625, -0.02783679962158203, -0.026460647583007812, -0.025084495544433594, -0.023708343505859375, -0.022332191467285156, -0.020956039428710938, -0.01957988739013672, -0.0182037353515625, -0.01682758331298828, -0.015451431274414062, -0.014075279235839844, -0.012699127197265625, -0.011322975158691406, -0.009946823120117188, -0.008570671081542969, -0.00719451904296875, -0.005818367004394531, -0.0044422149658203125, -0.0030660629272460938, -0.001689910888671875, -0.00031375885009765625, 0.0010623931884765625, 0.0024385452270507812, 0.003814697265625, 0.005190849304199219, 0.0065670013427734375, 0.007943153381347656, 0.009319305419921875, 0.010695457458496094, 0.012071609497070312, 0.013447761535644531, 0.01482391357421875, 0.01620006561279297, 0.017576217651367188, 0.018952369689941406, 0.020328521728515625, 0.021704673767089844, 0.023080825805664062, 0.02445697784423828, 0.0258331298828125, 0.02720928192138672, 0.028585433959960938, 0.029961585998535156, 0.031337738037109375, 0.032713890075683594, 0.03409004211425781, 0.03546619415283203, 0.03684234619140625, 0.03821849822998047, 0.03959465026855469, 0.040970802307128906, 0.042346954345703125, 0.043723106384277344, 0.04509925842285156, 0.04647541046142578, 0.0478515625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 7.0, 6.0, 5.0, 12.0, 11.0, 12.0, 17.0, 30.0, 35.0, 53.0, 100.0, 201.0, 341.0, 704.0, 1706.0, 5120.0, 22546.0, 163258.0, 718263.0, 112431.0, 16744.0, 4139.0, 1453.0, 590.0, 314.0, 149.0, 100.0, 77.0, 40.0, 31.0, 18.0, 9.0, 9.0, 9.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.160888671875, -0.15634536743164062, -0.15180206298828125, -0.14725875854492188, -0.1427154541015625, -0.13817214965820312, -0.13362884521484375, -0.12908554077148438, -0.124542236328125, -0.11999893188476562, -0.11545562744140625, -0.11091232299804688, -0.1063690185546875, -0.10182571411132812, -0.09728240966796875, -0.09273910522460938, -0.08819580078125, -0.08365249633789062, -0.07910919189453125, -0.07456588745117188, -0.0700225830078125, -0.06547927856445312, -0.06093597412109375, -0.056392669677734375, -0.051849365234375, -0.047306060791015625, -0.04276275634765625, -0.038219451904296875, -0.0336761474609375, -0.029132843017578125, -0.02458953857421875, -0.020046234130859375, -0.0155029296875, -0.010959625244140625, -0.00641632080078125, -0.001873016357421875, 0.0026702880859375, 0.007213592529296875, 0.01175689697265625, 0.016300201416015625, 0.020843505859375, 0.025386810302734375, 0.02993011474609375, 0.034473419189453125, 0.0390167236328125, 0.043560028076171875, 0.04810333251953125, 0.052646636962890625, 0.05718994140625, 0.061733245849609375, 0.06627655029296875, 0.07081985473632812, 0.0753631591796875, 0.07990646362304688, 0.08444976806640625, 0.08899307250976562, 0.093536376953125, 0.09807968139648438, 0.10262298583984375, 0.10716629028320312, 0.1117095947265625, 0.11625289916992188, 0.12079620361328125, 0.12533950805664062, 0.1298828125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 4.0, 9.0, 9.0, 13.0, 14.0, 30.0, 19.0, 29.0, 32.0, 35.0, 33.0, 41.0, 34.0, 60.0, 48.0, 34.0, 42.0, 47.0, 55.0, 51.0, 37.0, 52.0, 40.0, 24.0, 40.0, 32.0, 22.0, 22.0, 13.0, 19.0, 7.0, 6.0, 11.0, 10.0, 5.0, 7.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.185546875, -0.17974853515625, -0.1739501953125, -0.16815185546875, -0.162353515625, -0.15655517578125, -0.1507568359375, -0.14495849609375, -0.13916015625, -0.13336181640625, -0.1275634765625, -0.12176513671875, -0.115966796875, -0.11016845703125, -0.1043701171875, -0.09857177734375, -0.0927734375, -0.08697509765625, -0.0811767578125, -0.07537841796875, -0.069580078125, -0.06378173828125, -0.0579833984375, -0.05218505859375, -0.04638671875, -0.04058837890625, -0.0347900390625, -0.02899169921875, -0.023193359375, -0.01739501953125, -0.0115966796875, -0.00579833984375, 0.0, 0.00579833984375, 0.0115966796875, 0.01739501953125, 0.023193359375, 0.02899169921875, 0.0347900390625, 0.04058837890625, 0.04638671875, 0.05218505859375, 0.0579833984375, 0.06378173828125, 0.069580078125, 0.07537841796875, 0.0811767578125, 0.08697509765625, 0.0927734375, 0.09857177734375, 0.1043701171875, 0.11016845703125, 0.115966796875, 0.12176513671875, 0.1275634765625, 0.13336181640625, 0.13916015625, 0.14495849609375, 0.1507568359375, 0.15655517578125, 0.162353515625, 0.16815185546875, 0.1739501953125, 0.17974853515625, 0.185546875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 2.0, 14.0, 20.0, 25.0, 38.0, 45.0, 68.0, 108.0, 189.0, 334.0, 722.0, 1618.0, 4775.0, 17801.0, 103342.0, 726763.0, 158586.0, 24195.0, 6098.0, 2046.0, 852.0, 381.0, 213.0, 111.0, 68.0, 54.0, 27.0, 21.0, 12.0, 6.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06341552734375, -0.06119823455810547, -0.05898094177246094, -0.056763648986816406, -0.054546356201171875, -0.052329063415527344, -0.05011177062988281, -0.04789447784423828, -0.04567718505859375, -0.04345989227294922, -0.04124259948730469, -0.039025306701660156, -0.036808013916015625, -0.034590721130371094, -0.03237342834472656, -0.03015613555908203, -0.0279388427734375, -0.02572154998779297, -0.023504257202148438, -0.021286964416503906, -0.019069671630859375, -0.016852378845214844, -0.014635086059570312, -0.012417793273925781, -0.01020050048828125, -0.007983207702636719, -0.0057659149169921875, -0.0035486221313476562, -0.001331329345703125, 0.0008859634399414062, 0.0031032562255859375, 0.005320549011230469, 0.007537841796875, 0.009755134582519531, 0.011972427368164062, 0.014189720153808594, 0.016407012939453125, 0.018624305725097656, 0.020841598510742188, 0.02305889129638672, 0.02527618408203125, 0.02749347686767578, 0.029710769653320312, 0.031928062438964844, 0.034145355224609375, 0.036362648010253906, 0.03857994079589844, 0.04079723358154297, 0.0430145263671875, 0.04523181915283203, 0.04744911193847656, 0.049666404724121094, 0.051883697509765625, 0.054100990295410156, 0.05631828308105469, 0.05853557586669922, 0.06075286865234375, 0.06297016143798828, 0.06518745422363281, 0.06740474700927734, 0.06962203979492188, 0.0718393325805664, 0.07405662536621094, 0.07627391815185547, 0.0784912109375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 3.0, 7.0, 13.0, 16.0, 16.0, 35.0, 40.0, 46.0, 64.0, 67.0, 96.0, 86.0, 107.0, 74.0, 87.0, 50.0, 43.0, 38.0, 35.0, 14.0, 16.0, 11.0, 7.0, 13.0, 4.0, 2.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3589859008789062e-05, -1.290440559387207e-05, -1.2218952178955078e-05, -1.1533498764038086e-05, -1.0848045349121094e-05, -1.0162591934204102e-05, -9.47713851928711e-06, -8.791685104370117e-06, -8.106231689453125e-06, -7.420778274536133e-06, -6.735324859619141e-06, -6.0498714447021484e-06, -5.364418029785156e-06, -4.678964614868164e-06, -3.993511199951172e-06, -3.3080577850341797e-06, -2.6226043701171875e-06, -1.9371509552001953e-06, -1.2516975402832031e-06, -5.662441253662109e-07, 1.1920928955078125e-07, 8.046627044677734e-07, 1.4901161193847656e-06, 2.175569534301758e-06, 2.86102294921875e-06, 3.546476364135742e-06, 4.231929779052734e-06, 4.9173831939697266e-06, 5.602836608886719e-06, 6.288290023803711e-06, 6.973743438720703e-06, 7.659196853637695e-06, 8.344650268554688e-06, 9.03010368347168e-06, 9.715557098388672e-06, 1.0401010513305664e-05, 1.1086463928222656e-05, 1.1771917343139648e-05, 1.245737075805664e-05, 1.3142824172973633e-05, 1.3828277587890625e-05, 1.4513731002807617e-05, 1.519918441772461e-05, 1.58846378326416e-05, 1.6570091247558594e-05, 1.7255544662475586e-05, 1.7940998077392578e-05, 1.862645149230957e-05, 1.9311904907226562e-05, 1.9997358322143555e-05, 2.0682811737060547e-05, 2.136826515197754e-05, 2.205371856689453e-05, 2.2739171981811523e-05, 2.3424625396728516e-05, 2.4110078811645508e-05, 2.47955322265625e-05, 2.5480985641479492e-05, 2.6166439056396484e-05, 2.6851892471313477e-05, 2.753734588623047e-05, 2.822279930114746e-05, 2.8908252716064453e-05, 2.9593706130981445e-05, 3.0279159545898438e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 9.0, 8.0, 6.0, 14.0, 14.0, 31.0, 47.0, 83.0, 181.0, 391.0, 946.0, 2824.0, 11516.0, 78043.0, 772579.0, 157426.0, 18114.0, 4105.0, 1251.0, 489.0, 219.0, 114.0, 53.0, 31.0, 19.0, 13.0, 7.0, 7.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06292724609375, -0.060265541076660156, -0.05760383605957031, -0.05494213104248047, -0.052280426025390625, -0.04961872100830078, -0.04695701599121094, -0.044295310974121094, -0.04163360595703125, -0.038971900939941406, -0.03631019592285156, -0.03364849090576172, -0.030986785888671875, -0.02832508087158203, -0.025663375854492188, -0.023001670837402344, -0.0203399658203125, -0.017678260803222656, -0.015016555786132812, -0.012354850769042969, -0.009693145751953125, -0.007031440734863281, -0.0043697357177734375, -0.0017080307006835938, 0.00095367431640625, 0.0036153793334960938, 0.0062770843505859375, 0.008938789367675781, 0.011600494384765625, 0.014262199401855469, 0.016923904418945312, 0.019585609436035156, 0.022247314453125, 0.024909019470214844, 0.027570724487304688, 0.03023242950439453, 0.032894134521484375, 0.03555583953857422, 0.03821754455566406, 0.040879249572753906, 0.04354095458984375, 0.046202659606933594, 0.04886436462402344, 0.05152606964111328, 0.054187774658203125, 0.05684947967529297, 0.05951118469238281, 0.062172889709472656, 0.0648345947265625, 0.06749629974365234, 0.07015800476074219, 0.07281970977783203, 0.07548141479492188, 0.07814311981201172, 0.08080482482910156, 0.0834665298461914, 0.08612823486328125, 0.0887899398803711, 0.09145164489746094, 0.09411334991455078, 0.09677505493164062, 0.09943675994873047, 0.10209846496582031, 0.10476016998291016, 0.107421875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 6.0, 2.0, 2.0, 10.0, 9.0, 21.0, 27.0, 31.0, 42.0, 56.0, 65.0, 69.0, 88.0, 104.0, 91.0, 75.0, 76.0, 55.0, 53.0, 32.0, 24.0, 19.0, 8.0, 10.0, 8.0, 6.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.07061767578125, -0.0686197280883789, -0.06662178039550781, -0.06462383270263672, -0.06262588500976562, -0.06062793731689453, -0.05862998962402344, -0.056632041931152344, -0.05463409423828125, -0.052636146545410156, -0.05063819885253906, -0.04864025115966797, -0.046642303466796875, -0.04464435577392578, -0.04264640808105469, -0.040648460388183594, -0.0386505126953125, -0.036652565002441406, -0.03465461730957031, -0.03265666961669922, -0.030658721923828125, -0.02866077423095703, -0.026662826538085938, -0.024664878845214844, -0.02266693115234375, -0.020668983459472656, -0.018671035766601562, -0.01667308807373047, -0.014675140380859375, -0.012677192687988281, -0.010679244995117188, -0.008681297302246094, -0.006683349609375, -0.004685401916503906, -0.0026874542236328125, -0.0006895065307617188, 0.001308441162109375, 0.0033063888549804688, 0.0053043365478515625, 0.007302284240722656, 0.00930023193359375, 0.011298179626464844, 0.013296127319335938, 0.015294075012207031, 0.017292022705078125, 0.01928997039794922, 0.021287918090820312, 0.023285865783691406, 0.0252838134765625, 0.027281761169433594, 0.029279708862304688, 0.03127765655517578, 0.033275604248046875, 0.03527355194091797, 0.03727149963378906, 0.039269447326660156, 0.04126739501953125, 0.043265342712402344, 0.04526329040527344, 0.04726123809814453, 0.049259185791015625, 0.05125713348388672, 0.05325508117675781, 0.055253028869628906, 0.0572509765625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 8.0, 17.0, 32.0, 121.0, 363.0, 297.0, 108.0, 36.0, 12.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.206325054168701, -2.137188673019409, -2.0680525302886963, -1.9989162683486938, -1.9297800064086914, -1.8606436252593994, -1.791507363319397, -1.7223711013793945, -1.653234839439392, -1.5840985774993896, -1.5149623155593872, -1.4458260536193848, -1.3766896724700928, -1.3075535297393799, -1.238417148590088, -1.1692808866500854, -1.100144624710083, -1.0310083627700806, -0.9618721008300781, -0.8927357792854309, -0.8235995173454285, -0.754463255405426, -0.6853269338607788, -0.6161906719207764, -0.5470544099807739, -0.4779181480407715, -0.40878185629844666, -0.3396455645561218, -0.2705093026161194, -0.20137304067611694, -0.13223674893379211, -0.06310045719146729, 0.006036043167114258, 0.0751723200082779, 0.14430859684944153, 0.21344487369060516, 0.2825811505317688, 0.35171741247177124, 0.42085370421409607, 0.4899899959564209, 0.5591262578964233, 0.6282625198364258, 0.6973987817764282, 0.7665351033210754, 0.8356713652610779, 0.9048076272010803, 0.9739439487457275, 1.04308021068573, 1.1122164726257324, 1.1813527345657349, 1.2504889965057373, 1.3196252584457397, 1.3887615203857422, 1.4578979015350342, 1.5270341634750366, 1.596170425415039, 1.6653066873550415, 1.734442949295044, 1.8035792112350464, 1.8727154731750488, 1.9418518543243408, 2.0109879970550537, 2.0801243782043457, 2.1492605209350586, 2.2183969020843506]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 0.0, 3.0, 4.0, 3.0, 6.0, 4.0, 9.0, 7.0, 5.0, 10.0, 11.0, 8.0, 13.0, 15.0, 14.0, 21.0, 22.0, 24.0, 28.0, 32.0, 37.0, 43.0, 48.0, 76.0, 61.0, 65.0, 57.0, 59.0, 43.0, 35.0, 21.0, 36.0, 31.0, 26.0, 24.0, 10.0, 19.0, 20.0, 9.0, 11.0, 9.0, 5.0, 6.0, 6.0, 9.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6456982493400574, -0.623222827911377, -0.6007474660873413, -0.5782720446586609, -0.5557966232299805, -0.5333212018013, -0.5108457803726196, -0.488370418548584, -0.46589499711990356, -0.44341957569122314, -0.4209441840648651, -0.3984687924385071, -0.37599337100982666, -0.35351794958114624, -0.3310425579547882, -0.3085671663284302, -0.28609174489974976, -0.26361632347106934, -0.2411409318447113, -0.21866552531719208, -0.19619011878967285, -0.17371471226215363, -0.1512393057346344, -0.12876389920711517, -0.10628849267959595, -0.08381308615207672, -0.061337679624557495, -0.03886227309703827, -0.016386866569519043, 0.006088539958000183, 0.02856394648551941, 0.051039353013038635, 0.07351481914520264, 0.09599022567272186, 0.11846563220024109, 0.14094103872776031, 0.16341644525527954, 0.18589185178279877, 0.208367258310318, 0.23084266483783722, 0.25331807136535645, 0.27579349279403687, 0.2982688844203949, 0.32074427604675293, 0.34321969747543335, 0.36569511890411377, 0.3881705105304718, 0.41064590215682983, 0.43312132358551025, 0.4555967450141907, 0.4780721366405487, 0.5005475282669067, 0.5230229496955872, 0.5454983711242676, 0.5679737329483032, 0.5904491543769836, 0.6129245758056641, 0.6353999972343445, 0.6578754186630249, 0.6803507804870605, 0.702826201915741, 0.7253016233444214, 0.747776985168457, 0.7702524065971375, 0.7927278280258179]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 2.0, 3.0, 8.0, 7.0, 16.0, 17.0, 22.0, 39.0, 37.0, 81.0, 127.0, 177.0, 285.0, 460.0, 737.0, 1248.0, 2275.0, 4059.0, 7655.0, 16602.0, 45034.0, 173660.0, 982675.0, 2231021.0, 559787.0, 109053.0, 32024.0, 12876.0, 6157.0, 3267.0, 1924.0, 1107.0, 647.0, 411.0, 263.0, 173.0, 115.0, 75.0, 45.0, 40.0, 31.0, 22.0, 9.0, 9.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.051666259765625, -0.049776554107666016, -0.04788684844970703, -0.04599714279174805, -0.04410743713378906, -0.04221773147583008, -0.040328025817871094, -0.03843832015991211, -0.036548614501953125, -0.03465890884399414, -0.032769203186035156, -0.030879497528076172, -0.028989791870117188, -0.027100086212158203, -0.02521038055419922, -0.023320674896240234, -0.02143096923828125, -0.019541263580322266, -0.01765155792236328, -0.015761852264404297, -0.013872146606445312, -0.011982440948486328, -0.010092735290527344, -0.00820302963256836, -0.006313323974609375, -0.004423618316650391, -0.0025339126586914062, -0.0006442070007324219, 0.0012454986572265625, 0.003135204315185547, 0.005024909973144531, 0.006914615631103516, 0.0088043212890625, 0.010694026947021484, 0.012583732604980469, 0.014473438262939453, 0.016363143920898438, 0.018252849578857422, 0.020142555236816406, 0.02203226089477539, 0.023921966552734375, 0.02581167221069336, 0.027701377868652344, 0.029591083526611328, 0.03148078918457031, 0.0333704948425293, 0.03526020050048828, 0.037149906158447266, 0.03903961181640625, 0.040929317474365234, 0.04281902313232422, 0.0447087287902832, 0.04659843444824219, 0.04848814010620117, 0.050377845764160156, 0.05226755142211914, 0.054157257080078125, 0.05604696273803711, 0.057936668395996094, 0.05982637405395508, 0.06171607971191406, 0.06360578536987305, 0.06549549102783203, 0.06738519668579102, 0.06927490234375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 7.0, 7.0, 4.0, 6.0, 6.0, 8.0, 9.0, 12.0, 23.0, 18.0, 22.0, 20.0, 36.0, 51.0, 37.0, 44.0, 42.0, 37.0, 56.0, 58.0, 54.0, 45.0, 54.0, 34.0, 45.0, 50.0, 34.0, 33.0, 36.0, 17.0, 21.0, 17.0, 23.0, 12.0, 4.0, 7.0, 9.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.055450439453125, -0.053768157958984375, -0.05208587646484375, -0.050403594970703125, -0.0487213134765625, -0.047039031982421875, -0.04535675048828125, -0.043674468994140625, -0.0419921875, -0.040309906005859375, -0.03862762451171875, -0.036945343017578125, -0.0352630615234375, -0.033580780029296875, -0.03189849853515625, -0.030216217041015625, -0.028533935546875, -0.026851654052734375, -0.02516937255859375, -0.023487091064453125, -0.0218048095703125, -0.020122528076171875, -0.01844024658203125, -0.016757965087890625, -0.01507568359375, -0.013393402099609375, -0.01171112060546875, -0.010028839111328125, -0.0083465576171875, -0.006664276123046875, -0.00498199462890625, -0.003299713134765625, -0.001617431640625, 6.4849853515625e-05, 0.00174713134765625, 0.003429412841796875, 0.0051116943359375, 0.006793975830078125, 0.00847625732421875, 0.010158538818359375, 0.0118408203125, 0.013523101806640625, 0.01520538330078125, 0.016887664794921875, 0.0185699462890625, 0.020252227783203125, 0.02193450927734375, 0.023616790771484375, 0.025299072265625, 0.026981353759765625, 0.02866363525390625, 0.030345916748046875, 0.0320281982421875, 0.033710479736328125, 0.03539276123046875, 0.037075042724609375, 0.03875732421875, 0.040439605712890625, 0.04212188720703125, 0.043804168701171875, 0.0454864501953125, 0.047168731689453125, 0.04885101318359375, 0.050533294677734375, 0.052215576171875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 3.0, 9.0, 9.0, 16.0, 30.0, 36.0, 72.0, 94.0, 181.0, 536.0, 1914.0, 9065.0, 88956.0, 3719728.0, 350134.0, 18727.0, 3254.0, 843.0, 312.0, 128.0, 64.0, 47.0, 24.0, 25.0, 17.0, 13.0, 9.0, 8.0, 5.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1859130859375, -0.1791973114013672, -0.17248153686523438, -0.16576576232910156, -0.15904998779296875, -0.15233421325683594, -0.14561843872070312, -0.1389026641845703, -0.1321868896484375, -0.1254711151123047, -0.11875534057617188, -0.11203956604003906, -0.10532379150390625, -0.09860801696777344, -0.09189224243164062, -0.08517646789550781, -0.078460693359375, -0.07174491882324219, -0.06502914428710938, -0.05831336975097656, -0.05159759521484375, -0.04488182067871094, -0.038166046142578125, -0.03145027160644531, -0.0247344970703125, -0.018018722534179688, -0.011302947998046875, -0.0045871734619140625, 0.00212860107421875, 0.008844375610351562, 0.015560150146484375, 0.022275924682617188, 0.02899169921875, 0.03570747375488281, 0.042423248291015625, 0.04913902282714844, 0.05585479736328125, 0.06257057189941406, 0.06928634643554688, 0.07600212097167969, 0.0827178955078125, 0.08943367004394531, 0.09614944458007812, 0.10286521911621094, 0.10958099365234375, 0.11629676818847656, 0.12301254272460938, 0.1297283172607422, 0.136444091796875, 0.1431598663330078, 0.14987564086914062, 0.15659141540527344, 0.16330718994140625, 0.17002296447753906, 0.17673873901367188, 0.1834545135498047, 0.1901702880859375, 0.1968860626220703, 0.20360183715820312, 0.21031761169433594, 0.21703338623046875, 0.22374916076660156, 0.23046493530273438, 0.2371807098388672, 0.243896484375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 7.0, 5.0, 7.0, 5.0, 11.0, 15.0, 15.0, 22.0, 37.0, 47.0, 53.0, 98.0, 148.0, 266.0, 376.0, 618.0, 664.0, 621.0, 369.0, 230.0, 125.0, 105.0, 59.0, 48.0, 27.0, 23.0, 14.0, 10.0, 16.0, 5.0, 6.0, 4.0, 3.0, 6.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10040283203125, -0.09674739837646484, -0.09309196472167969, -0.08943653106689453, -0.08578109741210938, -0.08212566375732422, -0.07847023010253906, -0.0748147964477539, -0.07115936279296875, -0.0675039291381836, -0.06384849548339844, -0.06019306182861328, -0.056537628173828125, -0.05288219451904297, -0.04922676086425781, -0.045571327209472656, -0.0419158935546875, -0.038260459899902344, -0.03460502624511719, -0.03094959259033203, -0.027294158935546875, -0.02363872528076172, -0.019983291625976562, -0.016327857971191406, -0.01267242431640625, -0.009016990661621094, -0.0053615570068359375, -0.0017061233520507812, 0.001949310302734375, 0.005604743957519531, 0.009260177612304688, 0.012915611267089844, 0.016571044921875, 0.020226478576660156, 0.023881912231445312, 0.02753734588623047, 0.031192779541015625, 0.03484821319580078, 0.03850364685058594, 0.042159080505371094, 0.04581451416015625, 0.049469947814941406, 0.05312538146972656, 0.05678081512451172, 0.060436248779296875, 0.06409168243408203, 0.06774711608886719, 0.07140254974365234, 0.0750579833984375, 0.07871341705322266, 0.08236885070800781, 0.08602428436279297, 0.08967971801757812, 0.09333515167236328, 0.09699058532714844, 0.1006460189819336, 0.10430145263671875, 0.1079568862915039, 0.11161231994628906, 0.11526775360107422, 0.11892318725585938, 0.12257862091064453, 0.1262340545654297, 0.12988948822021484, 0.133544921875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 9.0, 10.0, 30.0, 56.0, 112.0, 174.0, 234.0, 171.0, 92.0, 68.0, 18.0, 11.0, 7.0, 5.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0755388736724854, -1.0312937498092651, -0.9870485663414001, -0.9428034424781799, -0.8985582590103149, -0.8543131351470947, -0.8100680112838745, -0.7658228278160095, -0.7215776443481445, -0.6773325204849243, -0.6330873370170593, -0.5888422131538391, -0.5445970296859741, -0.5003519058227539, -0.4561067521572113, -0.4118615984916687, -0.3676164746284485, -0.3233713209629059, -0.2791261672973633, -0.23488102853298187, -0.19063587486743927, -0.14639072120189667, -0.10214558243751526, -0.057900428771972656, -0.013655275106430054, 0.03058987483382225, 0.07483502477407455, 0.11908017098903656, 0.16332532465457916, 0.20757047832012177, 0.2518156170845032, 0.2960607707500458, 0.3403059244155884, 0.384551078081131, 0.4287962317466736, 0.4730413556098938, 0.5172865390777588, 0.561531662940979, 0.6057767868041992, 0.6500219702720642, 0.6942671537399292, 0.7385122776031494, 0.7827574610710144, 0.8270025849342346, 0.8712477684020996, 0.9154928922653198, 0.95973801612854, 1.0039832592010498, 1.0482282638549805, 1.0924733877182007, 1.136718511581421, 1.1809637546539307, 1.2252088785171509, 1.269454002380371, 1.3136991262435913, 1.3579442501068115, 1.4021894931793213, 1.4464346170425415, 1.4906797409057617, 1.5349249839782715, 1.5791701078414917, 1.623415231704712, 1.6676603555679321, 1.7119054794311523, 1.756150722503662]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 7.0, 8.0, 9.0, 10.0, 10.0, 14.0, 13.0, 21.0, 15.0, 18.0, 29.0, 29.0, 33.0, 41.0, 52.0, 50.0, 51.0, 45.0, 47.0, 52.0, 55.0, 61.0, 38.0, 39.0, 35.0, 40.0, 28.0, 17.0, 25.0, 15.0, 11.0, 15.0, 15.0, 17.0, 17.0, 2.0, 3.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.5719928741455078, -0.5546301603317261, -0.5372673869132996, -0.519904613494873, -0.5025418996810913, -0.4851791560649872, -0.46781641244888306, -0.45045366883277893, -0.4330909252166748, -0.4157281816005707, -0.39836543798446655, -0.3810026943683624, -0.3636399507522583, -0.3462772071361542, -0.32891446352005005, -0.3115517199039459, -0.2941889762878418, -0.27682623267173767, -0.25946348905563354, -0.24210074543952942, -0.2247380018234253, -0.20737525820732117, -0.19001251459121704, -0.17264977097511292, -0.1552870273590088, -0.13792428374290466, -0.12056154012680054, -0.10319879651069641, -0.08583605289459229, -0.06847330927848816, -0.05111056566238403, -0.03374782204627991, -0.016385138034820557, 0.0009776055812835693, 0.018340349197387695, 0.03570309281349182, 0.05306583642959595, 0.07042858004570007, 0.0877913236618042, 0.10515406727790833, 0.12251681089401245, 0.13987955451011658, 0.1572422981262207, 0.17460504174232483, 0.19196778535842896, 0.20933052897453308, 0.2266932725906372, 0.24405601620674133, 0.26141875982284546, 0.2787815034389496, 0.2961442470550537, 0.31350699067115784, 0.33086973428726196, 0.3482324779033661, 0.3655952215194702, 0.38295796513557434, 0.40032070875167847, 0.4176834523677826, 0.4350461959838867, 0.45240893959999084, 0.46977168321609497, 0.4871344268321991, 0.5044971704483032, 0.521859884262085, 0.5392226576805115]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 15.0, 8.0, 17.0, 32.0, 37.0, 43.0, 66.0, 123.0, 160.0, 259.0, 441.0, 812.0, 1279.0, 2497.0, 5165.0, 11566.0, 32259.0, 108556.0, 370343.0, 358759.0, 103291.0, 31142.0, 11239.0, 4784.0, 2403.0, 1287.0, 754.0, 395.0, 272.0, 171.0, 120.0, 75.0, 54.0, 34.0, 31.0, 23.0, 12.0, 8.0, 7.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08160400390625, -0.07888221740722656, -0.07616043090820312, -0.07343864440917969, -0.07071685791015625, -0.06799507141113281, -0.06527328491210938, -0.06255149841308594, -0.0598297119140625, -0.05710792541503906, -0.054386138916015625, -0.05166435241699219, -0.04894256591796875, -0.04622077941894531, -0.043498992919921875, -0.04077720642089844, -0.038055419921875, -0.03533363342285156, -0.032611846923828125, -0.029890060424804688, -0.02716827392578125, -0.024446487426757812, -0.021724700927734375, -0.019002914428710938, -0.0162811279296875, -0.013559341430664062, -0.010837554931640625, -0.008115768432617188, -0.00539398193359375, -0.0026721954345703125, 4.9591064453125e-05, 0.0027713775634765625, 0.0054931640625, 0.008214950561523438, 0.010936737060546875, 0.013658523559570312, 0.01638031005859375, 0.019102096557617188, 0.021823883056640625, 0.024545669555664062, 0.0272674560546875, 0.029989242553710938, 0.032711029052734375, 0.03543281555175781, 0.03815460205078125, 0.04087638854980469, 0.043598175048828125, 0.04631996154785156, 0.049041748046875, 0.05176353454589844, 0.054485321044921875, 0.05720710754394531, 0.05992889404296875, 0.06265068054199219, 0.06537246704101562, 0.06809425354003906, 0.0708160400390625, 0.07353782653808594, 0.07625961303710938, 0.07898139953613281, 0.08170318603515625, 0.08442497253417969, 0.08714675903320312, 0.08986854553222656, 0.09259033203125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 3.0, 6.0, 10.0, 12.0, 11.0, 14.0, 29.0, 24.0, 36.0, 30.0, 36.0, 38.0, 50.0, 51.0, 45.0, 54.0, 51.0, 50.0, 57.0, 49.0, 61.0, 42.0, 42.0, 30.0, 30.0, 16.0, 27.0, 24.0, 19.0, 13.0, 7.0, 10.0, 6.0, 2.0, 4.0, 3.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055694580078125, -0.053822994232177734, -0.05195140838623047, -0.0500798225402832, -0.04820823669433594, -0.04633665084838867, -0.044465065002441406, -0.04259347915649414, -0.040721893310546875, -0.03885030746459961, -0.036978721618652344, -0.03510713577270508, -0.03323554992675781, -0.03136396408081055, -0.02949237823486328, -0.027620792388916016, -0.02574920654296875, -0.023877620697021484, -0.02200603485107422, -0.020134449005126953, -0.018262863159179688, -0.016391277313232422, -0.014519691467285156, -0.01264810562133789, -0.010776519775390625, -0.00890493392944336, -0.007033348083496094, -0.005161762237548828, -0.0032901763916015625, -0.0014185905456542969, 0.00045299530029296875, 0.0023245811462402344, 0.0041961669921875, 0.006067752838134766, 0.007939338684082031, 0.009810924530029297, 0.011682510375976562, 0.013554096221923828, 0.015425682067871094, 0.01729726791381836, 0.019168853759765625, 0.02104043960571289, 0.022912025451660156, 0.024783611297607422, 0.026655197143554688, 0.028526782989501953, 0.03039836883544922, 0.032269954681396484, 0.03414154052734375, 0.036013126373291016, 0.03788471221923828, 0.03975629806518555, 0.04162788391113281, 0.04349946975708008, 0.045371055603027344, 0.04724264144897461, 0.049114227294921875, 0.05098581314086914, 0.052857398986816406, 0.05472898483276367, 0.05660057067871094, 0.0584721565246582, 0.06034374237060547, 0.062215328216552734, 0.0640869140625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 4.0, 10.0, 6.0, 16.0, 11.0, 14.0, 36.0, 39.0, 74.0, 100.0, 191.0, 292.0, 624.0, 1277.0, 3379.0, 11080.0, 53497.0, 593125.0, 326432.0, 43424.0, 9398.0, 2981.0, 1236.0, 548.0, 263.0, 182.0, 103.0, 61.0, 52.0, 34.0, 23.0, 16.0, 8.0, 3.0, 4.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.1512451171875, -0.14715099334716797, -0.14305686950683594, -0.1389627456665039, -0.13486862182617188, -0.13077449798583984, -0.1266803741455078, -0.12258625030517578, -0.11849212646484375, -0.11439800262451172, -0.11030387878417969, -0.10620975494384766, -0.10211563110351562, -0.0980215072631836, -0.09392738342285156, -0.08983325958251953, -0.0857391357421875, -0.08164501190185547, -0.07755088806152344, -0.0734567642211914, -0.06936264038085938, -0.06526851654052734, -0.06117439270019531, -0.05708026885986328, -0.05298614501953125, -0.04889202117919922, -0.04479789733886719, -0.040703773498535156, -0.036609649658203125, -0.032515525817871094, -0.028421401977539062, -0.02432727813720703, -0.020233154296875, -0.01613903045654297, -0.012044906616210938, -0.007950782775878906, -0.003856658935546875, 0.00023746490478515625, 0.0043315887451171875, 0.008425712585449219, 0.01251983642578125, 0.01661396026611328, 0.020708084106445312, 0.024802207946777344, 0.028896331787109375, 0.032990455627441406, 0.03708457946777344, 0.04117870330810547, 0.0452728271484375, 0.04936695098876953, 0.05346107482910156, 0.057555198669433594, 0.061649322509765625, 0.06574344635009766, 0.06983757019042969, 0.07393169403076172, 0.07802581787109375, 0.08211994171142578, 0.08621406555175781, 0.09030818939208984, 0.09440231323242188, 0.0984964370727539, 0.10259056091308594, 0.10668468475341797, 0.11077880859375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 2.0, 5.0, 3.0, 7.0, 8.0, 4.0, 9.0, 5.0, 13.0, 26.0, 20.0, 31.0, 40.0, 32.0, 35.0, 40.0, 50.0, 51.0, 64.0, 49.0, 55.0, 54.0, 51.0, 45.0, 51.0, 42.0, 28.0, 34.0, 36.0, 28.0, 23.0, 8.0, 7.0, 10.0, 8.0, 8.0, 4.0, 6.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.238037109375, -0.231414794921875, -0.22479248046875, -0.218170166015625, -0.2115478515625, -0.204925537109375, -0.19830322265625, -0.191680908203125, -0.18505859375, -0.178436279296875, -0.17181396484375, -0.165191650390625, -0.1585693359375, -0.151947021484375, -0.14532470703125, -0.138702392578125, -0.132080078125, -0.125457763671875, -0.11883544921875, -0.112213134765625, -0.1055908203125, -0.098968505859375, -0.09234619140625, -0.085723876953125, -0.0791015625, -0.072479248046875, -0.06585693359375, -0.059234619140625, -0.0526123046875, -0.045989990234375, -0.03936767578125, -0.032745361328125, -0.026123046875, -0.019500732421875, -0.01287841796875, -0.006256103515625, 0.0003662109375, 0.006988525390625, 0.01361083984375, 0.020233154296875, 0.02685546875, 0.033477783203125, 0.04010009765625, 0.046722412109375, 0.0533447265625, 0.059967041015625, 0.06658935546875, 0.073211669921875, 0.079833984375, 0.086456298828125, 0.09307861328125, 0.099700927734375, 0.1063232421875, 0.112945556640625, 0.11956787109375, 0.126190185546875, 0.1328125, 0.139434814453125, 0.14605712890625, 0.152679443359375, 0.1593017578125, 0.165924072265625, 0.17254638671875, 0.179168701171875, 0.185791015625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 8.0, 6.0, 20.0, 15.0, 31.0, 43.0, 33.0, 87.0, 148.0, 244.0, 431.0, 825.0, 1621.0, 3315.0, 7342.0, 18753.0, 54751.0, 202517.0, 596082.0, 107312.0, 32827.0, 12195.0, 4970.0, 2318.0, 1110.0, 667.0, 342.0, 197.0, 139.0, 81.0, 39.0, 37.0, 14.0, 16.0, 11.0, 7.0, 0.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.025390625, -0.02429962158203125, -0.0232086181640625, -0.02211761474609375, -0.021026611328125, -0.01993560791015625, -0.0188446044921875, -0.01775360107421875, -0.01666259765625, -0.01557159423828125, -0.0144805908203125, -0.01338958740234375, -0.012298583984375, -0.01120758056640625, -0.0101165771484375, -0.00902557373046875, -0.0079345703125, -0.00684356689453125, -0.0057525634765625, -0.00466156005859375, -0.003570556640625, -0.00247955322265625, -0.0013885498046875, -0.00029754638671875, 0.00079345703125, 0.00188446044921875, 0.0029754638671875, 0.00406646728515625, 0.005157470703125, 0.00624847412109375, 0.0073394775390625, 0.00843048095703125, 0.009521484375, 0.01061248779296875, 0.0117034912109375, 0.01279449462890625, 0.013885498046875, 0.01497650146484375, 0.0160675048828125, 0.01715850830078125, 0.01824951171875, 0.01934051513671875, 0.0204315185546875, 0.02152252197265625, 0.022613525390625, 0.02370452880859375, 0.0247955322265625, 0.02588653564453125, 0.0269775390625, 0.02806854248046875, 0.0291595458984375, 0.03025054931640625, 0.031341552734375, 0.03243255615234375, 0.0335235595703125, 0.03461456298828125, 0.03570556640625, 0.03679656982421875, 0.0378875732421875, 0.03897857666015625, 0.040069580078125, 0.04116058349609375, 0.0422515869140625, 0.04334259033203125, 0.04443359375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 7.0, 11.0, 12.0, 13.0, 18.0, 28.0, 35.0, 52.0, 49.0, 68.0, 72.0, 115.0, 102.0, 80.0, 71.0, 70.0, 53.0, 37.0, 29.0, 19.0, 9.0, 12.0, 8.0, 7.0, 9.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1219253540039062e-05, -2.0633451640605927e-05, -2.004764974117279e-05, -1.9461847841739655e-05, -1.887604594230652e-05, -1.8290244042873383e-05, -1.7704442143440247e-05, -1.711864024400711e-05, -1.6532838344573975e-05, -1.594703644514084e-05, -1.5361234545707703e-05, -1.4775432646274567e-05, -1.418963074684143e-05, -1.3603828847408295e-05, -1.3018026947975159e-05, -1.2432225048542023e-05, -1.1846423149108887e-05, -1.126062124967575e-05, -1.0674819350242615e-05, -1.0089017450809479e-05, -9.503215551376343e-06, -8.917413651943207e-06, -8.33161175251007e-06, -7.745809853076935e-06, -7.160007953643799e-06, -6.574206054210663e-06, -5.988404154777527e-06, -5.402602255344391e-06, -4.816800355911255e-06, -4.230998456478119e-06, -3.645196557044983e-06, -3.059394657611847e-06, -2.473592758178711e-06, -1.887790858745575e-06, -1.301988959312439e-06, -7.16187059879303e-07, -1.30385160446167e-07, 4.55416738986969e-07, 1.041218638420105e-06, 1.627020537853241e-06, 2.212822437286377e-06, 2.798624336719513e-06, 3.384426236152649e-06, 3.970228135585785e-06, 4.556030035018921e-06, 5.141831934452057e-06, 5.727633833885193e-06, 6.313435733318329e-06, 6.899237632751465e-06, 7.485039532184601e-06, 8.070841431617737e-06, 8.656643331050873e-06, 9.242445230484009e-06, 9.828247129917145e-06, 1.041404902935028e-05, 1.0999850928783417e-05, 1.1585652828216553e-05, 1.2171454727649689e-05, 1.2757256627082825e-05, 1.334305852651596e-05, 1.3928860425949097e-05, 1.4514662325382233e-05, 1.5100464224815369e-05, 1.5686266124248505e-05, 1.627206802368164e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 1.0, 3.0, 4.0, 7.0, 9.0, 19.0, 14.0, 37.0, 58.0, 118.0, 195.0, 395.0, 920.0, 2418.0, 7681.0, 33530.0, 226068.0, 687888.0, 69336.0, 13540.0, 3807.0, 1302.0, 595.0, 251.0, 138.0, 87.0, 47.0, 28.0, 28.0, 14.0, 5.0, 3.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048431396484375, -0.046651363372802734, -0.04487133026123047, -0.0430912971496582, -0.04131126403808594, -0.03953123092651367, -0.037751197814941406, -0.03597116470336914, -0.034191131591796875, -0.03241109848022461, -0.030631065368652344, -0.028851032257080078, -0.027070999145507812, -0.025290966033935547, -0.02351093292236328, -0.021730899810791016, -0.01995086669921875, -0.018170833587646484, -0.01639080047607422, -0.014610767364501953, -0.012830734252929688, -0.011050701141357422, -0.009270668029785156, -0.007490634918212891, -0.005710601806640625, -0.003930568695068359, -0.0021505355834960938, -0.0003705024719238281, 0.0014095306396484375, 0.003189563751220703, 0.004969596862792969, 0.006749629974365234, 0.0085296630859375, 0.010309696197509766, 0.012089729309082031, 0.013869762420654297, 0.015649795532226562, 0.017429828643798828, 0.019209861755371094, 0.02098989486694336, 0.022769927978515625, 0.02454996109008789, 0.026329994201660156, 0.028110027313232422, 0.029890060424804688, 0.03167009353637695, 0.03345012664794922, 0.035230159759521484, 0.03701019287109375, 0.038790225982666016, 0.04057025909423828, 0.04235029220581055, 0.04413032531738281, 0.04591035842895508, 0.047690391540527344, 0.04947042465209961, 0.051250457763671875, 0.05303049087524414, 0.054810523986816406, 0.05659055709838867, 0.05837059020996094, 0.0601506233215332, 0.06193065643310547, 0.06371068954467773, 0.06549072265625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 6.0, 6.0, 17.0, 13.0, 16.0, 30.0, 28.0, 30.0, 38.0, 60.0, 73.0, 111.0, 108.0, 101.0, 84.0, 59.0, 48.0, 27.0, 32.0, 26.0, 17.0, 15.0, 14.0, 6.0, 5.0, 6.0, 4.0, 5.0, 6.0, 2.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05499267578125, -0.0534820556640625, -0.051971435546875, -0.0504608154296875, -0.0489501953125, -0.0474395751953125, -0.045928955078125, -0.0444183349609375, -0.04290771484375, -0.0413970947265625, -0.039886474609375, -0.0383758544921875, -0.036865234375, -0.0353546142578125, -0.033843994140625, -0.0323333740234375, -0.03082275390625, -0.0293121337890625, -0.027801513671875, -0.0262908935546875, -0.0247802734375, -0.0232696533203125, -0.021759033203125, -0.0202484130859375, -0.01873779296875, -0.0172271728515625, -0.015716552734375, -0.0142059326171875, -0.0126953125, -0.0111846923828125, -0.009674072265625, -0.0081634521484375, -0.00665283203125, -0.0051422119140625, -0.003631591796875, -0.0021209716796875, -0.0006103515625, 0.0009002685546875, 0.002410888671875, 0.0039215087890625, 0.00543212890625, 0.0069427490234375, 0.008453369140625, 0.0099639892578125, 0.011474609375, 0.0129852294921875, 0.014495849609375, 0.0160064697265625, 0.01751708984375, 0.0190277099609375, 0.020538330078125, 0.0220489501953125, 0.0235595703125, 0.0250701904296875, 0.026580810546875, 0.0280914306640625, 0.02960205078125, 0.0311126708984375, 0.032623291015625, 0.0341339111328125, 0.03564453125, 0.0371551513671875, 0.038665771484375, 0.0401763916015625, 0.04168701171875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 6.0, 3.0, 3.0, 8.0, 8.0, 23.0, 39.0, 90.0, 148.0, 319.0, 190.0, 82.0, 52.0, 18.0, 7.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1870087385177612, -1.1456937789916992, -1.1043787002563477, -1.0630637407302856, -1.0217487812042236, -0.9804337024688721, -0.9391187429428101, -0.8978037238121033, -0.8564887046813965, -0.8151736855506897, -0.7738586664199829, -0.7325437068939209, -0.6912286877632141, -0.6499136686325073, -0.6085987091064453, -0.5672836899757385, -0.5259686708450317, -0.48465365171432495, -0.44333866238594055, -0.40202367305755615, -0.36070865392684937, -0.3193936347961426, -0.2780786454677582, -0.23676365613937378, -0.195448637008667, -0.1541336327791214, -0.1128186285495758, -0.07150362432003021, -0.03018862009048462, 0.011126384139060974, 0.05244138836860657, 0.09375637769699097, 0.1350712776184082, 0.1763862818479538, 0.2177012860774994, 0.2590162754058838, 0.3003312945365906, 0.34164631366729736, 0.38296130299568176, 0.42427629232406616, 0.46559131145477295, 0.5069063305854797, 0.5482213497161865, 0.5895363092422485, 0.6308513283729553, 0.6721663475036621, 0.7134813070297241, 0.7547963261604309, 0.7961113452911377, 0.8374263644218445, 0.8787413835525513, 0.9200563430786133, 0.9613713622093201, 1.0026863813400269, 1.0440013408660889, 1.0853164196014404, 1.1266313791275024, 1.1679463386535645, 1.209261417388916, 1.250576376914978, 1.29189133644104, 1.3332064151763916, 1.3745213747024536, 1.4158363342285156, 1.4571514129638672]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 4.0, 11.0, 8.0, 7.0, 9.0, 9.0, 10.0, 20.0, 7.0, 22.0, 24.0, 21.0, 24.0, 32.0, 23.0, 31.0, 50.0, 46.0, 59.0, 71.0, 76.0, 72.0, 61.0, 45.0, 28.0, 32.0, 37.0, 27.0, 16.0, 21.0, 12.0, 13.0, 15.0, 10.0, 9.0, 12.0, 8.0, 6.0, 2.0, 3.0, 2.0, 0.0, 7.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.706863284111023, -0.6832928657531738, -0.6597223877906799, -0.6361519694328308, -0.6125814914703369, -0.5890110731124878, -0.5654406547546387, -0.5418702363967896, -0.5182997584342957, -0.49472931027412415, -0.47115886211395264, -0.4475884437561035, -0.424017995595932, -0.4004475474357605, -0.3768771290779114, -0.35330668091773987, -0.32973623275756836, -0.30616578459739685, -0.28259533643722534, -0.2590249180793762, -0.2354544699192047, -0.2118840217590332, -0.1883135885000229, -0.16474315524101257, -0.14117270708084106, -0.11760226637125015, -0.09403182566165924, -0.07046138495206833, -0.04689094424247742, -0.023320503532886505, 0.00024993717670440674, 0.02382037043571472, 0.04739081859588623, 0.07096125930547714, 0.09453170001506805, 0.11810214072465897, 0.14167258143424988, 0.1652430295944214, 0.1888134628534317, 0.21238389611244202, 0.23595434427261353, 0.25952479243278503, 0.28309524059295654, 0.30666565895080566, 0.3302361071109772, 0.3538065552711487, 0.3773769736289978, 0.4009474217891693, 0.4245178699493408, 0.44808831810951233, 0.47165876626968384, 0.49522918462753296, 0.5187996625900269, 0.542370080947876, 0.5659404993057251, 0.5895109176635742, 0.6130813956260681, 0.6366518139839172, 0.6602222919464111, 0.6837927103042603, 0.7073631286621094, 0.7309336066246033, 0.7545040249824524, 0.7780745029449463, 0.8016449213027954]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 2.0, 2.0, 6.0, 6.0, 8.0, 16.0, 23.0, 34.0, 45.0, 63.0, 133.0, 186.0, 326.0, 539.0, 944.0, 1787.0, 3716.0, 8684.0, 24871.0, 104970.0, 705011.0, 2558197.0, 650420.0, 95682.0, 22690.0, 8050.0, 3556.0, 1819.0, 946.0, 591.0, 378.0, 195.0, 121.0, 85.0, 64.0, 29.0, 34.0, 20.0, 19.0, 12.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06561279296875, -0.06322479248046875, -0.0608367919921875, -0.05844879150390625, -0.056060791015625, -0.05367279052734375, -0.0512847900390625, -0.04889678955078125, -0.0465087890625, -0.04412078857421875, -0.0417327880859375, -0.03934478759765625, -0.036956787109375, -0.03456878662109375, -0.0321807861328125, -0.02979278564453125, -0.02740478515625, -0.02501678466796875, -0.0226287841796875, -0.02024078369140625, -0.017852783203125, -0.01546478271484375, -0.0130767822265625, -0.01068878173828125, -0.00830078125, -0.00591278076171875, -0.0035247802734375, -0.00113677978515625, 0.001251220703125, 0.00363922119140625, 0.0060272216796875, 0.00841522216796875, 0.01080322265625, 0.01319122314453125, 0.0155792236328125, 0.01796722412109375, 0.020355224609375, 0.02274322509765625, 0.0251312255859375, 0.02751922607421875, 0.0299072265625, 0.03229522705078125, 0.0346832275390625, 0.03707122802734375, 0.039459228515625, 0.04184722900390625, 0.0442352294921875, 0.04662322998046875, 0.04901123046875, 0.05139923095703125, 0.0537872314453125, 0.05617523193359375, 0.058563232421875, 0.06095123291015625, 0.0633392333984375, 0.06572723388671875, 0.068115234375, 0.07050323486328125, 0.0728912353515625, 0.07527923583984375, 0.077667236328125, 0.08005523681640625, 0.0824432373046875, 0.08483123779296875, 0.08721923828125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 3.0, 2.0, 7.0, 6.0, 11.0, 11.0, 8.0, 13.0, 17.0, 21.0, 18.0, 22.0, 25.0, 30.0, 40.0, 48.0, 52.0, 44.0, 46.0, 34.0, 37.0, 49.0, 37.0, 31.0, 45.0, 45.0, 33.0, 39.0, 35.0, 25.0, 23.0, 13.0, 25.0, 20.0, 11.0, 10.0, 15.0, 10.0, 8.0, 8.0, 3.0, 3.0, 4.0, 7.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04779052734375, -0.04626941680908203, -0.04474830627441406, -0.043227195739746094, -0.041706085205078125, -0.040184974670410156, -0.03866386413574219, -0.03714275360107422, -0.03562164306640625, -0.03410053253173828, -0.03257942199707031, -0.031058311462402344, -0.029537200927734375, -0.028016090393066406, -0.026494979858398438, -0.02497386932373047, -0.0234527587890625, -0.02193164825439453, -0.020410537719726562, -0.018889427185058594, -0.017368316650390625, -0.015847206115722656, -0.014326095581054688, -0.012804985046386719, -0.01128387451171875, -0.009762763977050781, -0.008241653442382812, -0.006720542907714844, -0.005199432373046875, -0.0036783218383789062, -0.0021572113037109375, -0.0006361007690429688, 0.000885009765625, 0.0024061203002929688, 0.0039272308349609375, 0.005448341369628906, 0.006969451904296875, 0.008490562438964844, 0.010011672973632812, 0.011532783508300781, 0.01305389404296875, 0.014575004577636719, 0.016096115112304688, 0.017617225646972656, 0.019138336181640625, 0.020659446716308594, 0.022180557250976562, 0.02370166778564453, 0.0252227783203125, 0.02674388885498047, 0.028264999389648438, 0.029786109924316406, 0.031307220458984375, 0.032828330993652344, 0.03434944152832031, 0.03587055206298828, 0.03739166259765625, 0.03891277313232422, 0.04043388366699219, 0.041954994201660156, 0.043476104736328125, 0.044997215270996094, 0.04651832580566406, 0.04803943634033203, 0.049560546875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 9.0, 8.0, 16.0, 22.0, 42.0, 76.0, 134.0, 296.0, 890.0, 5281.0, 107682.0, 3944523.0, 127618.0, 6108.0, 970.0, 279.0, 138.0, 78.0, 47.0, 32.0, 12.0, 11.0, 4.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32763671875, -0.3197460174560547, -0.3118553161621094, -0.30396461486816406, -0.29607391357421875, -0.28818321228027344, -0.2802925109863281, -0.2724018096923828, -0.2645111083984375, -0.2566204071044922, -0.24872970581054688, -0.24083900451660156, -0.23294830322265625, -0.22505760192871094, -0.21716690063476562, -0.2092761993408203, -0.201385498046875, -0.1934947967529297, -0.18560409545898438, -0.17771339416503906, -0.16982269287109375, -0.16193199157714844, -0.15404129028320312, -0.1461505889892578, -0.1382598876953125, -0.1303691864013672, -0.12247848510742188, -0.11458778381347656, -0.10669708251953125, -0.09880638122558594, -0.09091567993164062, -0.08302497863769531, -0.07513427734375, -0.06724357604980469, -0.059352874755859375, -0.05146217346191406, -0.04357147216796875, -0.03568077087402344, -0.027790069580078125, -0.019899368286132812, -0.0120086669921875, -0.0041179656982421875, 0.003772735595703125, 0.011663436889648438, 0.01955413818359375, 0.027444839477539062, 0.035335540771484375, 0.04322624206542969, 0.051116943359375, 0.05900764465332031, 0.06689834594726562, 0.07478904724121094, 0.08267974853515625, 0.09057044982910156, 0.09846115112304688, 0.10635185241699219, 0.1142425537109375, 0.12213325500488281, 0.13002395629882812, 0.13791465759277344, 0.14580535888671875, 0.15369606018066406, 0.16158676147460938, 0.1694774627685547, 0.1773681640625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 6.0, 11.0, 10.0, 8.0, 18.0, 23.0, 29.0, 28.0, 45.0, 49.0, 92.0, 123.0, 151.0, 228.0, 352.0, 453.0, 594.0, 536.0, 402.0, 271.0, 189.0, 120.0, 74.0, 56.0, 49.0, 30.0, 24.0, 18.0, 22.0, 13.0, 9.0, 6.0, 7.0, 2.0, 5.0, 3.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08837890625, -0.0852975845336914, -0.08221626281738281, -0.07913494110107422, -0.07605361938476562, -0.07297229766845703, -0.06989097595214844, -0.06680965423583984, -0.06372833251953125, -0.060647010803222656, -0.05756568908691406, -0.05448436737060547, -0.051403045654296875, -0.04832172393798828, -0.04524040222167969, -0.042159080505371094, -0.0390777587890625, -0.035996437072753906, -0.03291511535644531, -0.02983379364013672, -0.026752471923828125, -0.02367115020751953, -0.020589828491210938, -0.017508506774902344, -0.01442718505859375, -0.011345863342285156, -0.008264541625976562, -0.005183219909667969, -0.002101898193359375, 0.0009794235229492188, 0.0040607452392578125, 0.007142066955566406, 0.010223388671875, 0.013304710388183594, 0.016386032104492188, 0.01946735382080078, 0.022548675537109375, 0.02562999725341797, 0.028711318969726562, 0.031792640686035156, 0.03487396240234375, 0.037955284118652344, 0.04103660583496094, 0.04411792755126953, 0.047199249267578125, 0.05028057098388672, 0.05336189270019531, 0.056443214416503906, 0.0595245361328125, 0.0626058578491211, 0.06568717956542969, 0.06876850128173828, 0.07184982299804688, 0.07493114471435547, 0.07801246643066406, 0.08109378814697266, 0.08417510986328125, 0.08725643157958984, 0.09033775329589844, 0.09341907501220703, 0.09650039672851562, 0.09958171844482422, 0.10266304016113281, 0.1057443618774414, 0.10882568359375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 4.0, 5.0, 12.0, 17.0, 34.0, 61.0, 100.0, 141.0, 157.0, 165.0, 119.0, 74.0, 45.0, 23.0, 13.0, 12.0, 7.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3923041820526123, -1.3603432178497314, -1.3283822536468506, -1.2964212894439697, -1.2644603252410889, -1.2324994802474976, -1.2005385160446167, -1.1685775518417358, -1.136616587638855, -1.1046556234359741, -1.0726946592330933, -1.0407336950302124, -1.008772850036621, -0.9768118262290955, -0.9448509216308594, -0.9128899574279785, -0.8809289932250977, -0.8489680290222168, -0.8170070648193359, -0.7850461602210999, -0.753085196018219, -0.7211242318153381, -0.689163327217102, -0.6572023630142212, -0.6252413988113403, -0.5932804346084595, -0.5613194704055786, -0.5293585658073425, -0.49739760160446167, -0.4654366374015808, -0.43347570300102234, -0.40151476860046387, -0.3695538640022278, -0.3375928997993469, -0.30563196539878845, -0.27367103099823, -0.24171006679534912, -0.20974911749362946, -0.1777881681919098, -0.14582721889019012, -0.11386626958847046, -0.0819053202867508, -0.04994437098503113, -0.017983421683311462, 0.013977527618408203, 0.04593847692012787, 0.07789942622184753, 0.1098603755235672, 0.14182132482528687, 0.17378227412700653, 0.2057432234287262, 0.23770417273044586, 0.2696651220321655, 0.3016260862350464, 0.33358702063560486, 0.36554795503616333, 0.3975089192390442, 0.42946988344192505, 0.4614308178424835, 0.493391752243042, 0.5253527164459229, 0.5573136806488037, 0.5892746448516846, 0.6212355494499207, 0.6531965136528015]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 7.0, 6.0, 1.0, 5.0, 3.0, 7.0, 14.0, 7.0, 15.0, 10.0, 18.0, 14.0, 22.0, 21.0, 29.0, 26.0, 23.0, 29.0, 37.0, 41.0, 39.0, 55.0, 42.0, 37.0, 44.0, 39.0, 44.0, 29.0, 34.0, 36.0, 29.0, 29.0, 26.0, 34.0, 22.0, 16.0, 21.0, 13.0, 16.0, 11.0, 14.0, 7.0, 9.0, 4.0, 5.0, 9.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.4441753029823303, -0.4309903681278229, -0.41780543327331543, -0.404620498418808, -0.39143556356430054, -0.3782505989074707, -0.36506566405296326, -0.3518807291984558, -0.33869579434394836, -0.3255108594894409, -0.31232592463493347, -0.299140989780426, -0.2859560251235962, -0.27277112007141113, -0.2595861554145813, -0.24640122056007385, -0.2332162857055664, -0.22003135085105896, -0.2068464159965515, -0.19366146624088287, -0.18047653138637543, -0.16729159653186798, -0.15410664677619934, -0.1409217119216919, -0.12773677706718445, -0.114551842212677, -0.10136689990758896, -0.08818195760250092, -0.07499702274799347, -0.06181208789348602, -0.04862714558839798, -0.035442203283309937, -0.02225726842880249, -0.009072329849004745, 0.004112608730792999, 0.017297547310590744, 0.03048248589038849, 0.043667420744895935, 0.05685236304998398, 0.07003730535507202, 0.08322224020957947, 0.09640717506408691, 0.10959211736917496, 0.122777059674263, 0.13596199452877045, 0.1491469293832779, 0.16233187913894653, 0.17551681399345398, 0.18870174884796143, 0.20188668370246887, 0.21507161855697632, 0.22825656831264496, 0.2414415031671524, 0.25462645292282104, 0.2678113877773285, 0.28099632263183594, 0.2941812574863434, 0.30736619234085083, 0.3205511271953583, 0.3337360620498657, 0.34692102670669556, 0.3601059317588806, 0.37329089641571045, 0.3864758312702179, 0.39966076612472534]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 9.0, 4.0, 8.0, 8.0, 18.0, 30.0, 36.0, 55.0, 81.0, 150.0, 208.0, 379.0, 642.0, 1222.0, 2377.0, 5110.0, 12100.0, 29815.0, 86796.0, 294932.0, 407995.0, 133728.0, 43036.0, 16380.0, 6750.0, 3156.0, 1563.0, 805.0, 456.0, 255.0, 163.0, 99.0, 69.0, 43.0, 30.0, 22.0, 16.0, 11.0, 4.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.09588623046875, -0.09323596954345703, -0.09058570861816406, -0.0879354476928711, -0.08528518676757812, -0.08263492584228516, -0.07998466491699219, -0.07733440399169922, -0.07468414306640625, -0.07203388214111328, -0.06938362121582031, -0.06673336029052734, -0.06408309936523438, -0.061432838439941406, -0.05878257751464844, -0.05613231658935547, -0.0534820556640625, -0.05083179473876953, -0.04818153381347656, -0.045531272888183594, -0.042881011962890625, -0.040230751037597656, -0.03758049011230469, -0.03493022918701172, -0.03227996826171875, -0.02962970733642578, -0.026979446411132812, -0.024329185485839844, -0.021678924560546875, -0.019028663635253906, -0.016378402709960938, -0.013728141784667969, -0.011077880859375, -0.008427619934082031, -0.0057773590087890625, -0.0031270980834960938, -0.000476837158203125, 0.0021734237670898438, 0.0048236846923828125, 0.007473945617675781, 0.01012420654296875, 0.012774467468261719, 0.015424728393554688, 0.018074989318847656, 0.020725250244140625, 0.023375511169433594, 0.026025772094726562, 0.02867603302001953, 0.0313262939453125, 0.03397655487060547, 0.03662681579589844, 0.039277076721191406, 0.041927337646484375, 0.044577598571777344, 0.04722785949707031, 0.04987812042236328, 0.05252838134765625, 0.05517864227294922, 0.05782890319824219, 0.060479164123535156, 0.06312942504882812, 0.0657796859741211, 0.06842994689941406, 0.07108020782470703, 0.07373046875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 4.0, 6.0, 9.0, 6.0, 7.0, 7.0, 8.0, 13.0, 12.0, 20.0, 12.0, 17.0, 24.0, 28.0, 22.0, 30.0, 34.0, 37.0, 39.0, 44.0, 41.0, 35.0, 51.0, 39.0, 37.0, 35.0, 42.0, 53.0, 39.0, 23.0, 32.0, 32.0, 19.0, 26.0, 15.0, 24.0, 10.0, 7.0, 11.0, 9.0, 11.0, 5.0, 7.0, 8.0, 3.0, 3.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04931640625, -0.04781532287597656, -0.046314239501953125, -0.04481315612792969, -0.04331207275390625, -0.04181098937988281, -0.040309906005859375, -0.03880882263183594, -0.0373077392578125, -0.03580665588378906, -0.034305572509765625, -0.03280448913574219, -0.03130340576171875, -0.029802322387695312, -0.028301239013671875, -0.026800155639648438, -0.025299072265625, -0.023797988891601562, -0.022296905517578125, -0.020795822143554688, -0.01929473876953125, -0.017793655395507812, -0.016292572021484375, -0.014791488647460938, -0.0132904052734375, -0.011789321899414062, -0.010288238525390625, -0.008787155151367188, -0.00728607177734375, -0.0057849884033203125, -0.004283905029296875, -0.0027828216552734375, -0.00128173828125, 0.0002193450927734375, 0.001720428466796875, 0.0032215118408203125, 0.00472259521484375, 0.0062236785888671875, 0.007724761962890625, 0.009225845336914062, 0.0107269287109375, 0.012228012084960938, 0.013729095458984375, 0.015230178833007812, 0.01673126220703125, 0.018232345581054688, 0.019733428955078125, 0.021234512329101562, 0.022735595703125, 0.024236679077148438, 0.025737762451171875, 0.027238845825195312, 0.02873992919921875, 0.030241012573242188, 0.031742095947265625, 0.03324317932128906, 0.0347442626953125, 0.03624534606933594, 0.037746429443359375, 0.03924751281738281, 0.04074859619140625, 0.04224967956542969, 0.043750762939453125, 0.04525184631347656, 0.0467529296875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 7.0, 6.0, 1.0, 12.0, 20.0, 21.0, 23.0, 32.0, 55.0, 95.0, 131.0, 214.0, 344.0, 651.0, 1283.0, 3048.0, 8928.0, 34519.0, 219314.0, 690311.0, 67077.0, 14234.0, 4379.0, 1830.0, 828.0, 448.0, 241.0, 185.0, 119.0, 57.0, 44.0, 33.0, 26.0, 13.0, 6.0, 8.0, 4.0, 3.0, 4.0, 6.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1431884765625, -0.13923263549804688, -0.13527679443359375, -0.13132095336914062, -0.1273651123046875, -0.12340927124023438, -0.11945343017578125, -0.11549758911132812, -0.111541748046875, -0.10758590698242188, -0.10363006591796875, -0.09967422485351562, -0.0957183837890625, -0.09176254272460938, -0.08780670166015625, -0.08385086059570312, -0.07989501953125, -0.07593917846679688, -0.07198333740234375, -0.06802749633789062, -0.0640716552734375, -0.060115814208984375, -0.05615997314453125, -0.052204132080078125, -0.048248291015625, -0.044292449951171875, -0.04033660888671875, -0.036380767822265625, -0.0324249267578125, -0.028469085693359375, -0.02451324462890625, -0.020557403564453125, -0.0166015625, -0.012645721435546875, -0.00868988037109375, -0.004734039306640625, -0.0007781982421875, 0.003177642822265625, 0.00713348388671875, 0.011089324951171875, 0.015045166015625, 0.019001007080078125, 0.02295684814453125, 0.026912689208984375, 0.0308685302734375, 0.034824371337890625, 0.03878021240234375, 0.042736053466796875, 0.04669189453125, 0.050647735595703125, 0.05460357666015625, 0.058559417724609375, 0.0625152587890625, 0.06647109985351562, 0.07042694091796875, 0.07438278198242188, 0.078338623046875, 0.08229446411132812, 0.08625030517578125, 0.09020614624023438, 0.0941619873046875, 0.09811782836914062, 0.10207366943359375, 0.10602951049804688, 0.1099853515625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 10.0, 5.0, 8.0, 10.0, 13.0, 14.0, 23.0, 26.0, 27.0, 38.0, 49.0, 55.0, 60.0, 62.0, 59.0, 73.0, 65.0, 52.0, 50.0, 62.0, 31.0, 45.0, 36.0, 29.0, 29.0, 25.0, 6.0, 9.0, 9.0, 3.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.314208984375, -0.3063220977783203, -0.2984352111816406, -0.29054832458496094, -0.28266143798828125, -0.27477455139160156, -0.2668876647949219, -0.2590007781982422, -0.2511138916015625, -0.2432270050048828, -0.23534011840820312, -0.22745323181152344, -0.21956634521484375, -0.21167945861816406, -0.20379257202148438, -0.1959056854248047, -0.188018798828125, -0.1801319122314453, -0.17224502563476562, -0.16435813903808594, -0.15647125244140625, -0.14858436584472656, -0.14069747924804688, -0.1328105926513672, -0.1249237060546875, -0.11703681945800781, -0.10914993286132812, -0.10126304626464844, -0.09337615966796875, -0.08548927307128906, -0.07760238647460938, -0.06971549987792969, -0.06182861328125, -0.05394172668457031, -0.046054840087890625, -0.03816795349121094, -0.03028106689453125, -0.022394180297851562, -0.014507293701171875, -0.0066204071044921875, 0.0012664794921875, 0.009153366088867188, 0.017040252685546875, 0.024927139282226562, 0.03281402587890625, 0.04070091247558594, 0.048587799072265625, 0.05647468566894531, 0.064361572265625, 0.07224845886230469, 0.08013534545898438, 0.08802223205566406, 0.09590911865234375, 0.10379600524902344, 0.11168289184570312, 0.11956977844238281, 0.1274566650390625, 0.1353435516357422, 0.14323043823242188, 0.15111732482910156, 0.15900421142578125, 0.16689109802246094, 0.17477798461914062, 0.1826648712158203, 0.1905517578125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 6.0, 9.0, 14.0, 13.0, 28.0, 38.0, 54.0, 86.0, 128.0, 245.0, 538.0, 1256.0, 3009.0, 8354.0, 27160.0, 117923.0, 702873.0, 140075.0, 31250.0, 9512.0, 3307.0, 1379.0, 582.0, 290.0, 156.0, 90.0, 60.0, 37.0, 26.0, 15.0, 7.0, 9.0, 8.0, 4.0, 1.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034759521484375, -0.033621788024902344, -0.03248405456542969, -0.03134632110595703, -0.030208587646484375, -0.02907085418701172, -0.027933120727539062, -0.026795387268066406, -0.02565765380859375, -0.024519920349121094, -0.023382186889648438, -0.02224445343017578, -0.021106719970703125, -0.01996898651123047, -0.018831253051757812, -0.017693519592285156, -0.0165557861328125, -0.015418052673339844, -0.014280319213867188, -0.013142585754394531, -0.012004852294921875, -0.010867118835449219, -0.009729385375976562, -0.008591651916503906, -0.00745391845703125, -0.006316184997558594, -0.0051784515380859375, -0.004040718078613281, -0.002902984619140625, -0.0017652511596679688, -0.0006275177001953125, 0.0005102157592773438, 0.00164794921875, 0.0027856826782226562, 0.0039234161376953125, 0.005061149597167969, 0.006198883056640625, 0.007336616516113281, 0.008474349975585938, 0.009612083435058594, 0.01074981689453125, 0.011887550354003906, 0.013025283813476562, 0.014163017272949219, 0.015300750732421875, 0.01643848419189453, 0.017576217651367188, 0.018713951110839844, 0.0198516845703125, 0.020989418029785156, 0.022127151489257812, 0.02326488494873047, 0.024402618408203125, 0.02554035186767578, 0.026678085327148438, 0.027815818786621094, 0.02895355224609375, 0.030091285705566406, 0.031229019165039062, 0.03236675262451172, 0.033504486083984375, 0.03464221954345703, 0.03577995300292969, 0.036917686462402344, 0.038055419921875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 4.0, 6.0, 4.0, 7.0, 7.0, 11.0, 14.0, 16.0, 22.0, 24.0, 48.0, 53.0, 85.0, 88.0, 92.0, 103.0, 87.0, 80.0, 54.0, 51.0, 27.0, 21.0, 26.0, 11.0, 13.0, 5.0, 9.0, 12.0, 6.0, 7.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.531839370727539e-05, -1.471489667892456e-05, -1.411139965057373e-05, -1.35079026222229e-05, -1.290440559387207e-05, -1.230090856552124e-05, -1.169741153717041e-05, -1.109391450881958e-05, -1.049041748046875e-05, -9.88692045211792e-06, -9.28342342376709e-06, -8.67992639541626e-06, -8.07642936706543e-06, -7.4729323387146e-06, -6.8694353103637695e-06, -6.2659382820129395e-06, -5.662441253662109e-06, -5.058944225311279e-06, -4.455447196960449e-06, -3.851950168609619e-06, -3.248453140258789e-06, -2.644956111907959e-06, -2.041459083557129e-06, -1.4379620552062988e-06, -8.344650268554688e-07, -2.3096799850463867e-07, 3.725290298461914e-07, 9.760260581970215e-07, 1.5795230865478516e-06, 2.1830201148986816e-06, 2.7865171432495117e-06, 3.390014171600342e-06, 3.993511199951172e-06, 4.597008228302002e-06, 5.200505256652832e-06, 5.804002285003662e-06, 6.407499313354492e-06, 7.010996341705322e-06, 7.614493370056152e-06, 8.217990398406982e-06, 8.821487426757812e-06, 9.424984455108643e-06, 1.0028481483459473e-05, 1.0631978511810303e-05, 1.1235475540161133e-05, 1.1838972568511963e-05, 1.2442469596862793e-05, 1.3045966625213623e-05, 1.3649463653564453e-05, 1.4252960681915283e-05, 1.4856457710266113e-05, 1.5459954738616943e-05, 1.6063451766967773e-05, 1.6666948795318604e-05, 1.7270445823669434e-05, 1.7873942852020264e-05, 1.8477439880371094e-05, 1.9080936908721924e-05, 1.9684433937072754e-05, 2.0287930965423584e-05, 2.0891427993774414e-05, 2.1494925022125244e-05, 2.2098422050476074e-05, 2.2701919078826904e-05, 2.3305416107177734e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 4.0, 10.0, 12.0, 16.0, 23.0, 33.0, 36.0, 52.0, 100.0, 149.0, 267.0, 445.0, 803.0, 1574.0, 3428.0, 8035.0, 21706.0, 72809.0, 416582.0, 412823.0, 72797.0, 21791.0, 8140.0, 3464.0, 1519.0, 763.0, 424.0, 262.0, 152.0, 117.0, 92.0, 36.0, 19.0, 19.0, 7.0, 10.0, 7.0, 5.0, 10.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0295562744140625, -0.02860283851623535, -0.027649402618408203, -0.026695966720581055, -0.025742530822753906, -0.024789094924926758, -0.02383565902709961, -0.02288222312927246, -0.021928787231445312, -0.020975351333618164, -0.020021915435791016, -0.019068479537963867, -0.01811504364013672, -0.01716160774230957, -0.016208171844482422, -0.015254735946655273, -0.014301300048828125, -0.013347864151000977, -0.012394428253173828, -0.01144099235534668, -0.010487556457519531, -0.009534120559692383, -0.008580684661865234, -0.007627248764038086, -0.0066738128662109375, -0.005720376968383789, -0.004766941070556641, -0.003813505172729492, -0.0028600692749023438, -0.0019066333770751953, -0.0009531974792480469, 2.384185791015625e-07, 0.00095367431640625, 0.0019071102142333984, 0.002860546112060547, 0.0038139820098876953, 0.004767417907714844, 0.005720853805541992, 0.006674289703369141, 0.007627725601196289, 0.008581161499023438, 0.009534597396850586, 0.010488033294677734, 0.011441469192504883, 0.012394905090332031, 0.01334834098815918, 0.014301776885986328, 0.015255212783813477, 0.016208648681640625, 0.017162084579467773, 0.018115520477294922, 0.01906895637512207, 0.02002239227294922, 0.020975828170776367, 0.021929264068603516, 0.022882699966430664, 0.023836135864257812, 0.02478957176208496, 0.02574300765991211, 0.026696443557739258, 0.027649879455566406, 0.028603315353393555, 0.029556751251220703, 0.03051018714904785, 0.031463623046875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 3.0, 6.0, 6.0, 2.0, 17.0, 8.0, 23.0, 20.0, 27.0, 30.0, 43.0, 54.0, 61.0, 92.0, 84.0, 94.0, 74.0, 76.0, 64.0, 48.0, 45.0, 27.0, 21.0, 10.0, 15.0, 5.0, 14.0, 13.0, 5.0, 3.0, 2.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034423828125, -0.033111572265625, -0.03179931640625, -0.030487060546875, -0.0291748046875, -0.027862548828125, -0.02655029296875, -0.025238037109375, -0.02392578125, -0.022613525390625, -0.02130126953125, -0.019989013671875, -0.0186767578125, -0.017364501953125, -0.01605224609375, -0.014739990234375, -0.013427734375, -0.012115478515625, -0.01080322265625, -0.009490966796875, -0.0081787109375, -0.006866455078125, -0.00555419921875, -0.004241943359375, -0.0029296875, -0.001617431640625, -0.00030517578125, 0.001007080078125, 0.0023193359375, 0.003631591796875, 0.00494384765625, 0.006256103515625, 0.007568359375, 0.008880615234375, 0.01019287109375, 0.011505126953125, 0.0128173828125, 0.014129638671875, 0.01544189453125, 0.016754150390625, 0.01806640625, 0.019378662109375, 0.02069091796875, 0.022003173828125, 0.0233154296875, 0.024627685546875, 0.02593994140625, 0.027252197265625, 0.028564453125, 0.029876708984375, 0.03118896484375, 0.032501220703125, 0.0338134765625, 0.035125732421875, 0.03643798828125, 0.037750244140625, 0.0390625, 0.040374755859375, 0.04168701171875, 0.042999267578125, 0.0443115234375, 0.045623779296875, 0.04693603515625, 0.048248291015625, 0.049560546875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 7.0, 18.0, 29.0, 70.0, 205.0, 399.0, 148.0, 75.0, 29.0, 11.0, 4.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.105802059173584, -2.052506923675537, -1.9992116689682007, -1.9459164142608643, -1.8926211595535278, -1.8393259048461914, -1.7860307693481445, -1.732735514640808, -1.6794402599334717, -1.6261450052261353, -1.5728498697280884, -1.519554615020752, -1.4662593603134155, -1.412964105606079, -1.3596689701080322, -1.3063737154006958, -1.253078579902649, -1.1997833251953125, -1.1464881896972656, -1.0931929349899292, -1.0398976802825928, -0.9866024851799011, -0.9333072900772095, -0.880012035369873, -0.8267168402671814, -0.7734216451644897, -0.7201263904571533, -0.6668311953544617, -0.61353600025177, -0.5602407455444336, -0.5069455504417419, -0.4536503255367279, -0.4003552198410034, -0.3470599949359894, -0.29376477003097534, -0.2404695749282837, -0.18717435002326965, -0.13387912511825562, -0.08058393001556396, -0.027288705110549927, 0.02600651979446411, 0.07930173724889755, 0.132596954703331, 0.18589216470718384, 0.23918738961219788, 0.2924826145172119, 0.34577780961990356, 0.3990730345249176, 0.45236825942993164, 0.5056634545326233, 0.5589587092399597, 0.6122539043426514, 0.6655491590499878, 0.7188443541526794, 0.7721395492553711, 0.8254348039627075, 0.8787299990653992, 0.9320251941680908, 0.9853204488754272, 1.0386157035827637, 1.0919108390808105, 1.145206093788147, 1.1985013484954834, 1.2517964839935303, 1.3050917387008667]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 4.0, 8.0, 4.0, 9.0, 8.0, 11.0, 14.0, 19.0, 20.0, 28.0, 22.0, 29.0, 28.0, 49.0, 59.0, 80.0, 94.0, 89.0, 78.0, 50.0, 37.0, 40.0, 32.0, 23.0, 27.0, 16.0, 23.0, 13.0, 21.0, 10.0, 10.0, 7.0, 11.0, 7.0, 4.0, 2.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.8954162001609802, -0.8705326318740845, -0.845649003982544, -0.8207653760910034, -0.7958818078041077, -0.7709982395172119, -0.7461146116256714, -0.7212309837341309, -0.6963474154472351, -0.6714638471603394, -0.6465802192687988, -0.6216965913772583, -0.5968130230903625, -0.5719294548034668, -0.5470458269119263, -0.5221621990203857, -0.49727863073349, -0.47239503264427185, -0.4475114345550537, -0.42262783646583557, -0.39774423837661743, -0.3728606402873993, -0.34797704219818115, -0.323093444108963, -0.2982098460197449, -0.27332624793052673, -0.2484426498413086, -0.22355905175209045, -0.19867545366287231, -0.17379185557365417, -0.14890825748443604, -0.1240246593952179, -0.09914106130599976, -0.07425746321678162, -0.04937386512756348, -0.024490267038345337, 0.00039333105087280273, 0.025276929140090942, 0.05016052722930908, 0.07504412531852722, 0.09992772340774536, 0.1248113214969635, 0.14969491958618164, 0.17457851767539978, 0.19946211576461792, 0.22434571385383606, 0.2492293119430542, 0.27411291003227234, 0.2989965081214905, 0.3238801062107086, 0.34876370429992676, 0.3736473023891449, 0.39853090047836304, 0.4234144985675812, 0.4482980966567993, 0.47318169474601746, 0.4980652928352356, 0.5229488611221313, 0.5478324890136719, 0.5727161169052124, 0.5975996851921082, 0.6224832534790039, 0.6473668813705444, 0.672250509262085, 0.6971340775489807]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 10.0, 13.0, 10.0, 21.0, 38.0, 55.0, 83.0, 155.0, 250.0, 396.0, 760.0, 1435.0, 2897.0, 6542.0, 17188.0, 54241.0, 223531.0, 1077675.0, 2029715.0, 600563.0, 122850.0, 33320.0, 12165.0, 4974.0, 2381.0, 1245.0, 649.0, 371.0, 255.0, 163.0, 105.0, 75.0, 45.0, 38.0, 19.0, 17.0, 6.0, 11.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.099365234375, -0.0961923599243164, -0.09301948547363281, -0.08984661102294922, -0.08667373657226562, -0.08350086212158203, -0.08032798767089844, -0.07715511322021484, -0.07398223876953125, -0.07080936431884766, -0.06763648986816406, -0.06446361541748047, -0.061290740966796875, -0.05811786651611328, -0.05494499206542969, -0.051772117614746094, -0.0485992431640625, -0.045426368713378906, -0.04225349426269531, -0.03908061981201172, -0.035907745361328125, -0.03273487091064453, -0.029561996459960938, -0.026389122009277344, -0.02321624755859375, -0.020043373107910156, -0.016870498657226562, -0.013697624206542969, -0.010524749755859375, -0.007351875305175781, -0.0041790008544921875, -0.0010061264038085938, 0.002166748046875, 0.005339622497558594, 0.008512496948242188, 0.011685371398925781, 0.014858245849609375, 0.01803112030029297, 0.021203994750976562, 0.024376869201660156, 0.02754974365234375, 0.030722618103027344, 0.03389549255371094, 0.03706836700439453, 0.040241241455078125, 0.04341411590576172, 0.04658699035644531, 0.049759864807128906, 0.0529327392578125, 0.056105613708496094, 0.05927848815917969, 0.06245136260986328, 0.06562423706054688, 0.06879711151123047, 0.07196998596191406, 0.07514286041259766, 0.07831573486328125, 0.08148860931396484, 0.08466148376464844, 0.08783435821533203, 0.09100723266601562, 0.09418010711669922, 0.09735298156738281, 0.1005258560180664, 0.10369873046875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 3.0, 3.0, 4.0, 3.0, 7.0, 8.0, 7.0, 12.0, 10.0, 13.0, 17.0, 24.0, 20.0, 22.0, 32.0, 33.0, 28.0, 37.0, 44.0, 38.0, 42.0, 41.0, 39.0, 46.0, 50.0, 50.0, 37.0, 36.0, 36.0, 31.0, 29.0, 34.0, 24.0, 26.0, 18.0, 24.0, 9.0, 11.0, 12.0, 7.0, 14.0, 5.0, 2.0, 1.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04644775390625, -0.044939517974853516, -0.04343128204345703, -0.04192304611206055, -0.04041481018066406, -0.03890657424926758, -0.037398338317871094, -0.03589010238647461, -0.034381866455078125, -0.03287363052368164, -0.031365394592285156, -0.029857158660888672, -0.028348922729492188, -0.026840686798095703, -0.02533245086669922, -0.023824214935302734, -0.02231597900390625, -0.020807743072509766, -0.01929950714111328, -0.017791271209716797, -0.016283035278320312, -0.014774799346923828, -0.013266563415527344, -0.01175832748413086, -0.010250091552734375, -0.00874185562133789, -0.007233619689941406, -0.005725383758544922, -0.0042171478271484375, -0.002708911895751953, -0.0012006759643554688, 0.0003075599670410156, 0.0018157958984375, 0.0033240318298339844, 0.004832267761230469, 0.006340503692626953, 0.007848739624023438, 0.009356975555419922, 0.010865211486816406, 0.01237344741821289, 0.013881683349609375, 0.01538991928100586, 0.016898155212402344, 0.018406391143798828, 0.019914627075195312, 0.021422863006591797, 0.02293109893798828, 0.024439334869384766, 0.02594757080078125, 0.027455806732177734, 0.02896404266357422, 0.030472278594970703, 0.03198051452636719, 0.03348875045776367, 0.034996986389160156, 0.03650522232055664, 0.038013458251953125, 0.03952169418334961, 0.041029930114746094, 0.04253816604614258, 0.04404640197753906, 0.04555463790893555, 0.04706287384033203, 0.048571109771728516, 0.050079345703125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 6.0, 14.0, 15.0, 20.0, 40.0, 44.0, 88.0, 108.0, 175.0, 262.0, 508.0, 1131.0, 3232.0, 16470.0, 776648.0, 3353766.0, 34159.0, 4675.0, 1392.0, 663.0, 318.0, 176.0, 110.0, 83.0, 52.0, 24.0, 28.0, 16.0, 12.0, 15.0, 8.0, 3.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.434326171875, -0.4223060607910156, -0.41028594970703125, -0.3982658386230469, -0.3862457275390625, -0.3742256164550781, -0.36220550537109375, -0.3501853942871094, -0.338165283203125, -0.3261451721191406, -0.31412506103515625, -0.3021049499511719, -0.2900848388671875, -0.2780647277832031, -0.26604461669921875, -0.2540245056152344, -0.24200439453125, -0.22998428344726562, -0.21796417236328125, -0.20594406127929688, -0.1939239501953125, -0.18190383911132812, -0.16988372802734375, -0.15786361694335938, -0.145843505859375, -0.13382339477539062, -0.12180328369140625, -0.10978317260742188, -0.0977630615234375, -0.08574295043945312, -0.07372283935546875, -0.061702728271484375, -0.0496826171875, -0.037662506103515625, -0.02564239501953125, -0.013622283935546875, -0.0016021728515625, 0.010417938232421875, 0.02243804931640625, 0.034458160400390625, 0.046478271484375, 0.058498382568359375, 0.07051849365234375, 0.08253860473632812, 0.0945587158203125, 0.10657882690429688, 0.11859893798828125, 0.13061904907226562, 0.14263916015625, 0.15465927124023438, 0.16667938232421875, 0.17869949340820312, 0.1907196044921875, 0.20273971557617188, 0.21475982666015625, 0.22677993774414062, 0.238800048828125, 0.2508201599121094, 0.26284027099609375, 0.2748603820800781, 0.2868804931640625, 0.2989006042480469, 0.31092071533203125, 0.3229408264160156, 0.3349609375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 5.0, 5.0, 2.0, 9.0, 11.0, 19.0, 17.0, 25.0, 49.0, 43.0, 48.0, 78.0, 129.0, 163.0, 189.0, 273.0, 369.0, 402.0, 450.0, 400.0, 321.0, 269.0, 184.0, 149.0, 108.0, 73.0, 81.0, 45.0, 36.0, 32.0, 22.0, 17.0, 16.0, 6.0, 10.0, 2.0, 2.0, 7.0, 2.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1507568359375, -0.1457843780517578, -0.14081192016601562, -0.13583946228027344, -0.13086700439453125, -0.12589454650878906, -0.12092208862304688, -0.11594963073730469, -0.1109771728515625, -0.10600471496582031, -0.10103225708007812, -0.09605979919433594, -0.09108734130859375, -0.08611488342285156, -0.08114242553710938, -0.07616996765136719, -0.071197509765625, -0.06622505187988281, -0.061252593994140625, -0.05628013610839844, -0.05130767822265625, -0.04633522033691406, -0.041362762451171875, -0.03639030456542969, -0.0314178466796875, -0.026445388793945312, -0.021472930908203125, -0.016500473022460938, -0.01152801513671875, -0.0065555572509765625, -0.001583099365234375, 0.0033893585205078125, 0.00836181640625, 0.013334274291992188, 0.018306732177734375, 0.023279190063476562, 0.02825164794921875, 0.03322410583496094, 0.038196563720703125, 0.04316902160644531, 0.0481414794921875, 0.05311393737792969, 0.058086395263671875, 0.06305885314941406, 0.06803131103515625, 0.07300376892089844, 0.07797622680664062, 0.08294868469238281, 0.087921142578125, 0.09289360046386719, 0.09786605834960938, 0.10283851623535156, 0.10781097412109375, 0.11278343200683594, 0.11775588989257812, 0.12272834777832031, 0.1277008056640625, 0.1326732635498047, 0.13764572143554688, 0.14261817932128906, 0.14759063720703125, 0.15256309509277344, 0.15753555297851562, 0.1625080108642578, 0.16748046875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 11.0, 7.0, 7.0, 17.0, 37.0, 88.0, 161.0, 213.0, 223.0, 115.0, 69.0, 23.0, 10.0, 6.0, 7.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.9089221954345703, -3.8128654956817627, -3.716808557510376, -3.6207518577575684, -3.5246949195861816, -3.428638219833374, -3.3325815200805664, -3.2365245819091797, -3.140467882156372, -3.0444111824035645, -2.9483542442321777, -2.85229754447937, -2.7562408447265625, -2.660183906555176, -2.564127206802368, -2.4680705070495605, -2.372013568878174, -2.275956869125366, -2.1798999309539795, -2.083843231201172, -1.9877864122390747, -1.8917295932769775, -1.79567289352417, -1.6996160745620728, -1.6035592555999756, -1.5075024366378784, -1.4114456176757812, -1.3153889179229736, -1.2193320989608765, -1.1232752799987793, -1.0272185802459717, -0.9311617612838745, -0.8351047039031982, -0.7390478849411011, -0.6429911255836487, -0.5469343662261963, -0.4508775472640991, -0.35482075810432434, -0.25876396894454956, -0.16270720958709717, -0.066650390625, 0.02940639853477478, 0.12546318769454956, 0.22151997685432434, 0.3175767660140991, 0.4136335551738739, 0.5096903443336487, 0.6057471036911011, 0.7018039226531982, 0.7978607416152954, 0.8939175009727478, 0.9899742603302002, 1.0860310792922974, 1.1820878982543945, 1.2781445980072021, 1.3742014169692993, 1.4702582359313965, 1.5663150548934937, 1.6623718738555908, 1.7584285736083984, 1.8544853925704956, 1.9505422115325928, 2.0465989112854004, 2.142655849456787, 2.2387125492095947]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 4.0, 7.0, 3.0, 11.0, 8.0, 8.0, 13.0, 15.0, 13.0, 11.0, 24.0, 24.0, 36.0, 25.0, 25.0, 33.0, 34.0, 26.0, 45.0, 46.0, 46.0, 52.0, 43.0, 46.0, 43.0, 45.0, 26.0, 43.0, 26.0, 26.0, 21.0, 30.0, 17.0, 17.0, 13.0, 16.0, 10.0, 10.0, 10.0, 10.0, 10.0, 6.0, 10.0, 3.0, 3.0, 1.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.8835044503211975, -0.854857861995697, -0.8262112140655518, -0.7975646257400513, -0.7689180374145508, -0.7402713894844055, -0.711624801158905, -0.6829781532287598, -0.6543315649032593, -0.6256849765777588, -0.5970383286476135, -0.568391740322113, -0.5397450923919678, -0.5110985040664673, -0.4824519157409668, -0.4538052976131439, -0.42515867948532104, -0.39651206135749817, -0.3678654432296753, -0.3392188549041748, -0.31057223677635193, -0.28192561864852905, -0.25327903032302856, -0.2246324121952057, -0.1959857940673828, -0.16733917593955994, -0.13869257271289825, -0.11004596203565598, -0.0813993513584137, -0.05275273323059082, -0.024106130003929138, 0.004540473222732544, 0.033187150955200195, 0.061833761632442474, 0.09048037230968475, 0.11912698298692703, 0.1477735936641693, 0.1764202117919922, 0.20506681501865387, 0.23371341824531555, 0.2623600363731384, 0.2910066545009613, 0.3196532726287842, 0.34829986095428467, 0.37694647908210754, 0.4055930972099304, 0.4342396855354309, 0.4628863036632538, 0.49153292179107666, 0.5201795101165771, 0.5488261580467224, 0.5774727463722229, 0.6061193943023682, 0.6347659826278687, 0.6634125709533691, 0.6920591592788696, 0.7207058072090149, 0.7493523955345154, 0.7779990434646606, 0.8066456317901611, 0.8352922201156616, 0.8639388680458069, 0.8925854563713074, 0.9212321043014526, 0.9498786926269531]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 4.0, 7.0, 6.0, 10.0, 16.0, 25.0, 43.0, 62.0, 75.0, 127.0, 195.0, 298.0, 429.0, 691.0, 1036.0, 1720.0, 3027.0, 5328.0, 10033.0, 20578.0, 45123.0, 112434.0, 395497.0, 288356.0, 88842.0, 37225.0, 17237.0, 8750.0, 4583.0, 2639.0, 1540.0, 903.0, 605.0, 346.0, 239.0, 164.0, 121.0, 76.0, 43.0, 38.0, 28.0, 26.0, 11.0, 9.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0731201171875, -0.07096195220947266, -0.06880378723144531, -0.06664562225341797, -0.06448745727539062, -0.06232929229736328, -0.06017112731933594, -0.058012962341308594, -0.05585479736328125, -0.053696632385253906, -0.05153846740722656, -0.04938030242919922, -0.047222137451171875, -0.04506397247314453, -0.04290580749511719, -0.040747642517089844, -0.0385894775390625, -0.036431312561035156, -0.03427314758300781, -0.03211498260498047, -0.029956817626953125, -0.02779865264892578, -0.025640487670898438, -0.023482322692871094, -0.02132415771484375, -0.019165992736816406, -0.017007827758789062, -0.014849662780761719, -0.012691497802734375, -0.010533332824707031, -0.008375167846679688, -0.006217002868652344, -0.004058837890625, -0.0019006729125976562, 0.0002574920654296875, 0.0024156570434570312, 0.004573822021484375, 0.006731986999511719, 0.008890151977539062, 0.011048316955566406, 0.01320648193359375, 0.015364646911621094, 0.017522811889648438, 0.01968097686767578, 0.021839141845703125, 0.02399730682373047, 0.026155471801757812, 0.028313636779785156, 0.0304718017578125, 0.032629966735839844, 0.03478813171386719, 0.03694629669189453, 0.039104461669921875, 0.04126262664794922, 0.04342079162597656, 0.045578956604003906, 0.04773712158203125, 0.049895286560058594, 0.05205345153808594, 0.05421161651611328, 0.056369781494140625, 0.05852794647216797, 0.06068611145019531, 0.06284427642822266, 0.06500244140625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 4.0, 4.0, 6.0, 9.0, 5.0, 11.0, 14.0, 8.0, 10.0, 21.0, 21.0, 20.0, 36.0, 41.0, 40.0, 39.0, 44.0, 42.0, 56.0, 45.0, 39.0, 47.0, 41.0, 45.0, 47.0, 31.0, 36.0, 34.0, 35.0, 24.0, 21.0, 26.0, 12.0, 16.0, 16.0, 11.0, 8.0, 8.0, 4.0, 5.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0726318359375, -0.07026100158691406, -0.06789016723632812, -0.06551933288574219, -0.06314849853515625, -0.06077766418457031, -0.058406829833984375, -0.05603599548339844, -0.0536651611328125, -0.05129432678222656, -0.048923492431640625, -0.04655265808105469, -0.04418182373046875, -0.04181098937988281, -0.039440155029296875, -0.03706932067871094, -0.034698486328125, -0.03232765197753906, -0.029956817626953125, -0.027585983276367188, -0.02521514892578125, -0.022844314575195312, -0.020473480224609375, -0.018102645874023438, -0.0157318115234375, -0.013360977172851562, -0.010990142822265625, -0.008619308471679688, -0.00624847412109375, -0.0038776397705078125, -0.001506805419921875, 0.0008640289306640625, 0.00323486328125, 0.0056056976318359375, 0.007976531982421875, 0.010347366333007812, 0.01271820068359375, 0.015089035034179688, 0.017459869384765625, 0.019830703735351562, 0.0222015380859375, 0.024572372436523438, 0.026943206787109375, 0.029314041137695312, 0.03168487548828125, 0.03405570983886719, 0.036426544189453125, 0.03879737854003906, 0.041168212890625, 0.04353904724121094, 0.045909881591796875, 0.04828071594238281, 0.05065155029296875, 0.05302238464355469, 0.055393218994140625, 0.05776405334472656, 0.0601348876953125, 0.06250572204589844, 0.06487655639648438, 0.06724739074707031, 0.06961822509765625, 0.07198905944824219, 0.07435989379882812, 0.07673072814941406, 0.0791015625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 6.0, 8.0, 13.0, 20.0, 38.0, 59.0, 133.0, 227.0, 400.0, 1135.0, 4488.0, 33634.0, 924628.0, 74031.0, 7163.0, 1577.0, 537.0, 221.0, 108.0, 53.0, 29.0, 15.0, 12.0, 9.0, 5.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.255859375, -0.24847412109375, -0.2410888671875, -0.23370361328125, -0.226318359375, -0.21893310546875, -0.2115478515625, -0.20416259765625, -0.19677734375, -0.18939208984375, -0.1820068359375, -0.17462158203125, -0.167236328125, -0.15985107421875, -0.1524658203125, -0.14508056640625, -0.1376953125, -0.13031005859375, -0.1229248046875, -0.11553955078125, -0.108154296875, -0.10076904296875, -0.0933837890625, -0.08599853515625, -0.07861328125, -0.07122802734375, -0.0638427734375, -0.05645751953125, -0.049072265625, -0.04168701171875, -0.0343017578125, -0.02691650390625, -0.01953125, -0.01214599609375, -0.0047607421875, 0.00262451171875, 0.010009765625, 0.01739501953125, 0.0247802734375, 0.03216552734375, 0.03955078125, 0.04693603515625, 0.0543212890625, 0.06170654296875, 0.069091796875, 0.07647705078125, 0.0838623046875, 0.09124755859375, 0.0986328125, 0.10601806640625, 0.1134033203125, 0.12078857421875, 0.128173828125, 0.13555908203125, 0.1429443359375, 0.15032958984375, 0.15771484375, 0.16510009765625, 0.1724853515625, 0.17987060546875, 0.187255859375, 0.19464111328125, 0.2020263671875, 0.20941162109375, 0.216796875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 2.0, 2.0, 3.0, 12.0, 7.0, 4.0, 8.0, 9.0, 10.0, 10.0, 14.0, 16.0, 22.0, 25.0, 29.0, 34.0, 41.0, 47.0, 72.0, 66.0, 78.0, 84.0, 69.0, 81.0, 50.0, 38.0, 23.0, 25.0, 24.0, 20.0, 16.0, 13.0, 12.0, 11.0, 5.0, 6.0, 3.0, 3.0, 3.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34814453125, -0.3368034362792969, -0.32546234130859375, -0.3141212463378906, -0.3027801513671875, -0.2914390563964844, -0.28009796142578125, -0.2687568664550781, -0.257415771484375, -0.24607467651367188, -0.23473358154296875, -0.22339248657226562, -0.2120513916015625, -0.20071029663085938, -0.18936920166015625, -0.17802810668945312, -0.16668701171875, -0.15534591674804688, -0.14400482177734375, -0.13266372680664062, -0.1213226318359375, -0.10998153686523438, -0.09864044189453125, -0.08729934692382812, -0.075958251953125, -0.06461715698242188, -0.05327606201171875, -0.041934967041015625, -0.0305938720703125, -0.019252777099609375, -0.00791168212890625, 0.003429412841796875, 0.0147705078125, 0.026111602783203125, 0.03745269775390625, 0.048793792724609375, 0.0601348876953125, 0.07147598266601562, 0.08281707763671875, 0.09415817260742188, 0.105499267578125, 0.11684036254882812, 0.12818145751953125, 0.13952255249023438, 0.1508636474609375, 0.16220474243164062, 0.17354583740234375, 0.18488693237304688, 0.19622802734375, 0.20756912231445312, 0.21891021728515625, 0.23025131225585938, 0.2415924072265625, 0.2529335021972656, 0.26427459716796875, 0.2756156921386719, 0.286956787109375, 0.2982978820800781, 0.30963897705078125, 0.3209800720214844, 0.3323211669921875, 0.3436622619628906, 0.35500335693359375, 0.3663444519042969, 0.377685546875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 6.0, 5.0, 2.0, 9.0, 11.0, 6.0, 20.0, 14.0, 18.0, 37.0, 42.0, 50.0, 76.0, 117.0, 166.0, 279.0, 464.0, 1062.0, 2347.0, 6899.0, 30214.0, 762292.0, 211221.0, 23247.0, 5779.0, 2014.0, 858.0, 469.0, 249.0, 163.0, 116.0, 74.0, 62.0, 36.0, 28.0, 25.0, 20.0, 15.0, 9.0, 7.0, 10.0, 3.0, 4.0, 1.0, 7.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04010009765625, -0.03871345520019531, -0.037326812744140625, -0.03594017028808594, -0.03455352783203125, -0.03316688537597656, -0.031780242919921875, -0.030393600463867188, -0.0290069580078125, -0.027620315551757812, -0.026233673095703125, -0.024847030639648438, -0.02346038818359375, -0.022073745727539062, -0.020687103271484375, -0.019300460815429688, -0.017913818359375, -0.016527175903320312, -0.015140533447265625, -0.013753890991210938, -0.01236724853515625, -0.010980606079101562, -0.009593963623046875, -0.008207321166992188, -0.0068206787109375, -0.0054340362548828125, -0.004047393798828125, -0.0026607513427734375, -0.00127410888671875, 0.0001125335693359375, 0.001499176025390625, 0.0028858184814453125, 0.0042724609375, 0.0056591033935546875, 0.007045745849609375, 0.008432388305664062, 0.00981903076171875, 0.011205673217773438, 0.012592315673828125, 0.013978958129882812, 0.0153656005859375, 0.016752243041992188, 0.018138885498046875, 0.019525527954101562, 0.02091217041015625, 0.022298812866210938, 0.023685455322265625, 0.025072097778320312, 0.026458740234375, 0.027845382690429688, 0.029232025146484375, 0.030618667602539062, 0.03200531005859375, 0.03339195251464844, 0.034778594970703125, 0.03616523742675781, 0.0375518798828125, 0.03893852233886719, 0.040325164794921875, 0.04171180725097656, 0.04309844970703125, 0.04448509216308594, 0.045871734619140625, 0.04725837707519531, 0.04864501953125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 6.0, 9.0, 9.0, 9.0, 11.0, 11.0, 19.0, 24.0, 20.0, 30.0, 33.0, 49.0, 54.0, 63.0, 87.0, 70.0, 72.0, 72.0, 63.0, 57.0, 32.0, 44.0, 32.0, 29.0, 16.0, 18.0, 8.0, 13.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 6.0, 2.0, 5.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4185905456542969e-05, -1.3763085007667542e-05, -1.3340264558792114e-05, -1.2917444109916687e-05, -1.249462366104126e-05, -1.2071803212165833e-05, -1.1648982763290405e-05, -1.1226162314414978e-05, -1.080334186553955e-05, -1.0380521416664124e-05, -9.957700967788696e-06, -9.534880518913269e-06, -9.112060070037842e-06, -8.689239621162415e-06, -8.266419172286987e-06, -7.84359872341156e-06, -7.420778274536133e-06, -6.9979578256607056e-06, -6.575137376785278e-06, -6.152316927909851e-06, -5.729496479034424e-06, -5.306676030158997e-06, -4.883855581283569e-06, -4.461035132408142e-06, -4.038214683532715e-06, -3.6153942346572876e-06, -3.1925737857818604e-06, -2.769753336906433e-06, -2.346932888031006e-06, -1.9241124391555786e-06, -1.5012919902801514e-06, -1.0784715414047241e-06, -6.556510925292969e-07, -2.3283064365386963e-07, 1.8998980522155762e-07, 6.128102540969849e-07, 1.0356307029724121e-06, 1.4584511518478394e-06, 1.8812716007232666e-06, 2.304092049598694e-06, 2.726912498474121e-06, 3.1497329473495483e-06, 3.5725533962249756e-06, 3.995373845100403e-06, 4.41819429397583e-06, 4.841014742851257e-06, 5.2638351917266846e-06, 5.686655640602112e-06, 6.109476089477539e-06, 6.532296538352966e-06, 6.9551169872283936e-06, 7.377937436103821e-06, 7.800757884979248e-06, 8.223578333854675e-06, 8.646398782730103e-06, 9.06921923160553e-06, 9.492039680480957e-06, 9.914860129356384e-06, 1.0337680578231812e-05, 1.0760501027107239e-05, 1.1183321475982666e-05, 1.1606141924858093e-05, 1.202896237373352e-05, 1.2451782822608948e-05, 1.2874603271484375e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 5.0, 7.0, 9.0, 13.0, 18.0, 29.0, 60.0, 132.0, 290.0, 878.0, 3826.0, 24295.0, 889860.0, 115957.0, 10274.0, 1957.0, 527.0, 202.0, 88.0, 41.0, 28.0, 22.0, 15.0, 5.0, 9.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0736083984375, -0.07149219512939453, -0.06937599182128906, -0.0672597885131836, -0.06514358520507812, -0.06302738189697266, -0.06091117858886719, -0.05879497528076172, -0.05667877197265625, -0.05456256866455078, -0.05244636535644531, -0.050330162048339844, -0.048213958740234375, -0.046097755432128906, -0.04398155212402344, -0.04186534881591797, -0.0397491455078125, -0.03763294219970703, -0.03551673889160156, -0.033400535583496094, -0.031284332275390625, -0.029168128967285156, -0.027051925659179688, -0.02493572235107422, -0.02281951904296875, -0.02070331573486328, -0.018587112426757812, -0.016470909118652344, -0.014354705810546875, -0.012238502502441406, -0.010122299194335938, -0.008006095886230469, -0.005889892578125, -0.0037736892700195312, -0.0016574859619140625, 0.00045871734619140625, 0.002574920654296875, 0.004691123962402344, 0.0068073272705078125, 0.008923530578613281, 0.01103973388671875, 0.013155937194824219, 0.015272140502929688, 0.017388343811035156, 0.019504547119140625, 0.021620750427246094, 0.023736953735351562, 0.02585315704345703, 0.0279693603515625, 0.03008556365966797, 0.03220176696777344, 0.034317970275878906, 0.036434173583984375, 0.038550376892089844, 0.04066658020019531, 0.04278278350830078, 0.04489898681640625, 0.04701519012451172, 0.04913139343261719, 0.051247596740722656, 0.053363800048828125, 0.055480003356933594, 0.05759620666503906, 0.05971240997314453, 0.06182861328125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 4.0, 4.0, 4.0, 9.0, 10.0, 9.0, 7.0, 9.0, 11.0, 9.0, 15.0, 15.0, 28.0, 54.0, 58.0, 84.0, 107.0, 110.0, 119.0, 80.0, 59.0, 47.0, 18.0, 19.0, 23.0, 24.0, 10.0, 8.0, 11.0, 9.0, 10.0, 9.0, 6.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.04913330078125, -0.047570228576660156, -0.04600715637207031, -0.04444408416748047, -0.042881011962890625, -0.04131793975830078, -0.03975486755371094, -0.038191795349121094, -0.03662872314453125, -0.035065650939941406, -0.03350257873535156, -0.03193950653076172, -0.030376434326171875, -0.02881336212158203, -0.027250289916992188, -0.025687217712402344, -0.0241241455078125, -0.022561073303222656, -0.020998001098632812, -0.01943492889404297, -0.017871856689453125, -0.01630878448486328, -0.014745712280273438, -0.013182640075683594, -0.01161956787109375, -0.010056495666503906, -0.008493423461914062, -0.006930351257324219, -0.005367279052734375, -0.0038042068481445312, -0.0022411346435546875, -0.0006780624389648438, 0.000885009765625, 0.0024480819702148438, 0.0040111541748046875, 0.005574226379394531, 0.007137298583984375, 0.008700370788574219, 0.010263442993164062, 0.011826515197753906, 0.01338958740234375, 0.014952659606933594, 0.016515731811523438, 0.01807880401611328, 0.019641876220703125, 0.02120494842529297, 0.022768020629882812, 0.024331092834472656, 0.0258941650390625, 0.027457237243652344, 0.029020309448242188, 0.03058338165283203, 0.032146453857421875, 0.03370952606201172, 0.03527259826660156, 0.036835670471191406, 0.03839874267578125, 0.039961814880371094, 0.04152488708496094, 0.04308795928955078, 0.044651031494140625, 0.04621410369873047, 0.04777717590332031, 0.049340248107910156, 0.0509033203125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 4.0, 8.0, 9.0, 18.0, 43.0, 80.0, 268.0, 363.0, 107.0, 38.0, 33.0, 14.0, 10.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0455381870269775, -1.9872790575027466, -1.9290199279785156, -1.8707609176635742, -1.8125017881393433, -1.7542426586151123, -1.695983648300171, -1.63772451877594, -1.579465389251709, -1.521206259727478, -1.462947130203247, -1.4046881198883057, -1.3464289903640747, -1.2881698608398438, -1.2299108505249023, -1.1716517210006714, -1.1133925914764404, -1.0551334619522095, -0.9968743920326233, -0.9386153221130371, -0.8803561925888062, -0.8220970630645752, -0.763837993144989, -0.7055789232254028, -0.6473197937011719, -0.5890606641769409, -0.5308015942573547, -0.47254249453544617, -0.4142833948135376, -0.35602429509162903, -0.29776519536972046, -0.2395060956478119, -0.18124699592590332, -0.12298789620399475, -0.06472879648208618, -0.006469696760177612, 0.05178940296173096, 0.11004850268363953, 0.1683076024055481, 0.22656670212745667, 0.28482580184936523, 0.3430849015712738, 0.4013440012931824, 0.45960310101509094, 0.5178622007369995, 0.5761213302612305, 0.6343804001808167, 0.6926394701004028, 0.7508985996246338, 0.8091577291488647, 0.8674167990684509, 0.9256758689880371, 0.9839349985122681, 1.042194128036499, 1.1004531383514404, 1.1587122678756714, 1.2169713973999023, 1.2752305269241333, 1.3334896564483643, 1.3917486667633057, 1.4500077962875366, 1.5082669258117676, 1.566525936126709, 1.62478506565094, 1.683044195175171]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 1.0, 3.0, 6.0, 8.0, 4.0, 10.0, 10.0, 11.0, 17.0, 25.0, 21.0, 20.0, 41.0, 45.0, 63.0, 73.0, 87.0, 88.0, 71.0, 78.0, 51.0, 46.0, 32.0, 24.0, 25.0, 26.0, 17.0, 10.0, 7.0, 16.0, 11.0, 9.0, 5.0, 11.0, 6.0, 3.0, 3.0, 1.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.0160033702850342, -0.9856521487236023, -0.9553009271621704, -0.9249496459960938, -0.8945984244346619, -0.86424720287323, -0.8338959813117981, -0.8035447597503662, -0.7731934785842896, -0.7428422570228577, -0.7124910354614258, -0.6821397542953491, -0.6517885327339172, -0.6214373111724854, -0.5910860896110535, -0.5607348680496216, -0.5303835868835449, -0.500032365322113, -0.46968111395835876, -0.4393298923969269, -0.4089786410331726, -0.3786274194717407, -0.34827619791030884, -0.31792494654655457, -0.28757375478744507, -0.2572225332260132, -0.2268712818622589, -0.19652006030082703, -0.16616880893707275, -0.13581758737564087, -0.10546635091304779, -0.07511511445045471, -0.04476386308670044, -0.01441262848675251, 0.01593860611319542, 0.0462898388504982, 0.07664107531309128, 0.10699230432510376, 0.13734354078769684, 0.16769477725028992, 0.198046013712883, 0.22839725017547607, 0.25874847173690796, 0.28909972310066223, 0.3194509446620941, 0.3498021960258484, 0.3801534175872803, 0.41050463914871216, 0.44085589051246643, 0.4712071120738983, 0.5015583634376526, 0.5319095849990845, 0.5622608065605164, 0.5926120281219482, 0.6229633092880249, 0.6533145308494568, 0.6836657524108887, 0.7140169739723206, 0.7443681955337524, 0.7747194766998291, 0.805070698261261, 0.8354219198226929, 0.8657731413841248, 0.8961243629455566, 0.9264756441116333]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 8.0, 7.0, 18.0, 15.0, 11.0, 25.0, 21.0, 12.0, 24.0, 26.0, 29.0, 33.0, 15.0, 43.0, 65.0, 124.0, 151.0, 70.0, 39.0, 30.0, 36.0, 23.0, 20.0, 24.0, 23.0, 23.0, 15.0, 10.0, 8.0, 8.0, 11.0, 8.0, 8.0, 5.0, 5.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0712890625, -0.06891536712646484, -0.06654167175292969, -0.06416797637939453, -0.061794281005859375, -0.05942058563232422, -0.05704689025878906, -0.054673194885253906, -0.05229949951171875, -0.049925804138183594, -0.04755210876464844, -0.04517841339111328, -0.042804718017578125, -0.04043102264404297, -0.03805732727050781, -0.035683631896972656, -0.0333099365234375, -0.030936241149902344, -0.028562545776367188, -0.02618885040283203, -0.023815155029296875, -0.02144145965576172, -0.019067764282226562, -0.016694068908691406, -0.01432037353515625, -0.011946678161621094, -0.009572982788085938, -0.007199287414550781, -0.004825592041015625, -0.0024518966674804688, -7.82012939453125e-05, 0.0022954940795898438, 0.004669189453125, 0.007042884826660156, 0.009416580200195312, 0.011790275573730469, 0.014163970947265625, 0.01653766632080078, 0.018911361694335938, 0.021285057067871094, 0.02365875244140625, 0.026032447814941406, 0.028406143188476562, 0.03077983856201172, 0.033153533935546875, 0.03552722930908203, 0.03790092468261719, 0.040274620056152344, 0.0426483154296875, 0.045022010803222656, 0.04739570617675781, 0.04976940155029297, 0.052143096923828125, 0.05451679229736328, 0.05689048767089844, 0.059264183044433594, 0.06163787841796875, 0.0640115737915039, 0.06638526916503906, 0.06875896453857422, 0.07113265991210938, 0.07350635528564453, 0.07588005065917969, 0.07825374603271484, 0.08062744140625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 2.0, 6.0, 3.0, 4.0, 1.0, 7.0, 1.0, 5.0, 5.0, 9.0, 20.0, 13.0, 25.0, 33.0, 45.0, 53.0, 103.0, 132.0, 247.0, 489.0, 1103.0, 2891.0, 9028.0, 154523.0, 8198933.0, 13901.0, 3907.0, 1548.0, 671.0, 303.0, 194.0, 97.0, 63.0, 56.0, 39.0, 22.0, 25.0, 23.0, 9.0, 7.0, 7.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 3.0, 5.0, 2.0, 2.0], "bins": [-0.4251953363418579, -0.4119632840156555, -0.3987312316894531, -0.3854992091655731, -0.3722671568393707, -0.35903510451316833, -0.34580308198928833, -0.33257102966308594, -0.31933897733688354, -0.30610692501068115, -0.29287487268447876, -0.27964285016059875, -0.26641079783439636, -0.25317874550819397, -0.23994670808315277, -0.22671467065811157, -0.21348261833190918, -0.2002505660057068, -0.1870185285806656, -0.1737864911556244, -0.160554438829422, -0.1473223865032196, -0.1340903490781784, -0.12085830420255661, -0.10762625932693481, -0.09439421445131302, -0.08116216957569122, -0.06793012470006943, -0.05469807982444763, -0.041466034948825836, -0.02823399007320404, -0.015001945197582245, -0.0017699003219604492, 0.011462144553661346, 0.024694189429283142, 0.03792623430490494, 0.05115827918052673, 0.06439032405614853, 0.07762236893177032, 0.09085441380739212, 0.10408645868301392, 0.11731850355863571, 0.1305505484342575, 0.1437825858592987, 0.1570146381855011, 0.1702466905117035, 0.1834787279367447, 0.1967107653617859, 0.20994281768798828, 0.22317487001419067, 0.23640690743923187, 0.24963894486427307, 0.26287099719047546, 0.27610304951667786, 0.28933507204055786, 0.30256712436676025, 0.31579917669296265, 0.32903122901916504, 0.34226328134536743, 0.35549530386924744, 0.36872735619544983, 0.3819594085216522, 0.3951914310455322, 0.4084234833717346, 0.421655535697937]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 6.0, 4.0, 7.0, 1.0, 3.0, 7.0, 4.0, 5.0, 6.0, 4.0, 1.0, 7.0, 2.0, 4.0, 4.0, 3.0, 4.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8421979546546936, -0.8183676600456238, -0.794537365436554, -0.7707071304321289, -0.7468768358230591, -0.7230465412139893, -0.6992162466049194, -0.6753859519958496, -0.6515556573867798, -0.62772536277771, -0.6038950681686401, -0.5800647735595703, -0.5562345385551453, -0.5324042439460754, -0.5085739493370056, -0.4847436547279358, -0.46091341972351074, -0.4370831251144409, -0.4132528603076935, -0.38942256569862366, -0.3655923008918762, -0.3417620062828064, -0.3179317116737366, -0.29410141706466675, -0.2702711522579193, -0.24644087255001068, -0.22261059284210205, -0.19878029823303223, -0.1749500185251236, -0.15111973881721497, -0.12728944420814514, -0.10345916450023651, -0.0796288251876831, -0.05579854175448418, -0.03196825832128525, -0.00813797116279602, 0.01569230854511261, 0.03952258825302124, 0.06335288286209106, 0.0871831625699997, 0.11101344227790833, 0.13484372198581696, 0.15867400169372559, 0.1825042963027954, 0.20633457601070404, 0.23016485571861267, 0.2539951503276825, 0.27782541513442993, 0.30165570974349976, 0.3254860043525696, 0.349316269159317, 0.37314656376838684, 0.3969768285751343, 0.4208071231842041, 0.4446374177932739, 0.46846771240234375, 0.4922979772090912, 0.5161282420158386, 0.5399585366249084, 0.5637888312339783, 0.5876191258430481, 0.6114493608474731, 0.635279655456543, 0.6591099500656128, 0.6829402446746826]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 11.0, 13.0, 17.0, 22.0, 40.0, 56.0, 71.0, 92.0, 96.0, 118.0, 97.0, 102.0, 85.0, 66.0, 38.0, 35.0, 16.0, 11.0, 8.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0726318359375, -0.06878089904785156, -0.06492996215820312, -0.06107902526855469, -0.05722808837890625, -0.05337715148925781, -0.049526214599609375, -0.04567527770996094, -0.0418243408203125, -0.03797340393066406, -0.034122467041015625, -0.030271530151367188, -0.02642059326171875, -0.022569656372070312, -0.018718719482421875, -0.014867782592773438, -0.011016845703125, -0.0071659088134765625, -0.003314971923828125, 0.0005359649658203125, 0.00438690185546875, 0.008237838745117188, 0.012088775634765625, 0.015939712524414062, 0.0197906494140625, 0.023641586303710938, 0.027492523193359375, 0.03134346008300781, 0.03519439697265625, 0.03904533386230469, 0.042896270751953125, 0.04674720764160156, 0.05059814453125, 0.05444908142089844, 0.058300018310546875, 0.06215095520019531, 0.06600189208984375, 0.06985282897949219, 0.07370376586914062, 0.07755470275878906, 0.0814056396484375, 0.08525657653808594, 0.08910751342773438, 0.09295845031738281, 0.09680938720703125, 0.10066032409667969, 0.10451126098632812, 0.10836219787597656, 0.112213134765625, 0.11606407165527344, 0.11991500854492188, 0.12376594543457031, 0.12761688232421875, 0.1314678192138672, 0.13531875610351562, 0.13916969299316406, 0.1430206298828125, 0.14687156677246094, 0.15072250366210938, 0.1545734405517578, 0.15842437744140625, 0.1622753143310547, 0.16612625122070312, 0.16997718811035156, 0.173828125]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 7.0, 2.0, 4.0, 16.0, 22.0, 32.0, 50.0, 72.0, 175.0, 334.0, 817.0, 2804.0, 12739.0, 75737.0, 306130.0, 103090.0, 16722.0, 3654.0, 1044.0, 381.0, 191.0, 93.0, 62.0, 35.0, 23.0, 5.0, 8.0, 4.0, 3.0, 1.0, 6.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.78271484375, -0.7553253173828125, -0.727935791015625, -0.7005462646484375, -0.67315673828125, -0.6457672119140625, -0.618377685546875, -0.5909881591796875, -0.5635986328125, -0.5362091064453125, -0.508819580078125, -0.4814300537109375, -0.45404052734375, -0.4266510009765625, -0.399261474609375, -0.3718719482421875, -0.344482421875, -0.3170928955078125, -0.289703369140625, -0.2623138427734375, -0.23492431640625, -0.2075347900390625, -0.180145263671875, -0.1527557373046875, -0.1253662109375, -0.0979766845703125, -0.070587158203125, -0.0431976318359375, -0.01580810546875, 0.0115814208984375, 0.038970947265625, 0.0663604736328125, 0.09375, 0.1211395263671875, 0.148529052734375, 0.1759185791015625, 0.20330810546875, 0.2306976318359375, 0.258087158203125, 0.2854766845703125, 0.3128662109375, 0.3402557373046875, 0.367645263671875, 0.3950347900390625, 0.42242431640625, 0.4498138427734375, 0.477203369140625, 0.5045928955078125, 0.531982421875, 0.5593719482421875, 0.586761474609375, 0.6141510009765625, 0.64154052734375, 0.6689300537109375, 0.696319580078125, 0.7237091064453125, 0.7510986328125, 0.7784881591796875, 0.805877685546875, 0.8332672119140625, 0.86065673828125, 0.8880462646484375, 0.915435791015625, 0.9428253173828125, 0.97021484375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 7.0, 4.0, 4.0, 7.0, 15.0, 8.0, 17.0, 16.0, 14.0, 32.0, 26.0, 39.0, 56.0, 61.0, 47.0, 52.0, 77.0, 61.0, 59.0, 76.0, 56.0, 47.0, 39.0, 35.0, 26.0, 27.0, 17.0, 18.0, 9.0, 13.0, 6.0, 9.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0771484375, -0.07456493377685547, -0.07198143005371094, -0.0693979263305664, -0.06681442260742188, -0.06423091888427734, -0.06164741516113281, -0.05906391143798828, -0.05648040771484375, -0.05389690399169922, -0.05131340026855469, -0.048729896545410156, -0.046146392822265625, -0.043562889099121094, -0.04097938537597656, -0.03839588165283203, -0.0358123779296875, -0.03322887420654297, -0.030645370483398438, -0.028061866760253906, -0.025478363037109375, -0.022894859313964844, -0.020311355590820312, -0.01772785186767578, -0.01514434814453125, -0.012560844421386719, -0.009977340698242188, -0.007393836975097656, -0.004810333251953125, -0.0022268295288085938, 0.0003566741943359375, 0.0029401779174804688, 0.005523681640625, 0.008107185363769531, 0.010690689086914062, 0.013274192810058594, 0.015857696533203125, 0.018441200256347656, 0.021024703979492188, 0.02360820770263672, 0.02619171142578125, 0.02877521514892578, 0.03135871887207031, 0.033942222595214844, 0.036525726318359375, 0.039109230041503906, 0.04169273376464844, 0.04427623748779297, 0.0468597412109375, 0.04944324493408203, 0.05202674865722656, 0.054610252380371094, 0.057193756103515625, 0.059777259826660156, 0.06236076354980469, 0.06494426727294922, 0.06752777099609375, 0.07011127471923828, 0.07269477844238281, 0.07527828216552734, 0.07786178588867188, 0.0804452896118164, 0.08302879333496094, 0.08561229705810547, 0.08819580078125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 5.0, 13.0, 18.0, 30.0, 88.0, 122.0, 93.0, 51.0, 22.0, 11.0, 11.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8101673722267151, -0.7868161201477051, -0.7634648680686951, -0.7401136159896851, -0.7167624235153198, -0.6934111714363098, -0.6700599193572998, -0.6467086672782898, -0.6233574151992798, -0.6000061631202698, -0.5766549110412598, -0.5533036589622498, -0.5299524068832397, -0.5066012144088745, -0.4832499623298645, -0.4598987102508545, -0.4365474581718445, -0.4131962060928345, -0.38984495401382446, -0.36649373173713684, -0.34314247965812683, -0.3197912275791168, -0.2964400053024292, -0.2730887532234192, -0.24973750114440918, -0.22638624906539917, -0.20303501188755035, -0.17968377470970154, -0.15633252263069153, -0.13298127055168152, -0.1096300333738327, -0.08627879619598389, -0.0629274845123291, -0.03957623988389969, -0.016224995255470276, 0.007126249372959137, 0.03047749400138855, 0.05382873862981796, 0.07717998325824738, 0.10053122043609619, 0.1238824725151062, 0.1472337245941162, 0.17058496177196503, 0.19393619894981384, 0.21728745102882385, 0.24063870310783386, 0.2639899253845215, 0.2873411774635315, 0.3106924295425415, 0.3340436816215515, 0.3573949337005615, 0.38074615597724915, 0.40409740805625916, 0.42744866013526917, 0.4507998824119568, 0.4741511344909668, 0.4975023865699768, 0.5208536386489868, 0.5442048907279968, 0.5675561428070068, 0.5909073352813721, 0.6142585873603821, 0.6376098394393921, 0.6609610915184021, 0.6843123435974121]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 0.0, 4.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 5.0, 5.0, 7.0, 6.0, 4.0, 8.0, 12.0, 18.0, 34.0, 55.0, 63.0, 63.0, 65.0, 52.0, 21.0, 14.0, 12.0, 6.0, 4.0, 1.0, 4.0, 3.0, 3.0, 1.0, 3.0, 0.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4378100037574768, -0.4249344766139984, -0.41205894947052, -0.39918339252471924, -0.38630786538124084, -0.37343233823776245, -0.36055681109428406, -0.34768128395080566, -0.3348057270050049, -0.3219301998615265, -0.3090546727180481, -0.2961791157722473, -0.2833035886287689, -0.2704280614852905, -0.25755253434181213, -0.24467700719833374, -0.23180148005485535, -0.21892595291137695, -0.20605041086673737, -0.19317488372325897, -0.18029934167861938, -0.167423814535141, -0.1545482873916626, -0.1416727602481842, -0.12879721820354462, -0.11592168360948563, -0.10304614901542664, -0.09017062187194824, -0.07729508727788925, -0.06441955268383026, -0.05154402554035187, -0.03866849094629288, -0.025792956352233887, -0.012917423620820045, -4.1890889406204224e-05, 0.012833639979362488, 0.02570917457342148, 0.03858470916748047, 0.05146023631095886, 0.06433577090501785, 0.07721130549907684, 0.09008684009313583, 0.10296237468719482, 0.11583790183067322, 0.1287134289741516, 0.1415889710187912, 0.1544644981622696, 0.16734004020690918, 0.18021556735038757, 0.19309109449386597, 0.20596663653850555, 0.21884216368198395, 0.23171770572662354, 0.24459323287010193, 0.2574687600135803, 0.2703442871570587, 0.2832198143005371, 0.2960953414440155, 0.3089708685874939, 0.3218464255332947, 0.33472195267677307, 0.34759747982025146, 0.36047300696372986, 0.37334853410720825, 0.38622409105300903]}, "eval/loss": 0.3051322400569916, "eval/wer": 0.08994446648155494, "eval/runtime": 575.2498, "eval/samples_per_second": 4.593, "eval/steps_per_second": 0.575, "train/train_runtime": 27349.9818, "train/train_samples_per_second": 5.217, "train/train_steps_per_second": 0.082, "train/total_flos": 0.0, "train/train_loss": 1.4829948718221064} \ No newline at end of file